-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathpropagate.go
327 lines (284 loc) · 10.3 KB
/
propagate.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
// Copyright (c) 2021 Uber Technologies, Inc.
//
// Licensed under the Uber Non-Commercial License (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at the root directory of this project.
//
// See the License for the specific language governing permissions and
// limitations under the License.
package propagate
// The tool implemented in the propagate package parses and loads Go source files as ASTs
// and uses these to construct a call graph.
//
// At a high level, the context propagation algorithm takes the following input:
// - a list of "leaf functions" (package path/name and function name) - these represent library API
// calls that currently do not take context as an argument but are meant to take it (as the first
// argument) after the refactoring
// - the name and type of context parameter (as strings)
// - the names of functions where the context propagation is supposed to stop (optional)
//
// Given this input, the algorithm visits all nodes in the call graph to locate calls to leaf functions.
// Once these are available, the algorithm follows the call chains originating from these functions,
// collecting both function definitions that need an additional context argument, and call sites
// for these additional functions that also have to be modified. The algorithm stops visiting call graph
// nodes either when it visits them all or when it encounters a function that is explicitly marked as one
// where the propagation should stop. When processing function calls, the algorithm also keeps track of
// additional language constructs that need to be modified in concert with function definition changes
// (e.g. named function types).
//
// Once the list of function definitions, the list of call sites, and the list of additional language
// constructs to be modified are collected, the algorithm visits ASTs one by one and modifies all
// required parts of the program.
import (
"bytes"
"encoding/json"
"flag"
"fmt"
"go/ast"
"go/format"
"go/token"
"go/types"
cg "golang.org/x/tools/go/callgraph"
"golang.org/x/tools/go/callgraph/cha"
"golang.org/x/tools/go/callgraph/rta"
"golang.org/x/tools/go/packages"
"golang.org/x/tools/go/pointer"
"golang.org/x/tools/go/ssa"
"golang.org/x/tools/go/ssa/ssautil"
"io/ioutil"
"log"
"os"
)
// Run is the main entry point for the whole context propagation process.
//
// It delegates the actual work to propagate and then, for every AST in the
// result, formats the tree back to source and writes it to the path of the
// corresponding compiled Go file with ".mod" appended. Any formatting or
// write failure terminates the process via log.Fatal.
func Run(configFilePath string, debugFilePath string, srcPaths []string, debugLevel int) {
	modified := propagate(configFilePath, debugFilePath, srcPaths, debugLevel)

	for pkg, files := range modified {
		for file, idx := range files {
			var out bytes.Buffer
			if err := format.Node(&out, pkg.Fset, file); err != nil {
				// dump the AST that could not be formatted before giving up
				ast.Print(pkg.Fset, file)
				log.Fatal(err)
			}

			// idx is the position of this file in the package's CompiledGoFiles list
			target := pkg.CompiledGoFiles[idx] + ".mod"
			if err := ioutil.WriteFile(target, out.Bytes(), 0644); err != nil {
				log.Fatal(err)
			}
		}
	}
}
// propagate is the main driver for the whole context propagation process.
//
// It initializes the tool configuration from configFilePath, loads the packages
// named by srcPaths (falling back to the configuration's LoadPaths when srcPaths
// is empty), builds SSA and a call graph for the packages that loaded without
// errors, runs the analyzer and the transformer, and finally emits debug
// information through outputDebugInfo. The value returned is the transformer's
// result; Run indexes each package's CompiledGoFiles with the int stored for
// every *ast.File.
//
// Loading errors and call graph construction failures terminate the process.
func propagate(configFilePath string, debugFilePath string, srcPaths []string, debugLevel int) map[*packages.Package]map[*ast.File]int {
	cfg := initialize(configFilePath, debugLevel)

	loadPaths := cfg.LoadPaths
	if len(srcPaths) > 0 {
		// if paths passed explicitly - use them
		loadPaths = srcPaths
	}
	loadConfig := &packages.Config{Mode: packages.LoadAllSyntax, Tests: true}

	// The paths are loaded in chunks; the number of chunks grows with the total
	// byte length of all paths relative to argBytesLimit.
	argsSize := 0
	for _, s := range loadPaths {
		argsSize += len(s)
	}
	iter := (argsSize / argBytesLimit) + 1
	numPaths := len(loadPaths)
	inc := numPaths / iter
	if inc < 1 {
		// fewer paths than chunks: a zero increment would keep the loading
		// loop below from ever advancing
		inc = 1
	}

	var initialLoaded []*packages.Package
	if numPaths > inc {
		cfg.largeCode = true
		if cfg.debugLevel > 0 {
			fmt.Println("INCREMENTAL LOADING")
		}
		cfg.fsets = make(map[*types.Package]*token.FileSet)
	} else if cfg.debugLevel > 0 {
		fmt.Println("ONE-TIME LOADING")
	}

	for i := 0; i < numPaths; i += inc {
		end := numPaths
		if i+inc < numPaths {
			end = i + inc
		}
		allLoadPaths := loadPaths[i:end]
		if cfg.LibIface != "" {
			// Limit the chunk's capacity so that append copies it instead of
			// overwriting loadPaths[end], i.e. the first path of the next chunk.
			allLoadPaths = append(loadPaths[i:end:end], cfg.LibPkgPath)
		}
		loaded, err := packages.Load(loadConfig, allLoadPaths...)
		if err != nil {
			log.Fatal(err)
		}
		if cfg.largeCode {
			// each Load call has its own file set - remember which one belongs to which package
			for _, l := range loaded {
				cfg.fsets[l.Types] = l.Fset
			}
		}
		initialLoaded = append(initialLoaded, loaded...)
	}

	// ignore packages that have not been loaded correctly, but warn the user about it
	for _, p := range initialLoaded {
		if len(p.Errors) > 0 {
			// ignore this package
			// if the debug level is high enough, print detailed info
			if cfg.debugLevel > 1 {
				fmt.Println("PACKAGE " + p.Name + " (AT " + p.PkgPath + ") BUILD ERRORS: ")
				for _, e := range p.Errors {
					fmt.Println(e)
				}
			}
			// if debug is enabled at all, collect names of packages that failed to load
			if cfg.debugLevel > 0 {
				cfg.debugData.Excluded = append(cfg.debugData.Excluded, "package "+p.Name+" at "+p.PkgPath)
			}
			continue
		}
		cfg.initial = append(cfg.initial, p)
	}

	prog, pkgs := ssautil.AllPackages(cfg.initial, ssa.GlobalDebug)
	// we could use prog.Build() instead but this would create a call graph including all dependencies
	for _, p := range pkgs {
		if p != nil {
			p.Build()
		}
	}

	var graph *cg.Graph
	switch cfgType {
	case cfgRTA:
		if cfg.debugLevel > 0 {
			fmt.Println("GOPATH:", os.Getenv("GOPATH"))
		}
		// use RTA to construct the callgraph; CHA-style construction overapproximates calls made
		// via functions passed as parameters to a larger extent than RTA (creates edges for all
		// functions whose signature matches the function parameter rather than for some in case of RTA)
		var cgRoots []*ssa.Function
		for f := range ssautil.AllFunctions(prog) {
			cgRoots = append(cgRoots, f)
		}
		res := rta.Analyze(cgRoots, true)
		if res == nil {
			log.Fatalf("error building RTA callgraph")
		}
		graph = res.CallGraph
	case cfgCHA:
		// callgraph constructed using CHA algorithm
		graph = cha.CallGraph(prog)
	default:
		// callgraph constructed using points-to analysis
		// TODO: can't make it to include all required files...
		var ptrConfig pointer.Config
		mainPkgs := ssautil.MainPackages(pkgs)
		// add synthetic main packages to include tests
		mainPkgsMap := make(map[*ssa.Package]bool)
		for _, p := range mainPkgs {
			mainPkgsMap[p] = true
		}
		for _, p := range pkgs {
			// pkgs entries are nil-checked before Build above; apply the same guard here
			if p != nil && !mainPkgsMap[p] {
				prog.CreateTestMainPackage(p)
			}
		}
		mainPkgs = ssautil.MainPackages(prog.AllPackages())
		ptrConfig.Mains = mainPkgs
		ptrConfig.BuildCallGraph = true
		ptrConfig.Reflection = true
		res, err := pointer.Analyze(&ptrConfig)
		if err != nil {
			log.Fatalf("error creating call graph using points-to analysis: %v", err)
		}
		graph = res.CallGraph
	}
	graph.DeleteSyntheticNodes()

	transformer := transformerConfig{
		config:           cfg,
		astIfaceModified: make(map[*ast.InterfaceType]bool),
	}
	analyzer := analyzerConfig{
		config:           cfg,
		prog:             prog,
		graph:            graph,
		mapAndSliceFuncs: make(map[*ssa.Package]map[*types.Signature]bool),
	}

	// the analyzer and the transformer share cfg; analysis runs before the transformation
	(&analyzer).analyze()
	res := (&transformer).transform()
	outputDebugInfo(debugFilePath, cfg)
	return res
}
// initialize performs tool initialization.
//
// It reads the JSON file at configFilePath, unmarshals it into a jsonConfig and
// wraps the result in a config carrying debugLevel and freshly allocated
// bookkeeping maps. It also derives the fully qualified context parameter
// type(s) and the common call replacement from the loaded settings.
//
// An empty configFilePath prints usage information and exits with status 1.
// An unreadable or malformed config file, a missing CtxParamInvalid, or a
// partially specified set of custom context options terminate the process via
// log.Fatalf.
func initialize(configFilePath string, debugLevel int) *config {
	if configFilePath == "" {
		fmt.Fprintln(os.Stderr, "USAGE:")
		flag.PrintDefaults()
		os.Exit(1)
	}

	buf, err := ioutil.ReadFile(configFilePath)
	if err != nil {
		// pass the path and the cause as arguments so that a '%' in either is not
		// interpreted as a formatting verb
		log.Fatalf("error reading config file %s: %v", configFilePath, err)
	}

	jsonCfg := jsonConfig{
		ExtEmbedTypes:    make(typeInfo),
		LibFns:           make(fnReplacementInfo),
		PropagationStops: make(fnInfo),
	}
	if err := json.Unmarshal(buf, &jsonCfg); err != nil {
		log.Fatalf("error unmarshalling file %s:\n%v", configFilePath, err)
	}

	cfg := config{
		jsonConfig:          &jsonCfg,
		debugLevel:          debugLevel,
		largeCode:           false,
		fnVisited:           make(map[uniquePosInfo]int),
		callSites:           make(map[uniquePosInfo]*replacementInfo),
		callSitesRenamed:    make(map[uniquePosInfo]string),
		ifaceModified:       make(map[*types.Interface]map[string]bool),
		fnParamsVisited:     make(map[uniquePosInfo]bool),
		renameParamsVisited: make(map[uniquePosInfo]bool),
	}

	if cfg.CtxParamInvalid == "" {
		log.Fatalf("artificial context expression (CtxParamInvalid) must be specified in the config file")
	}

	// the four custom context options must be specified together or not at all
	customLens := []int{
		len(cfg.CtxCustomPkgPath),
		len(cfg.CtxCustomPkgName),
		len(cfg.CtxCustomParamType),
		len(cfg.CtxCustomExprExtract),
	}
	customSet := 0
	for _, n := range customLens {
		if n > 0 {
			customSet++
		}
	}
	if customSet != 0 && customSet != len(customLens) {
		log.Fatalf("either all or none of the custom context options should be specified in the config file")
	}

	// context param type qualified with both path and name
	cfg.ctxParamTypeWithPkgPathName = getQualifiedType(cfg.CtxParamType, cfg.CtxPkgPath, cfg.CtxPkgName)
	if len(cfg.CtxCustomParamType) > 0 {
		cfg.ctxCustomParamTypeWithPkgPathName = getQualifiedType(cfg.CtxCustomParamType, cfg.CtxCustomPkgPath, cfg.CtxCustomPkgName)
	}
	cfg.commonCallReplacement = replacementInfo{"", 1, nil, "", cfg.CtxParamName}
	return &cfg
}
// outputDebugInfo outputs debug info either to standard output or to
// a file for further processing.
//
// Nothing is emitted when cfg.debugLevel is not positive. When debugFilePath is
// non-empty, cfg.debugData is marshalled to JSON and written to that file,
// replacing any previous content; failures to marshal, create, write or close
// the file terminate the process via log.Fatalf. Otherwise the excluded
// packages and the transformation warnings collected in cfg.debugData are
// printed to standard output.
func outputDebugInfo(debugFilePath string, cfg *config) {
	if cfg.debugLevel <= 0 {
		return
	}

	if debugFilePath != "" {
		// marshal first so that a marshalling failure does not leave a truncated file behind
		debugData, err := json.Marshal(cfg.debugData)
		if err != nil {
			log.Fatalf("error writing debug file %s: %v", debugFilePath, err)
		}
		debugFile, err := os.OpenFile(debugFilePath, os.O_RDWR|os.O_CREATE|os.O_TRUNC, 0755)
		if err != nil {
			log.Fatalf("error creating debug file %s: %v", debugFilePath, err)
		}
		// add generated debug data to a file
		if _, err := debugFile.Write(debugData); err != nil {
			log.Fatalf("error writing debug file %s: %v", debugFilePath, err)
		}
		// a failed Close can mean the data never reached the disk, so report it
		if err := debugFile.Close(); err != nil {
			log.Fatalf("error writing debug file %s: %v", debugFilePath, err)
		}
		return
	}

	// print generated debug data unless already printed at higher debug level
	if cfg.debugLevel < 2 && len(cfg.debugData.Excluded) > 0 {
		fmt.Println("PACKAGES EXCLUDED DUE TO BUILD ERRORS:")
		for _, pe := range cfg.debugData.Excluded {
			fmt.Println(pe)
		}
	}
	if len(cfg.debugData.Warnings) > 0 {
		fmt.Println("CODE TRANSFORMATION WARNINGS:")
		for _, c := range cfg.debugData.Warnings {
			fmt.Println(c["msg"])
			fmt.Println(c["file"] + " (line " + c["line"] + ")")
		}
	}
}