-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathchocimport.py
385 lines (345 loc) · 14.6 KB
/
chocimport.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
"""
Analyze a JavaScript module for Chocolate Factory usage and update an import
Looks for this line:
const {FORM, LABEL, INPUT} = choc; //autoimport
And calls like this:
set_content("main", FORM(LABEL([B("Name: "), INPUT({name: "name"})])))
And it will update the import to add the B.
This is very primitive static analysis and can recognize only a small set of
possible styles of usage, but the most common ones:
1) Direct usage, see above. Element name must be all-caps.
2) set_content("main", thing()); function thing() {return FORM(...);}
- top-level functions only (otherwise has to be defined before use)
3) function update() {stuff = LABEL(INPUT()); set_content("main", stuff)}
- can handle any assignment within scope including declarations
4) export function make_content() {return B("hello")}
- Requires "--extcall make_content" to signal that make_content is used thus
- Parameter not needed if name in all caps:
export function COMPONENT(x) {return DIV(x.name);}
5) const arr = []; arr.push(LI()); set_content(thing, arr)
6) const arr = stuff.map(thing => LI(thing.name)); set_content(thing, arr)
7) DOM("#foo").appendChild(LI())
- equivalently before(), after(), append(), insertBefore(), replaceWith()
8) (x => ABBR(x.attr, x.text))(stuff)
9) replace_content in any context where set_content is valid
"""
import sys
import esprima # ImportError? pip install -r requirements.txt
DOM_ADDITION_METHODS = ("appendChild", "before", "after", "append", "prepend", "insertBefore", "replaceWith")
DEFAULT_NAMESPACES = {"SVG": "svg"}
NAMESPACE_XFRM = {"svg": lambda fn: fn.lower()}
class Ctx:
@classmethod
def reset(cls, fn="-"):
Ctx.autoimport_line = -1 # If we find "//autoimport" at the end of a line, any declaration surrounding that will be edited.
Ctx.autoimport_range = None
Ctx.got_imports, Ctx.want_imports, Ctx.import_namespaces = { }, { }, { }
Ctx.import_source = "choc" # Will be set to "lindt" if the file uses lindt/replace_content
Ctx.fn = fn
Ctx.source_lines = []
elements = { }
def element(f):
if f.__doc__:
for name in f.__doc__.split(): elements[name] = f
else:
elements[f.__name__] = f
return f
def descend(el, *, sc, **kw):
if not el: return
if isinstance(el, list):
for el in el: descend(el, sc=sc, **kw)
return
# Any given element need only be visited once in any particular context
# Note that a list might have had more appended to it since it was last
# visited, so this check applies to the elements, not the whole list.
if getattr(el, "choc_visited_" + sc, False): return
setattr(el, "choc_visited_" + sc, True)
f = elements.get(el.type)
if f: f(el, sc=sc, **kw)
else:
print("%s:%d: Unknown type: %s" % (Ctx.fn, el.loc.start.line, el.type))
elements[el.type] = lambda el, **kw: None
# Recursive AST descent handlers
# Each one receives the current element and a tuple of current scopes
# On finding any sort of function, descend into it to probe.
@element
def FunctionExpression(el, *, scopes, sc, **kw):
if sc != "return": sc = "" # If we're not *calling* the function, then just probe it, don't process its return value
descend(el.body, scopes=scopes + ({ },), sc=sc, **kw)
@element
def ArrowFunctionExpression(el, *, scopes, sc, **kw):
if sc == "return" and el.expression: # Braceless arrow functions implicitly return
descend(el.body, scopes=scopes + ({ },), sc="set_content", **kw)
else: FunctionExpression(el, scopes=scopes, sc=sc, **kw)
@element
def FunctionDeclaration(el, *, scopes, sc, **kw):
if sc != "return" and el.id: scopes[-1].setdefault(el.id.name, []).append(el)
FunctionExpression(el, scopes=scopes, sc=sc, **kw)
@element
def BodyDescender(el, **kw):
"""BlockStatement LabeledStatement WhileStatement DoWhileStatement CatchClause
ForStatement ForInStatement ForOfStatement"""
descend(el.body, **kw)
@element
def Ignore(el, **kw):
"""Literal RegExpLiteral Directive EmptyStatement DebuggerStatement ThrowStatement UpdateExpression
ImportExpression TemplateLiteral ContinueStatement BreakStatement ThisExpression ObjectPattern ArrayPattern"""
# I assume that template strings will be used only for strings, not for DOM elements.
@element
def MemberExpression(el, **kw):
descend(el.object, **kw)
@element
def Export(el, **kw):
"""ExportNamedDeclaration ExportDefaultDeclaration"""
descend(el.declaration, **kw)
@element
def ImportDeclaration(el, **kw):
# Optionally check that Choc Factory has indeed been imported, and skip the file if not?
descend(el.specifiers, **kw)
@element
def ImportSpec(el, *, scopes, **kw):
"""ImportSpecifier ImportDefaultSpecifier ImportNamespaceSpecifier"""
scopes[-1].setdefault(el.local.name, []) # Mark that it's a known variable but don't attach any code to it
@element
def Identifier(el, *, scopes, sc, **kw):
if sc in ("set_content", "return"):
while scopes:
*scopes, scope = scopes
if el.name in scope:
descend(scope[el.name], scopes=(*scopes, scope), sc=sc, **kw)
break
@element
def Call(el, *, scopes, sc, **kw):
"""CallExpression NewExpression"""
if el.callee.type == "Identifier":
funcname = el.callee.name
prev = kw.get("xmlns", "(none)")
xmlns = Ctx.import_namespaces.get(funcname, DEFAULT_NAMESPACES.get(funcname, kw.pop("xmlns", ""))) # Be sure that xmlns is always popped out
descend(el.arguments, scopes=scopes, sc=sc, xmlns=xmlns, **kw)
if funcname in ("set_content", "replace_content"):
# Alright! We're setting content. First arg is the target, second is the content.
# Note that we don't validate mismatches of choc/replace_content or lindt/set_content.
if len(el.arguments) < 2: return # Huh. Need two args. Whatever.
descend(el.arguments[1], scopes=scopes, sc="set_content", **kw)
if len(el.arguments) > 2:
print("%s:%d: Extra arguments to set_content - did you intend to pass an array?" %
(Ctx.fn, el.loc.start.line), file=sys.stderr)
print(Ctx.source_lines[el.loc.start.line - 1], file=sys.stderr)
if sc == "set_content":
for scope in reversed(scopes):
if funcname in scope:
# Descend into the function. It's possible we've already scanned it
# for actual set_content calls, but now we will scan it for return
# values as well. (If we've already scanned for return values, this
# will quickly return.)
descend(scope[funcname], scopes=scopes[:1], sc="return", **kw)
return
if funcname.isupper():
if xmlns:
fn = NAMESPACE_XFRM.get(xmlns)
Ctx.want_imports[funcname] = '"' + xmlns + ':' + (fn(funcname) if fn else funcname) + '"';
if funcname not in Ctx.import_namespaces: Ctx.import_namespaces[funcname] = xmlns
else: Ctx.want_imports[funcname] = funcname
return
descend(el.arguments, scopes=scopes, sc=sc, **kw) # Assume a function's arguments can be incorporated into its return value
if el.callee.type == "MemberExpression":
c = el.callee
descend(c.object, scopes=scopes, sc="return" if sc == "set_content" else sc, **kw) # "foo(...).spam()" starts out by calling "foo(...)"
if c.computed: descend(c.property, scopes=scopes, sc=sc, **kw) # "foo[x]()" starts out by evaluating x
elif c.property.name in DOM_ADDITION_METHODS:
descend(el.arguments, scopes=scopes, sc="set_content", **kw)
elif c.property.name == "map":
# stuff.map(e => ...) is effectively a call to that function.
if sc == "set_content": sc = "return"
descend(el.arguments[0], scopes=scopes, sc=sc, **kw)
elif c.property.name in ("push", "unshift"):
# Adding to an array is adding code to the definition of the array.
# For static analysis, we consider both of these to have multiple code
# blocks associated with them:
# let x = []; x.push(P("hi")); x.push(DIV("hi"))
# let y; if (cond) y = P("hi"); else y = DIV("hi")
if c.object.type == "Identifier":
name = c.object.name
for scope in reversed(scopes):
if name in scope:
scope[name].append(el.arguments)
return
elif el.callee.type == "ArrowFunctionExpression" or el.callee.type == "FunctionExpression":
# Function expression, immediately called. Might also be being named.
descend(el.callee, scopes=scopes, sc="return" if sc == "set_content" else sc, **kw)
# else: pass # For now, I'm ignoring any unrecognized x.y() or x()() or anything
@element
def ReturnStatement(el, *, sc, **kw):
if sc == "return": sc = "set_content"
descend(el.argument, sc=sc, **kw)
@element
def ExpressionStatement(el, **kw):
descend(el.expression, **kw)
@element
def If(el, **kw):
"""IfStatement ConditionalExpression"""
descend(el.consequent, **kw)
descend(el.alternate, **kw)
@element
def SwitchStatement(el, **kw):
descend(el.cases, **kw)
@element
def SwitchCase(el, **kw):
descend(el.consequent, **kw)
@element
def TryStatement(el, **kw):
descend(el.block, **kw)
descend(el.handler, **kw)
descend(el.finalizer, **kw)
@element
def ArrayExpression(el, **kw):
descend(el.elements, **kw)
@element
def ObjectExpression(el, **kw):
descend(el.properties, **kw)
@element
def Property(el, **kw):
descend(el.key, **kw)
descend(el.value, **kw)
@element
def Unary(el, **kw):
"""UnaryExpression AwaitExpression SpreadElement YieldExpression"""
descend(el.argument, **kw)
@element
def Binary(el, **kw):
"""BinaryExpression LogicalExpression"""
descend(el.left, **kw)
descend(el.right, **kw)
@element
def VariableDeclaration(el, *, scopes, **kw):
if el.loc and el.loc.start.line <= Ctx.autoimport_line and el.loc.end.line >= Ctx.autoimport_line:
Ctx.autoimport_range = el.range
for decl in el.declarations:
if decl.init:
if decl.init.type == "Identifier" and decl.init.name in ("choc", "lindt"):
# It's the import destructuring line.
if decl.id.type != "ObjectPattern": continue # Or maybe not destructuring. Whatever, you do you.
for prop in decl.id.properties:
if prop.value.type == "Identifier" and prop.value.name.isupper():
if prop.key.type == "Identifier":
source = prop.key.name
Ctx.import_namespaces[prop.value.name] = ""
elif prop.key.type == "Literal":
source = prop.key.raw
Ctx.import_namespaces[prop.value.name] = prop.key.value.rpartition(":")[0]
else: print("Unrecognized import destructuring type " + prop.key.type)
Ctx.got_imports[prop.value.name] = source
Ctx.import_source = decl.init.name
continue
# Descend into it, looking for functions; also save it in case it's used later.
descend(decl.init, scopes=scopes, **kw)
scopes[-1].setdefault(decl.id.name, []).append(decl.init)
@element
def AssignmentExpression(el, *, scopes, sc, **kw):
descend(el.left, scopes=scopes, sc=sc, **kw)
descend(el.right, scopes=scopes, sc=sc, **kw)
if el.left.type != "Identifier" or sc == "set_content": return
# Assigning to a simple name stashes the expression in the appropriate scope.
# NOTE: In some situations, an assignment "further down" than the corresponding set_content
# call may be missed. This is lexical analysis, not control-flow analysis.
# Note also that this treats augmented assignment the same as assignment, collecting all
# relevant expressions together.
# Note that destructuring assignment will parse the right-hand-side but not stash it.
# It MAY be better to replicate it across all the names.
name = el.left.name
for scope in reversed(scopes):
if name in scope:
scope[name].append(el.right)
return
# If we didn't find anything to assign to, it's probably landing at top-level. Warn?
scopes[0][name] = [el.right]
@element
def ClassDeclaration(el, **kw):
descend(el.id, **kw)
descend(el.body, **kw)
@element
def ClassBody(el, **kw):
descend(el.body, **kw)
@element
def MethodDefinition(el, **kw):
descend(el.key, **kw)
descend(el.value, **kw)
def process(fn, *, fix=False, extcall=()):
Ctx.reset(fn)
if fn != "-":
with open(fn) as f: data = f.read()
else: data = """
import choc, {set_content, on, DOM} from "https://rosuav.github.io/choc/factory.js";
const {FORM, LABEL, INPUT} = choc; //autoimport
const {DIV} = choc;
const f1 = () => {HP()}, f2 = () => PRE(), f3 = () => {return B("bold");};
let f4 = "test";
function update() {
let el = FORM(LABEL(["Speak thy mind:", INPUT({name: "thought"})]))
set_content("main", [el, f1(), f2(), f3(), f4(), f5()])
}
f4 = () => DIV(); //Won't be found (violates DBU)
function f5() {return SPAN();}
export function COMPONENT(x) {return FIGURE(x.name);}
function NONCOMPONENT(x) {return FIGCAPTION(x.name);} //Non-exported won't be detected unless called
"""
module = esprima.parseModule(data, {"loc": True, "range": True})
Ctx.source_lines = data.split("\n")
for i, line in enumerate(Ctx.source_lines):
if line.strip().endswith("autoimport"):
Ctx.autoimport_line = i + 1
break
# First pass: Collect top-level function declarations (the ones that get hoisted)
scope = { }
exporteds = []
for el in module.body:
# Anything exported, just look at the base thing
exported = el.type in ("ExportNamedDeclaration", "ExportDefaultDeclaration")
if exported:
el = el.declaration
if not el: continue # Possibly a reexport or something
# function func(x) {y}
if el.type == "FunctionDeclaration" and el.id:
scope[el.id.name] = [el]
# export function COMPONENT() { }
if exported and el.id.name.isupper(): exporteds.append(el)
# Second pass: Recursively look for all set_content calls.
descend(module.body, scopes=(scope,), sc="")
# Some exported functions can return DOM elements. It's possible that they've
# already been scanned, but that's okay, we'll deduplicate in descend().
for func in extcall or ():
if func in scope: descend(scope[func], scopes=(scope,), sc="return")
descend(exporteds, scopes=(scope,), sc="return");
have = sorted(Ctx.got_imports)
want = sorted(Ctx.want_imports)
if want != Ctx.got_imports:
print(fn)
lose = [x for x in have if x not in Ctx.want_imports]
gain = [x for x in want if x not in Ctx.got_imports]
if lose: print("LOSE:", lose)
if gain: print("GAIN:", gain)
wanted = []
for func in want:
prev = Ctx.got_imports.get(func, Ctx.want_imports[func]);
if prev == func: wanted.append(func)
else: wanted.append(prev + ": " + func)
wanted = ", ".join(wanted)
print("WANT:", wanted)
if Ctx.autoimport_range:
start, end = Ctx.autoimport_range
data = data[:start] + "const {" + wanted + "} = " + Ctx.import_source + ";" + data[end:]
# Write-back if the user wants it
if fn == "-": print(data)
if fix:
with open(fn, "w") as f:
f.write(data)
def main(args):
import argparse
p = argparse.ArgumentParser(description="Validate Chocolate Factory imports")
p.add_argument("file", nargs="+", help="File(s) to process")
p.add_argument("--fix", action="store_true", help="Fix any discrepancies automatically")
p.add_argument("--extcall", action="append", help="Identify an externally-called DOM generation function")
args = vars(p.parse_args(args))
files = args.pop("file")
for fn in files: process(fn, **args)
if __name__ == "__main__": main(sys.argv[1:])