wmc.py 24 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281
  1. #!/usr/bin/python
  2. import os
  3. import os.path
  4. import sys
  5. import lark
  6. GRAMMAR = r"""
  7. start: toplevel+
  8. ?toplevel: include
  9. | funcdef
  10. | arrdec ";"
  11. | vardec ";"
  12. | varinit ";"
  13. | arrinit ";"
  14. | asm ";"
  15. include: "#" "include" FILENAME
  16. FILENAME: "<" /.+/ ">"
  17. funcdef: NAME "(" params ")" block
  18. varinit: NAME
  19. arrinit: NAME "[" INTEGER "]"
  20. vardec: NAME "=" expr
  21. arrdec: NAME "[" expr "]" ("=" expr)?
  22. params:
  23. | NAME ("," NAME)*
  24. block: "{" op* "}"
  25. asm: "asm" "(" STRING+ ")"
  26. ?op: block
  27. | label
  28. | goto ";"
  29. | vardec ";"
  30. | arrdec ";"
  31. | varinit ";"
  32. | arrinit ";"
  33. | inc ";"
  34. | dec ";"
  35. | rinc ";"
  36. | rdec ";"
  37. | asm ";"
  38. | funcall ";"
  39. | if
  40. | while
  41. | for
  42. | return ";"
  43. label: NAME ":"
  44. goto: "goto" NAME
  45. if: "if" "(" expr ")" op ("else" op)?
  46. while: "while" "(" expr ")" op
  47. for: "for" "(" vardec ";" expr ";" (inc|dec|vardec|funcall) ")" op
  48. return: "return" expr
  49. inc: NAME "++"
  50. dec: NAME "--"
  51. rinc: "++" NAME
  52. rdec: "--" NAME
  53. funcall: NAME "(" args ")"
  54. args:
  55. | [expr ("," expr)*]
  56. ?expr: op1
  57. | op1 "?" op1 ":" expr -> ifexpr
  58. ?op1: op2
  59. | vardec
  60. | op1 "==" op1 -> equals
  61. | op1 "!=" op1 -> not_equals
  62. | op1 "+" op2 -> plus
  63. | op1 "-" op2 -> minus
  64. ?op2: op3
  65. | op2 "*" op2 -> times
  66. | op2 "/" op3 -> divide
  67. | op2 "%" op3 -> modulo
  68. | op2 "<" op3 -> less
  69. | op2 ">" op3 -> greater
  70. | op2 "<=" op3 -> less_or_equals
  71. | op2 ">=" op3 -> greater_or_equals
  72. ?op3: op4
  73. | op3 "**" op4 -> raise
  74. ?op4: op5
  75. | op4 "||" op4 -> or
  76. | op4 "&&" op4 -> and
  77. | "!" atom -> not
  78. | "*" atom -> deref
  79. ?op5: atom
  80. | op5 "[" op1 "]" -> index
  81. ?atom: "(" op1 ")"
  82. | NAME
  83. | INTEGER
  84. | FLOAT
  85. | CHAR
  86. | STRING
  87. | "-" atom -> negate
  88. | array
  89. | funcall
  90. | inc
  91. | dec
  92. | rinc
  93. | rdec
  94. array: "{" atom ("," atom)* "}"
  95. NAME: /[A-Za-z_][a-zA-Z0-9_]*/
  96. INTEGER: /[0-9]+/
  97. FLOAT: /[0-9]+\.[0-9]+/
  98. CHAR: /'(.|(\\.))'/
  99. _STRING_INNER: /(.|\n)*?/
  100. _STRING_ESC_INNER: _STRING_INNER /(?<!\\)(\\\\)*?/
  101. STRING: "\"" _STRING_ESC_INNER "\""
  102. IG: /[ \t\r\n]+/
  103. COM: /\/\*(.|\!)*\*\//
  104. %ignore IG
  105. %ignore COM
  106. """
  107. def parse_escape(s):
  108. return bytes(s, "utf-8").decode("unicode_escape")
  109. class Buffer:
  110. def __init__(self, *init):
  111. self.buffer = list(init)
  112. def emit(self, asm, *args):
  113. if type(asm) is list:
  114. self.buffer.extend(asm)
  115. elif type(asm) is Buffer:
  116. self.buffer.extend(asm.buffer)
  117. else:
  118. self.buffer.append(asm.format(*args))
  119. def generate(self):
  120. return "\n".join(self.buffer)
  121. def __add__(self, other):
  122. if type(other) is Buffer:
  123. return Buffer(
  124. *self.buffer + other.buffer
  125. )
  126. raise TypeError
  127. class Scope:
  128. def __init__(self):
  129. self.scopes = []
  130. self.ndx = 0
  131. self.names = set()
  132. def new(self):
  133. self.scopes.append((self.ndx, {}, {}))
  134. self.ndx += 1
  135. def leave(self):
  136. self.scopes.pop()
  137. def add_label(self, name):
  138. renamed = f"__{self.scopes[-1][0]}l_{name}"
  139. self.scopes[-1][2][name] = renamed
  140. return renamed
  141. def get_label(self, name):
  142. if name not in self.scopes[-1][2]:
  143. raise Exception(f"Undeclared label: '{name}`.")
  144. return self.scopes[-1][2][name]
  145. def is_local(self, name):
  146. return name in self.scopes[-1][1]
  147. def insert(self, name):
  148. renamed = f"__{self.scopes[-1][0]}_{name}"
  149. self.scopes[-1][1][name] = renamed
  150. self.names.add(renamed)
  151. return renamed
  152. def find(self, name):
  153. for _, scope, _ in self.scopes[::-1]:
  154. if name in scope:
  155. return scope[name]
  156. raise Exception(f"Undeclared identifier: '{name}`.")
  157. def __contains__(self, name):
  158. for _, scope, _ in self.scopes[::-1]:
  159. if name in scope:
  160. return True
  161. return False
  162. def __getitem__(self, name):
  163. if name in self:
  164. return self.find(name)
  165. return self.insert(name)
  166. def __iter__(self):
  167. for _, scope, _ in self.scopes[::-1]:
  168. for name in scope:
  169. yield (name, scope[name])
  170. @property
  171. def is_toplevel(self):
  172. return self.scopes[-1][0] == 0
  173. class Func:
  174. def __init__(self, argc, params):
  175. self.argc = argc
  176. self.params = params
  177. class WMC:
  178. def __init__(self):
  179. self.funcs = {}
  180. self.used_symbols = {}
  181. self.where = "toplevel"
  182. self.scope = Scope()
  183. self.scope.new()
  184. self.compiled_funcs = {}
  185. self.arrays_buffer = Buffer()
  186. self.init_buffer = Buffer()
  187. self.buffer = Buffer(
  188. "jw __main",
  189. "pop Y",
  190. "mov 80 _dirBuf",
  191. "mov Y _dirBuf+1",
  192. "dir _dirBuf",
  193. "hlt",
  194. "_dirBuf:0*4",
  195. )
  196. self.label_ndx = 0
  197. self.included_files = set()
  198. self.parser = lark.Lark(GRAMMAR)
  199. def record_usage(self, name):
  200. if name in self.used_symbols:
  201. self.used_symbols[name].add(self.where)
  202. else:
  203. self.used_symbols[name] = set([self.where])
  204. def is_used(self, name):
  205. if name in ("main", "toplevel"):
  206. return True
  207. if name not in self.used_symbols:
  208. return False
  209. for other in self.used_symbols[name]:
  210. if other == name:
  211. continue
  212. if self.is_used(other):
  213. return True
  214. return False
  215. def make_label(self):
  216. name = f"__{self.label_ndx}l"
  217. self.label_ndx += 1
  218. return name
  219. def make_array(self, value):
  220. name = self.make_label()
  221. self.arrays_buffer.emit(
  222. "{}:{}",
  223. name, value
  224. )
  225. return name
  226. def compile_literal(self, node):
  227. if type(node) is lark.Token:
  228. if node.type == "NAME":
  229. value = self.scope.find(node.value)
  230. self.record_usage(value)
  231. return value
  232. elif node.type in ("INTEGER", "FLOAT"):
  233. return node.value
  234. elif node.type == "CHAR":
  235. return str(ord(parse_escape(node.value[1:-1])))
  236. elif node.type == "STRING":
  237. value = parse_escape(node.value[1:-1])
  238. value = map(ord, value)
  239. value = map(str, value)
  240. value = " ".join(value)
  241. value += " 0"
  242. return value
  243. elif node.data == "array":
  244. value = []
  245. for child in node.children:
  246. value.append(
  247. self.compile_literal(child)
  248. )
  249. return " ".join(value)
  250. raise Exception(f"Not implemented: {node}")
  251. def compile_unary_expr(self, node, *ops):
  252. buffer = Buffer()
  253. buffer.emit(
  254. self.compile_expr(
  255. node.children[0]
  256. )
  257. )
  258. for op in ops:
  259. buffer.emit(op)
  260. return buffer
  261. def compile_binary_expr(self, node):
  262. buffer = Buffer()
  263. buffer.emit(
  264. self.compile_expr(
  265. node.children[0]
  266. )
  267. )
  268. buffer.emit('push Y')
  269. buffer.emit(
  270. self.compile_expr(
  271. node.children[1]
  272. )
  273. )
  274. buffer.emit('push Y')
  275. buffer.emit('pop X')
  276. buffer.emit('pop Y')
  277. return buffer
  278. def compile_compare_expr(self, node, *ops, true='1', false='0'):
  279. buffer = Buffer()
  280. ret_label = self.make_label()
  281. exit_label = self.make_label()
  282. buffer.emit(
  283. self.compile_binary_expr(
  284. node
  285. )
  286. )
  287. for op in ops:
  288. buffer.emit(
  289. op,
  290. ret_label
  291. )
  292. buffer.emit(
  293. "mov {} Y",
  294. false
  295. )
  296. buffer.emit(
  297. "jmp {}",
  298. exit_label
  299. )
  300. buffer.emit(
  301. "{}:",
  302. ret_label
  303. )
  304. buffer.emit(
  305. "mov {} Y",
  306. true
  307. )
  308. buffer.emit(
  309. "{}:",
  310. exit_label
  311. )
  312. return buffer
  313. def compile_expr(self, node):
  314. buffer = Buffer()
  315. if type(node) is lark.Token:
  316. if node.type == "NAME":
  317. buffer.emit(
  318. "mov {} Y",
  319. self.compile_literal(node)
  320. )
  321. elif node.type in ("INTEGER", "FLOAT"):
  322. buffer.emit(
  323. "mov {} Y",
  324. self.compile_literal(node)
  325. )
  326. elif node.type == "CHAR":
  327. buffer.emit(
  328. "mov {} Y",
  329. self.compile_literal(node)
  330. )
  331. elif node.type == "STRING":
  332. buffer.emit(
  333. "ld {} Y",
  334. self.make_array(
  335. self.compile_literal(node)
  336. )
  337. )
  338. else:
  339. raise Exception(f"Not implemented: {node}")
  340. elif node.data == "ifexpr":
  341. else_label = self.make_label()
  342. exit_label = self.make_label()
  343. buffer.emit(
  344. self.compile_expr(
  345. node.children[0]
  346. )
  347. )
  348. buffer.emit(
  349. "nbnz Y {}",
  350. else_label
  351. )
  352. buffer.emit(
  353. self.compile_expr(
  354. node.children[1]
  355. )
  356. )
  357. buffer.emit(
  358. "jmp {}",
  359. exit_label
  360. )
  361. buffer.emit(
  362. "{}:",
  363. else_label
  364. )
  365. buffer.emit(
  366. self.compile_expr(
  367. node.children[2]
  368. )
  369. )
  370. buffer.emit(
  371. "{}:",
  372. exit_label
  373. )
  374. elif node.data == "equals":
  375. buffer.emit(
  376. self.compile_compare_expr(
  377. node,
  378. "sblez X Y !",
  379. "nbnz Y {}",
  380. true='1',
  381. false='0'
  382. )
  383. )
  384. elif node.data == "not_equals":
  385. buffer.emit(
  386. self.compile_compare_expr(
  387. node,
  388. "sblez X Y !",
  389. "nbnz Y {}",
  390. true='0',
  391. false='1'
  392. )
  393. )
  394. elif node.data == "plus":
  395. buffer.emit(
  396. self.compile_binary_expr(
  397. node
  398. )
  399. )
  400. buffer.emit(
  401. "ablez X Y !"
  402. )
  403. elif node.data == "minus":
  404. buffer.emit(
  405. self.compile_binary_expr(
  406. node
  407. )
  408. )
  409. buffer.emit(
  410. "sblez X Y !"
  411. )
  412. elif node.data == "times":
  413. buffer.emit(
  414. self.compile_binary_expr(
  415. node
  416. )
  417. )
  418. buffer.emit(
  419. "mbnz X Y !"
  420. )
  421. elif node.data == "divide":
  422. buffer.emit(
  423. self.compile_binary_expr(
  424. node
  425. )
  426. )
  427. buffer.emit(
  428. "vblz X Y !"
  429. )
  430. elif node.data == "modulo":
  431. buffer.emit(
  432. self.compile_binary_expr(
  433. node
  434. )
  435. )
  436. buffer.emit(
  437. "modbz X Y !"
  438. )
  439. elif node.data == "raise":
  440. buffer.emit(
  441. self.compile_binary_expr(
  442. node
  443. )
  444. )
  445. buffer.emit(
  446. "mov 12 _dirBuf"
  447. )
  448. buffer.emit(
  449. "mov X _dirBuf+1"
  450. )
  451. buffer.emit(
  452. "mov Y _dirBuf+2"
  453. )
  454. buffer.emit(
  455. "dir _dirBuf"
  456. )
  457. buffer.emit(
  458. "mov _dirBuf+2 Y"
  459. )
  460. elif node.data == "or":
  461. true_label = self.make_label()
  462. exit_label = self.make_label()
  463. buffer.emit(
  464. self.compile_expr(
  465. node.children[0]
  466. )
  467. )
  468. buffer.emit(
  469. "nbnz Y !"
  470. )
  471. buffer.emit(
  472. "nbnz Y {}",
  473. true_label
  474. )
  475. buffer.emit(
  476. self.compile_expr(
  477. node.children[1]
  478. )
  479. )
  480. buffer.emit(
  481. "jmp {}",
  482. exit_label
  483. )
  484. buffer.emit(
  485. "{}:",
  486. true_label
  487. )
  488. buffer.emit(
  489. "mov 1 Y"
  490. )
  491. buffer.emit(
  492. "{}:",
  493. exit_label
  494. )
  495. elif node.data == "and":
  496. false_label = self.make_label()
  497. exit_label = self.make_label()
  498. buffer.emit(
  499. self.compile_expr(
  500. node.children[0]
  501. )
  502. )
  503. buffer.emit(
  504. "nbnz Y {}",
  505. false_label
  506. )
  507. buffer.emit(
  508. self.compile_expr(
  509. node.children[1]
  510. )
  511. )
  512. buffer.emit(
  513. "jmp {}",
  514. exit_label
  515. )
  516. buffer.emit(
  517. "{}:",
  518. false_label
  519. )
  520. buffer.emit(
  521. "mov 0 Y"
  522. )
  523. buffer.emit(
  524. "{}:",
  525. exit_label
  526. )
  527. elif node.data == "less":
  528. buffer.emit(
  529. self.compile_compare_expr(
  530. node,
  531. "inc Y",
  532. "sblez X Y {}"
  533. )
  534. )
  535. elif node.data == "greater":
  536. buffer.emit(
  537. self.compile_compare_expr(
  538. node,
  539. "dec Y",
  540. "sblez X Y {}",
  541. true='0',
  542. false='1'
  543. )
  544. )
  545. elif node.data == "less_or_equals":
  546. buffer.emit(
  547. self.compile_compare_expr(
  548. node,
  549. "sblez X Y {}"
  550. )
  551. )
  552. elif node.data == "greater_or_equals":
  553. buffer.emit(
  554. self.compile_compare_expr(
  555. node,
  556. "inc Y",
  557. "sblez X Y {}",
  558. true='0',
  559. false='1'
  560. )
  561. )
  562. elif node.data == "not":
  563. buffer.emit(
  564. self.compile_unary_expr(
  565. node,
  566. "nbnz Y !"
  567. )
  568. )
  569. elif node.data == "deref":
  570. buffer.emit(
  571. self.compile_unary_expr(
  572. node,
  573. "la Y Y"
  574. )
  575. )
  576. elif node.data == "index":
  577. buffer.emit(
  578. self.compile_binary_expr(
  579. node
  580. )
  581. )
  582. buffer.emit(
  583. "ablez X Y !"
  584. )
  585. buffer.emit(
  586. "la Y Y"
  587. )
  588. elif node.data == "negate":
  589. buffer.emit(
  590. self.compile_unary_expr(
  591. node,
  592. "mov Y X",
  593. "sblez X Y !",
  594. "sblez X Y !",
  595. )
  596. )
  597. elif node.data == "array":
  598. buffer.emit(
  599. "ld {} Y",
  600. self.make_array(
  601. self.compile_literal(node)
  602. )
  603. )
  604. elif node.data == "inc":
  605. name = self.scope[node.children[0].value]
  606. self.record_usage(name)
  607. buffer.emit(
  608. "mov {} Y",
  609. name
  610. )
  611. buffer.emit(
  612. "inc {}",
  613. name
  614. )
  615. elif node.data == "dec":
  616. name = self.scope[node.children[0].value]
  617. self.record_usage(name)
  618. buffer.emit(
  619. "mov {} Y"
  620. )
  621. buffer.emit(
  622. "dec {}",
  623. name
  624. )
  625. elif node.data == "rinc":
  626. name = self.scope[node.children[0].value]
  627. self.record_usage(name)
  628. buffer.emit(
  629. "inc {}",
  630. name
  631. )
  632. buffer.emit(
  633. "mov {} Y",
  634. name
  635. )
  636. elif node.data == "rdec":
  637. name = self.scope[node.children[0].value]
  638. self.record_usage(name)
  639. buffer.emit(
  640. "dec {}",
  641. name
  642. )
  643. buffer.emit(
  644. "mov {} Y"
  645. )
  646. elif node.data == "funcall":
  647. buffer.emit(
  648. self.compile_funcall(node, dest='Y')
  649. )
  650. else:
  651. raise Exception(f"Not implemented: {node}")
  652. return buffer
  653. def compile_funcall(self, node, dest='Y'):
  654. buffer = Buffer()
  655. name = node.children[0].value
  656. if name not in self.funcs:
  657. raise Exception(f"Call to an undeclared function: '{name}`.")
  658. if self.funcs[name].argc != len(node.children[1].children):
  659. raise Exception(f"Function '{name}` expects {self.funcs[name].argc} arguments, but got {node.children[1].children}.")
  660. for arg in node.children[1].children[::-1]:
  661. buffer.emit(
  662. self.compile_expr(arg)
  663. )
  664. buffer.emit(
  665. "push Y"
  666. )
  667. buffer.emit(
  668. "jw __{}",
  669. name
  670. )
  671. buffer.emit(
  672. "pop {}",
  673. dest
  674. )
  675. self.record_usage(name)
  676. return buffer
  677. def compile_asm(self, node):
  678. buffer = Buffer()
  679. table = {}
  680. for name, renamed in self.scope:
  681. table[name] = renamed
  682. for child in node.children:
  683. value = parse_escape(child.value[1:-1])
  684. for name in table:
  685. if f"{{{name}}}" in value:
  686. self.record_usage(table[name])
  687. try:
  688. value = value.format(
  689. **table
  690. )
  691. except:
  692. raise Exception("Malformed asm directive.")
  693. buffer.emit(value)
  694. return buffer
  695. def compile_arrdec(self, node):
  696. buffer = Buffer()
  697. name = node.children[0].value
  698. if name in self.scope and len(node.children) == 3: # Index assignment.
  699. name = self.scope.find(name)
  700. self.record_usage(name)
  701. buffer.emit(
  702. self.compile_expr(
  703. node.children[1]
  704. )
  705. )
  706. buffer.emit(
  707. "mov {} X",
  708. name
  709. )
  710. buffer.emit(
  711. "ablez X Y !"
  712. )
  713. buffer.emit(
  714. "push Y"
  715. )
  716. buffer.emit(
  717. self.compile_expr(
  718. node.children[2]
  719. )
  720. )
  721. buffer.emit(
  722. "pop X"
  723. )
  724. buffer.emit(
  725. "str Y X"
  726. )
  727. return buffer
  728. if not self.scope.is_toplevel and self.scope.is_local(name):
  729. raise Exception(f"Duplicated declaration of a local variable: '{node.children[0].value}`.")
  730. name = self.scope[name]
  731. self.record_usage(name)
  732. count = int(node.children[1].value)
  733. if count <= 0:
  734. raise Exception(f"Illegal array declaration '{node.children[0].value}`: array size should be >0, but it is {count}.")
  735. if len(node.children) == 3:
  736. value = self.compile_literal(node.children[2])
  737. size = len(value.split(" ")) # Dirty.
  738. if size < count:
  739. value += f" 0*{count-size}"
  740. elif size != count:
  741. raise Exception(f"Illegal array declaration '{node.children[0].value}`: value size is {size}, but expected {count}.")
  742. buffer.emit(
  743. "ld {} Y",
  744. self.make_array(value)
  745. )
  746. else:
  747. buffer.emit(
  748. "ld {} Y",
  749. self.make_array(f"0*{count}")
  750. )
  751. buffer.emit(
  752. "mov Y {}",
  753. name
  754. )
  755. return buffer
  756. def compile_op(self, node):
  757. buffer = Buffer()
  758. if node.data == "block":
  759. buffer.emit(
  760. self.compile_block(
  761. node
  762. )
  763. )
  764. elif node.data == "label":
  765. buffer.emit(
  766. "{}:",
  767. self.scope.get_label(node.children[0].value)
  768. )
  769. elif node.data == "goto":
  770. buffer.emit(
  771. "jmp {}",
  772. self.scope.get_label(node.children[0].value)
  773. )
  774. elif node.data == "varinit":
  775. name = node.children[0].value
  776. if self.scope.is_local(name):
  777. raise Exception(f"Duplicated declaration of a local variable: '{name}`.")
  778. self.scope.insert(name)
  779. elif node.data == "vardec":
  780. name = self.scope[node.children[0].value]
  781. self.record_usage(name)
  782. buffer.emit(
  783. self.compile_expr(node.children[1])
  784. )
  785. buffer.emit(
  786. "mov Y {}",
  787. name
  788. )
  789. elif node.data in ("arrdec", "arrinit"):
  790. buffer.emit(
  791. self.compile_arrdec(node)
  792. )
  793. elif node.data in ("inc", "rinc"):
  794. name = self.scope[node.children[0].value]
  795. self.record_usage(name)
  796. buffer.emit(
  797. "inc {}",
  798. name
  799. )
  800. elif node.data == ("dec", "rdec"):
  801. name = self.scope[node.children[0].value]
  802. self.record_usage(name)
  803. buffer.emit(
  804. "dec {}",
  805. name
  806. )
  807. elif node.data == "funcall":
  808. buffer.emit(
  809. self.compile_funcall(node, dest='ZZ')
  810. )
  811. elif node.data == "return":
  812. buffer.emit(
  813. self.compile_expr(
  814. node.children[0]
  815. )
  816. )
  817. buffer.emit("push Y")
  818. buffer.emit("ret")
  819. elif node.data == "asm":
  820. buffer.emit(
  821. self.compile_asm(node)
  822. )
  823. elif node.data == "if":
  824. else_label = self.make_label()
  825. exit_label = self.make_label()
  826. buffer.emit(
  827. self.compile_expr(
  828. node.children[0]
  829. )
  830. )
  831. buffer.emit(
  832. "nbnz Y {}",
  833. else_label
  834. )
  835. buffer.emit(
  836. self.compile_op(
  837. node.children[1]
  838. )
  839. )
  840. buffer.emit(
  841. "jmp {}",
  842. exit_label
  843. )
  844. buffer.emit(
  845. "{}:",
  846. else_label
  847. )
  848. if len(node.children) == 3:
  849. buffer.emit(
  850. self.compile_op(
  851. node.children[2]
  852. )
  853. )
  854. buffer.emit(
  855. "{}:",
  856. exit_label
  857. )
  858. elif node.data == "while":
  859. loop_label = self.make_label()
  860. exit_label = self.make_label()
  861. buffer.emit(
  862. "{}:",
  863. loop_label
  864. )
  865. buffer.emit(
  866. self.compile_expr(
  867. node.children[0]
  868. )
  869. )
  870. buffer.emit(
  871. "nbnz Y {}",
  872. exit_label
  873. )
  874. buffer.emit(
  875. self.compile_op(
  876. node.children[1]
  877. )
  878. )
  879. buffer.emit(
  880. "jmp {}",
  881. loop_label
  882. )
  883. buffer.emit(
  884. "{}:",
  885. exit_label
  886. )
  887. elif node.data == "for":
  888. loop_label = self.make_label()
  889. exit_label = self.make_label()
  890. self.scope.new()
  891. buffer.emit(
  892. self.compile_op(
  893. node.children[0]
  894. )
  895. )
  896. buffer.emit(
  897. "{}:",
  898. loop_label
  899. )
  900. buffer.emit(
  901. self.compile_expr(
  902. node.children[1]
  903. )
  904. )
  905. buffer.emit(
  906. "nbnz Y {}",
  907. exit_label
  908. )
  909. buffer.emit(
  910. self.compile_op(
  911. node.children[3]
  912. )
  913. )
  914. buffer.emit(
  915. self.compile_op(
  916. node.children[2]
  917. )
  918. )
  919. self.scope.leave()
  920. buffer.emit(
  921. "jmp {}",
  922. loop_label
  923. )
  924. buffer.emit(
  925. "{}:",
  926. exit_label
  927. )
  928. else:
  929. raise Exception(f"Not implemented: {node}")
  930. return buffer
  931. def collect_labels(self, node):
  932. for child in node.children:
  933. if child.data == "label":
  934. self.scope.add_label(child.children[0].value)
  935. def compile_block(self, node, *prepend_names, scope=True):
  936. if scope:
  937. self.scope.new()
  938. for name in prepend_names:
  939. self.scope.insert(name)
  940. buffer = Buffer()
  941. self.collect_labels(node)
  942. for child in node.children:
  943. buffer.emit(
  944. self.compile_op(child)
  945. )
  946. if scope:
  947. self.scope.leave()
  948. return buffer
  949. def compile_toplevel(self, node):
  950. buffer = Buffer()
  951. if node.data == "funcdef":
  952. name = node.children[0].value
  953. params = self.funcs[name].params
  954. buffer.emit("__{}:", name)
  955. for param in params:
  956. buffer.emit(
  957. "pop __{}_{}",
  958. self.scope.ndx, param
  959. )
  960. self.where = name
  961. buffer.emit(
  962. self.compile_block(
  963. node.children[2],
  964. *params
  965. )
  966. )
  967. buffer.emit(
  968. "push Z"
  969. )
  970. buffer.emit(
  971. "ret"
  972. )
  973. elif node.data == "vardec":
  974. name = node.children[0].value
  975. self.init_buffer.emit(
  976. self.compile_expr(node.children[1])
  977. )
  978. self.init_buffer.emit(
  979. "mov Y __0_{}",
  980. name
  981. )
  982. self.record_usage(f"__0__{name}")
  983. elif node.data in ("arrdec", "arrinit"):
  984. self.init_buffer.emit(
  985. self.compile_arrdec(node)
  986. )
  987. elif node.data == "asm":
  988. buffer.emit(
  989. self.compile_asm(node)
  990. )
  991. elif node.data == "include":
  992. filename = node.children[0].value[1:-1]
  993. if not os.path.isfile(filename):
  994. filename = os.path.join(os.getenv("WC_I"), filename)
  995. if not os.path.isfile(filename):
  996. raise Exception(f"No such file: '{os.path.basename(filename)}`.")
  997. if filename not in self.included_files:
  998. with open(filename, "r") as f:
  999. self.compile_program(f.read())
  1000. self.included_files.add(filename)
  1001. elif node.data == "varinit":
  1002. pass
  1003. else:
  1004. raise Exception(f"Not implemented: {node}")
  1005. return buffer
  1006. def collect_toplevel(self, ast):
  1007. for node in ast.children:
  1008. if node.data == "funcdef":
  1009. name = node.children[0].value
  1010. if name in self.funcs:
  1011. raise Exception(f"Duplicated function declaration: '{name}`.")
  1012. self.funcs[name] = Func(
  1013. len(node.children[1].children),
  1014. tuple(map(lambda t: t.value, node.children[1].children))
  1015. )
  1016. elif node.data in ("varinit", "vardec", "arrinit", "arrdec"):
  1017. name = node.children[0].value
  1018. if name in self.scope:
  1019. raise Exception(f"Duplicated top-level variable declaration: '{name}`.")
  1020. self.scope.insert(name) # Because we're at the top-level rn.
  1021. def compile_program(self, text):
  1022. ast = self.parser.parse(text)
  1023. #print(ast.pretty())
  1024. self.collect_toplevel(ast)
  1025. for node in ast.children:
  1026. buffer = self.compile_toplevel(node)
  1027. if node.data == "funcdef":
  1028. self.compiled_funcs[node.children[0].value] = buffer
  1029. else:
  1030. self.buffer.emit(buffer)
  1031. def compile(self, text):
  1032. self.compile_program(text)
  1033. for name in self.compiled_funcs:
  1034. if self.is_used(name):
  1035. self.buffer.emit(self.compiled_funcs[name])
  1036. for param in self.funcs[name].params:
  1037. self.record_usage(param)
  1038. self.buffer = self.init_buffer + self.buffer + self.arrays_buffer
  1039. for name in self.scope.names:
  1040. if self.is_used(name):
  1041. self.buffer.emit(
  1042. "{}:0", name
  1043. )
  1044. if "main" not in self.funcs:
  1045. raise Exception("Missing 'main` function.")
  1046. return self.buffer.generate() + "\n"
  1047. wmc = WMC()
  1048. try:
  1049. if len(sys.argv) == 3:
  1050. with open(sys.argv[1], "r") as fin:
  1051. with open(sys.argv[2], "w") as fout:
  1052. fout.write(wmc.compile(fin.read()))
  1053. else:
  1054. sys.stdout.write(wmc.compile(sys.stdin.read()))
  1055. except Exception as e:
  1056. #__import__('traceback').print_exc()
  1057. print(e)
  1058. sys.exit(1)