| author | Christian Urban <christian.urban@kcl.ac.uk> | 
| Mon, 20 Oct 2025 22:18:21 +0200 | |
| changeset 1013 | 1a23d87d1700 | 
| parent 976 | e9eac62928f5 | 
| permissions | -rw-r--r-- | 
| 901 | 1 | |
| 626 | 2 | // A Small Compiler for a Simple Functional Language | 
| 813 | 3 | // - includes a lexer and a parser | 
| 4 | // - performs tail-call optimisations | |
| 5 | // | |
| 6 | // call with | |
| 7 | // | |
| 956 | 8 | // amm funt.sc main defs.fun | 
| 9 | // amm funt.sc main fact.fun | |
| 813 | 10 | // | 
| 11 | // or | |
| 12 | // | |
| 956 | 13 | // amm funt.sc run defs.fun | 
| 14 | // amm funt.sc run fact.fun | |
| 813 | 15 | // | 
| 16 | // the first prints out the JVM instructions | |
| 17 | // the second runs the generated class files | |
| 18 | ||
| 626 | 19 | |
| 789 | 20 | import $file.fun_tokens, fun_tokens._ | 
| 21 | import $file.fun_parser, fun_parser._ | |
| 626 | 22 | |
| 541 
885cf83ebce3
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 23 | // compiler - built-in functions | 
| 
885cf83ebce3
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 24 | // copied from http://www.ceng.metu.edu.tr/courses/ceng444/link/jvm-cpm.html | 
| 
885cf83ebce3
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 25 | // | 
| 
885cf83ebce3
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 26 | |
| 
885cf83ebce3
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
// Jasmin prelude that is put in front of every compiled program: the class
// header and the built-in `write` method, which prints an integer with
// println. "XXX" is a placeholder that `compile` replaces with the class name.
val library: String =
  """
    |.class public XXX.XXX
    |.super java/lang/Object
    |
    |.method public static write(I)V
    |.limit locals 1
    |.limit stack 2
    |getstatic java/lang/System/out Ljava/io/PrintStream;
    |iload 0
    |invokevirtual java/io/PrintStream/println(I)V
    |return
    |.end method
    |
    |""".stripMargin
| 
885cf83ebce3
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 41 | |
| 626 | 42 | // calculating the maximal needed stack size | 
// Over-approximates the operand-stack depth needed to evaluate `e`; the
// result is used for the `.limit stack` directive of a compiled function.
def max_stack_exp(e: Exp): Int = e match {
  // All arguments are pushed before the call and the call leaves its result
  // on the stack, so even a call without arguments occupies one slot.
  // (Without the lower bound, `g() + h()` was estimated too small.)
  case Call(_, args) => math.max(1, args.map(max_stack_exp).sum)
  case If(a, e1, e2) =>
    max_stack_bexp(a) + math.max(max_stack_exp(e1), max_stack_exp(e2))
  // one extra slot for the `dup` emitted before the call to write
  case Write(e) => max_stack_exp(e) + 1
  case Var(_) => 1
  case Num(_) => 1
  case Aop(_, a1, a2) => max_stack_exp(a1) + max_stack_exp(a2)
  case Sequence(e1, e2) => math.max(max_stack_exp(e1), max_stack_exp(e2))
}
| 789 | 53 | |
// Stack estimate for a comparison: the estimates of the two operands are
// simply added up.
def max_stack_bexp(e: BExp): Int = e match {
  case Bop(_, lhs, rhs) => List(lhs, rhs).map(max_stack_exp).sum
}
| 57 | ||
| 58 | ||
| 541 
885cf83ebce3
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 59 | // for generating new labels | 
| 
885cf83ebce3
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
// running index shared by all generated labels; the first label gets 0
var counter = -1

// Returns a label that has not been handed out before: the given prefix
// followed by "_" and the next value of `counter`, e.g. "If_else_0".
def Fresh(x: String) = {
  counter += 1
  s"${x}_${counter}"
}
| 
885cf83ebce3
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 66 | |
| 626 | 67 | // convenient string interpolations | 
| 68 | // for instructions, labels and methods | |
extension (sc: StringContext) {
  // instructions: prefixed with a blank and terminated by a newline
  def i(args: Any*): String = s" ${sc.s(args*)}\n"
  // labels: the interpolated name followed by a colon and a newline
  def l(args: Any*): String = s"${sc.s(args*)}:\n"
  // methods (directives and the like): only newline-terminated
  def m(args: Any*): String = s"${sc.s(args*)}\n"
}
| 74 | ||
| 541 
885cf83ebce3
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 75 | |
| 626 | 76 | type Env = Map[String, Int] | 
| 77 | ||
// Maps an arithmetic operator of the source language to the JVM integer
// instruction implementing it; any other operator ends in a MatchError.
def compile_op(op: String) = {
  val mnemonic = op match {
    case "+" => "iadd"
    case "-" => "isub"
    case "*" => "imul"
    case "/" => "idiv"
    case "%" => "irem"
  }
  i"$mnemonic"
}
| 626 | 85 | |
// Translates an expression into Jasmin instructions that leave its value on
// the operand stack. `env` maps variable names to local-variable indices.
// `name` is the function whose body is being compiled, as long as `a` is in
// tail position; sub-expressions that are not in tail position are compiled
// with "" instead, so that no call inside them is turned into a jump.
def compile_expT(a: Exp, env : Env, name: String) : String = {
  // compiles a sub-expression that is not in tail position
  val non_tail = (e: Exp) => compile_expT(e, env, "")

  a match {
    case Num(n) => i"ldc $n"
    case Var(x) => i"iload ${env(x)}"
    case Aop(op, lhs, rhs) =>
      non_tail(lhs) ++ non_tail(rhs) ++ compile_op(op)
    case If(cond, then_branch, else_branch) =>
      // the else-label is drawn before the end-label
      val else_label = Fresh("If_else")
      val end_label = Fresh("If_end")
      List(
        compile_bexpT(cond, env, else_label),
        compile_expT(then_branch, env, name),
        i"goto $end_label",
        l"$else_label",
        compile_expT(else_branch, env, name),
        l"$end_label"
      ).mkString
    case Call(fn, args) =>
      val pushed = args.map(non_tail).mkString
      if (name == fn) {
        // tail call to the function itself: overwrite the parameters and
        // jump back to the start; the last argument is on top of the stack,
        // hence the stores run from the highest index downwards
        val stores = args.indices.reverse.map(k => i"istore $k").mkString
        pushed ++ stores ++ i"goto ${fn}_Start"
      } else {
        // normal call: one "I" per argument in the method descriptor
        val signature = "I" * args.length
        pushed ++ i"invokestatic XXX/XXX/${fn}(${signature})I"
      }
    case Sequence(first, second) =>
      // the value of the first expression is discarded
      non_tail(first) ++ i"pop" ++ compile_expT(second, env, name)
    case Write(arg) =>
      // duplicate the value so that one copy remains after write consumed it
      non_tail(arg) ++ i"dup" ++ i"invokestatic XXX/XXX/write(I)V"
  }
}
| 
885cf83ebce3
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 120 | |
// Compiles a comparison: both operands are evaluated and control jumps to
// `jmp` when the comparison does NOT hold, which is why each operator is
// paired with the opposite conditional jump.
def compile_bexpT(b: BExp, env : Env, jmp: String) : String = {
  val (lhs, rhs, jump_if_false) = b match {
    case Bop("==", a1, a2) => (a1, a2, "if_icmpne")
    case Bop("!=", a1, a2) => (a1, a2, "if_icmpeq")
    case Bop("<", a1, a2) => (a1, a2, "if_icmpge")
    case Bop("<=", a1, a2) => (a1, a2, "if_icmpgt")
  }
  compile_expT(lhs, env, "") ++
  compile_expT(rhs, env, "") ++
  i"$jump_if_false $jmp"
}
| 
885cf83ebce3
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 131 | |
| 
885cf83ebce3
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 132 | |
// Compiles a single declaration into a Jasmin method: a function definition
// becomes a static method taking and returning ints, the main expression
// becomes the `main` method, which prints its result via write.
def compile_decl(d: Decl) : String = d match {
  case Def(name, args, body) =>
    // the parameters occupy the local variables 0, 1, 2, ...
    val slots = args.zipWithIndex.toMap
    val signature = "I" * args.length
    val header =
      m".method public static $name($signature)I" ++
      m".limit locals ${args.length}" ++
      m".limit stack ${1 + max_stack_exp(body)}" ++
      l"${name}_Start"   // jump target for optimised tail calls
    header ++ compile_expT(body, slots, name) ++ i"ireturn" ++ m".end method\n"
  case Main(body) =>
    List(
      m".method public static main([Ljava/lang/String;)V",
      m".limit locals 200",
      m".limit stack 200",
      compile_expT(body, Map(), ""),
      i"invokestatic XXX/XXX/write(I)V",
      i"return",
      m".end method"
    ).mkString
}
| 
885cf83ebce3
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 155 | |
| 626 | 156 | // main compiler functions | 
// Generates the complete Jasmin file for a program: the library prelude
// followed by all compiled declarations, with every "XXX" placeholder
// replaced by the class name.
def compile(prog: List[Decl], class_name: String) : String = {
  val pieces = library :: prog.map(compile_decl)
  pieces.mkString.replace("XXX", class_name)
}
| 161 | ||
| 869 
81ee93b87258
changed os-lib as a replacement for ammonite-ops
 Christian Urban <christian.urban@kcl.ac.uk> parents: 
813diff
changeset | 162 | // pre-2.5.0 ammonite | 
| 
81ee93b87258
changed os-lib as a replacement for ammonite-ops
 Christian Urban <christian.urban@kcl.ac.uk> parents: 
813diff
changeset | 163 | // import ammonite.ops._ | 
| 
81ee93b87258
changed os-lib as a replacement for ammonite-ops
 Christian Urban <christian.urban@kcl.ac.uk> parents: 
813diff
changeset | 164 | |
| 
81ee93b87258
changed os-lib as a replacement for ammonite-ops
 Christian Urban <christian.urban@kcl.ac.uk> parents: 
813diff
changeset | 165 | // post 2.5.0 ammonite | 
| 901 | 166 | import os._ | 
| 813 | 167 | |
// Writes the generated Jasmin code to <class_name>.j in the current working
// directory, overwriting an existing file.
def compile_to_file(prog: List[Decl], class_name: String) : Unit = {
  val target = os.pwd / s"$class_name.j"
  os.write.over(target, compile(prog, class_name))
}
| 170 | ||
// Compiles the program to a .j file, assembles it with jasmin.jar and then
// runs the resulting class, reporting each step on the console.
def compile_and_run(prog: List[Decl], class_name: String) : Unit = {
  println(s"Start of compilation")
  compile_to_file(prog, class_name)
  println(s"generated $class_name.j file")

  // assemble the .j file into a class file
  val assemble = os.proc("java", "-jar", "jasmin.jar", s"$class_name.j")
  assemble.call()
  println(s"generated $class_name.class file")

  println(s"Run program")
  // the output of the program is passed through to the console
  val execute = os.proc("java", s"${class_name}/${class_name}")
  execute.call(stdout = os.Inherit)
  println(s"done.")
}
| 181 | ||
| 789 | 182 | |
// Prints the Jasmin code generated for the program in the file `fname`.
// `fname` may be a plain file name, a relative path with directories or an
// absolute path; relative paths are resolved against the working directory.
@main
def main(fname: String) = {
    // os.Path(_, base) parses multi-segment and absolute paths, whereas
    // `os.pwd / fname` rejects every name that contains a "/"
    val path = os.Path(fname, os.pwd)
    // the class name is the file name without directories and extension
    val class_name = path.baseName
    val tks = tokenise(os.read(path))
    val ast = parse_tks(tks)
    println(compile(ast, class_name))
}
| 191 | ||
// Compiles the program in the file `fname`, assembles it and runs the
// generated class. `fname` may be a plain file name, a relative path with
// directories or an absolute path; relative paths are resolved against the
// working directory.
@main
def run(fname: String) = {
    // os.Path(_, base) parses multi-segment and absolute paths, whereas
    // `os.pwd / fname` rejects every name that contains a "/"
    val path = os.Path(fname, os.pwd)
    // the class name is the file name without directories and extension
    val class_name = path.baseName
    val tks = tokenise(os.read(path))
    val ast = parse_tks(tks)
    compile_and_run(ast, class_name)
}