| author | Christian Urban <christian.urban@kcl.ac.uk> | 
| Tue, 21 Oct 2025 17:09:56 +0200 | |
| changeset 1014 | 184a13ff50ed | 
| parent 789 | 966c9fd84693 | 
| permissions | -rw-r--r-- | 
| 625 | 1 | // A Small Compiler for a Simple Functional Language | 
| 644 | 2 | // (includes an external lexer and parser) | 
| 645 | 3 | // | 
| 4 | // call with | |
| 5 | // | |
| 735 
0426cd1336f7
updatd
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
734diff
changeset | 6 | // amm fun.scala fact | 
| 645 | 7 | // | 
| 735 
0426cd1336f7
updatd
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
734diff
changeset | 8 | // amm fun.scala defs | 
| 645 | 9 | // | 
| 10 | // this will generate a .j file and run the jasmin | |
| 11 | // assembler (installed at jvm/jasmin-2.4/jasmin.jar) | |
| 12 | // it runs the resulting JVM file twice for timing | |
| 13 | // purposes. | |
| 220 
141041fc76b5
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 14 | |
| 645 | 15 | |
| 16 | import java.io._ | |
| 17 | import scala.util._ | |
| 18 | import scala.sys.process._ | |
| 19 | ||
// Abstract syntax trees for the Fun language
//
// All node classes are Serializable because the trees are read back
// with Java object deserialisation (see deserialise below).
// NOTE(review): presumably these declarations must stay identical to
// the ones used by the external parser that writes the .prs files --
// confirm before adding modifiers such as `final`.
abstract class Exp extends Serializable
abstract class BExp extends Serializable
abstract class Decl extends Serializable

// top-level declarations: a named function and the main expression
case class Def(name: String, args: List[String], body: Exp) extends Decl
case class Main(e: Exp) extends Decl

// integer-valued expressions
case class Call(name: String, args: List[Exp]) extends Exp
case class If(a: BExp, e1: Exp, e2: Exp) extends Exp
case class Write(e: Exp) extends Exp
case class Var(s: String) extends Exp
case class Num(i: Int) extends Exp
case class Aop(o: String, a1: Exp, a2: Exp) extends Exp
case class Sequence(e1: Exp, e2: Exp) extends Exp

// boolean comparisons (only used as the condition of an If)
case class Bop(o: String, a1: Exp, a2: Exp) extends BExp
| 36 | ||
| 37 | ||
// compiler - built-in functions
// copied from http://www.ceng.metu.edu.tr/courses/ceng444/link/jvm-cpm.html
//
// Jasmin prelude that every generated file starts with: the class
// header and a static write(I)V method that prints an integer via
// System.out.println. The placeholder XXX is replaced by the actual
// class name in compile.

val library = """
.class public XXX.XXX
.super java/lang/Object

.method public static write(I)V
.limit locals 1
.limit stack 2
getstatic java/lang/System/out Ljava/io/PrintStream;
iload 0
invokevirtual java/io/PrintStream/println(I)V
return
.end method

"""
| 
141041fc76b5
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 56 | |
// calculating the maximal needed stack size
//
// Both functions return an upper bound on the number of operand-stack
// slots the code generated by compile_exp / compile_bexp needs.
def max_stack_exp(e: Exp): Int = e match {
  // the result of a call always occupies one slot, even when the
  // call has no arguments (otherwise f() + g() would be estimated
  // at 0 although two results are on the stack at the same time)
  case Call(_, args) => math.max(1, args.map(max_stack_exp).sum)
  case If(a, e1, e2) =>
    max_stack_bexp(a) + math.max(max_stack_exp(e1), max_stack_exp(e2))
  // Write duplicates the value before printing it
  case Write(e) => max_stack_exp(e) + 1
  case Var(_) => 1
  case Num(_) => 1
  case Aop(_, a1, a2) => max_stack_exp(a1) + max_stack_exp(a2)
  // the result of e1 is popped before e2 is evaluated
  case Sequence(e1, e2) => math.max(max_stack_exp(e1), max_stack_exp(e2))
}

// stack bound for a comparison: both operands are on the stack
def max_stack_bexp(e: BExp): Int = e match {
  case Bop(_, a1, a2) => max_stack_exp(a1) + max_stack_exp(a2)
}
| 72 | ||
| 73 | ||
// for generating new labels
//
// counter holds the number used for the most recently generated
// label; it starts at -1 so that the first label gets the suffix 0
var counter = -1

// returns the prefix x followed by "_" and the next counter value;
// every call increments the shared counter, so no two calls return
// the same string for the same prefix
def Fresh(x: String): String = {
  counter += 1
  s"${x}_${counter}"
}
| 
141041fc76b5
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 81 | |
| 625 | 82 | // convenient string interpolations | 
| 83 | // for instructions, labels and methods | |
| 84 | import scala.language.implicitConversions | |
| 85 | import scala.language.reflectiveCalls | |
| 86 | ||
// Adds the interpolators i"...", l"..." and m"..." to string literals.
// An implicit class is used instead of an anonymous structural type,
// so calling the interpolators does not go through reflection.
implicit class sring_inters(sc: StringContext) {
  // instruction: indented and terminated by a newline
  def i(args: Any*): String = " " ++ sc.s(args: _*) ++ "\n"
  // label: followed by a colon and a newline
  def l(args: Any*): String = sc.s(args: _*) ++ ":\n"
  // method directive: unindented line terminated by a newline
  def m(args: Any*): String = sc.s(args: _*) ++ "\n"
}
| 92 | ||
| 220 
141041fc76b5
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 93 | |
// maps a variable name to the index of the JVM local holding it
type Env = Map[String, Int]

// compile expressions
//
// Returns the Jasmin instructions for the expression a; the
// generated code leaves exactly one integer on the operand stack.
// Variables are looked up in env (an unbound variable makes the
// lookup throw); an arithmetic operator other than + - * / % raises
// a MatchError.
def compile_exp(a: Exp, env : Env) : String = a match {
  case Num(i) => i"ldc $i"
  case Var(s) => i"iload ${env(s)}"
  case Aop(op, a1, a2) => {
    // JVM integer instruction for the arithmetic operator
    val instr = op match {
      case "+" => "iadd"
      case "-" => "isub"
      case "*" => "imul"
      case "/" => "idiv"
      case "%" => "irem"
    }
    compile_exp(a1, env) ++ compile_exp(a2, env) ++ i"$instr"
  }
  case If(b, a1, a2) => {
    val if_else = Fresh("If_else")
    val if_end = Fresh("If_end")
    // the condition jumps to if_else when it does NOT hold
    compile_bexp(b, env, if_else) ++
    compile_exp(a1, env) ++
    i"goto $if_end" ++
    l"$if_else" ++
    compile_exp(a2, env) ++
    l"$if_end"
  }
  case Call(name, args) => {
    // every argument is an int, hence one "I" per argument
    val is = "I" * args.length
    args.map(a => compile_exp(a, env)).mkString ++
    i"invokestatic XXX/XXX/$name($is)I"
  }
  case Sequence(a1, a2) => {
    // the value of the first expression is discarded
    compile_exp(a1, env) ++ i"pop" ++ compile_exp(a2, env)
  }
  case Write(a1) => {
    // dup keeps a copy on the stack, so Write also yields the value
    compile_exp(a1, env) ++
    i"dup" ++
    i"invokestatic XXX/XXX/write(I)V"
  }
}
| 
141041fc76b5
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 129 | |
// compile boolean expressions
//
// Generates code that evaluates both operands and jumps to the label
// jmp when the comparison does NOT hold; when it holds, execution
// falls through to the code that follows. A comparison operator
// other than == != < <= raises a MatchError.
def compile_bexp(b: BExp, env : Env, jmp: String) : String = b match {
  case Bop(op, a1, a2) => {
    // conditional jump testing the negation of the operator
    val negated_jump = op match {
      case "==" => "if_icmpne"
      case "!=" => "if_icmpeq"
      case "<"  => "if_icmpge"
      case "<=" => "if_icmpgt"
    }
    compile_exp(a1, env) ++ compile_exp(a2, env) ++ i"$negated_jump $jmp"
  }
}
| 
141041fc76b5
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 141 | |
// compile function for declarations and main
//
// A Def becomes a static JVM method taking and returning ints; its
// arguments are stored in the locals 0, 1, ... in declaration order.
// Main becomes the JVM main method, which prints the value of its
// expression via the library function write.
def compile_decl(d: Decl) : String = d match {
  case Def(name, args, a) => {
    val env = args.zipWithIndex.toMap
    val is = "I" * args.length
    m".method public static $name($is)I" ++
    m".limit locals ${args.length}" ++
    m".limit stack ${1 + max_stack_exp(a)}" ++
    l"${name}_Start" ++
    compile_exp(a, env) ++
    i"ireturn" ++
    m".end method\n"
  }
  case Main(a) => {
    // 200 is kept as the minimum, but the limit grows when the
    // estimate for the main expression is larger than that
    val stack_limit = math.max(200, 1 + max_stack_exp(a))
    m".method public static main([Ljava/lang/String;)V" ++
    m".limit locals 200" ++
    m".limit stack $stack_limit" ++
    compile_exp(a, Map()) ++
    i"invokestatic XXX/XXX/write(I)V" ++
    i"return" ++
    m".end method\n"
  }
}
| 
141041fc76b5
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 165 | |
| 626 | 166 | // main compiler functions | 
| 220 
141041fc76b5
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 167 | |
// Evaluates code i times and returns the average wall-clock time of
// one evaluation in seconds. code is a by-name parameter, so it is
// re-evaluated in every round. For i <= 0 nothing is evaluated and
// the result is not a meaningful time (division by zero on doubles).
def time_needed[T](i: Int, code: => T): Double = {
  val start = System.nanoTime()
  (1 to i).foreach(_ => code)
  val end = System.nanoTime()
  (end - start) / (i * 1.0e9)
}
| 
141041fc76b5
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 174 | |
// Reads one Java-serialised object from the file fname and casts it
// to T. Any exception (missing file, corrupt data, ...) is returned
// as a Failure; the stream is closed in either case.
//
// The cast is unchecked: because of erasure a wrong T only shows up
// when the result is used. Java deserialisation can instantiate
// arbitrary classes, so only files from a trusted source should be
// passed in.
def deserialise[T](fname: String) : Try[T] = {
  import scala.util.Using
  Using(new ObjectInputStream(new FileInputStream(fname))) {
    in => in.readObject().asInstanceOf[T]
  }
}
| 181 | ||
// Reads the serialised declarations from <class_name>.prs, compiles
// each of them and returns the complete Jasmin file as a string
// (library prelude followed by the generated methods, with the
// placeholder XXX replaced by class_name).
//
// If the .prs file cannot be read, a warning is printed on stderr
// and only the prelude is generated.
def compile(class_name: String) : String = {
  val ast = deserialise[List[Decl]](class_name ++ ".prs") match {
    case Success(decls) => decls
    case Failure(ex) => {
      Console.err.println(
        s"Warning: cannot read ${class_name}.prs (${ex}); no declarations compiled")
      Nil
    }
  }
  val instructions = ast.map(compile_decl).mkString
  // String.replace substitutes every literal occurrence (no regex)
  (library + instructions).replace("XXX", class_name)
}
| 187 | ||
// Compiles <class_name>.prs and writes the result to <class_name>.j,
// overwriting an existing file. Only java.io is used for writing, so
// the Scala compiler classes need not be on the classpath; the
// writer is closed even if writing fails.
def compile_to_file(class_name: String) = {
  val output = compile(class_name)
  Using.resource(new BufferedWriter(new FileWriter(s"${class_name}.j"))) {
    out => out.write(output)
  }
}
| 192 | ||
// Generates <class_name>.j, assembles it with jasmin, then runs the
// resulting class once and prints the measured time in seconds.
//
// The commands are given as argument sequences, so they are not
// split at whitespace. `!!` throws if jasmin exits with a non-zero
// code; the exit code of the compiled program is ignored.
def compile_and_run(class_name: String) : Unit = {
  compile_to_file(class_name)
  Seq("java", "-jar", "jvm/jasmin-2.4/jasmin.jar", s"${class_name}.j").!!
  val run_cmd = Seq("java", s"${class_name}/${class_name}")
  println("Time: " + time_needed(1, run_cmd.!))
}
| 
141041fc76b5
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 198 | |
| 
141041fc76b5
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 199 | |
| 626 | 200 | // some examples of .fun files | 
| 645 | 201 | //compile_to_file("fact")
 | 
| 202 | //compile_and_run("fact")
 | |
| 203 | //compile_and_run("defs")
 | |
| 204 | ||
| 644 | 205 | |
// Entry point: the first argument is the name of the program to
// compile and run (the file <name>.prs is read). Without an argument
// a usage message is printed instead of failing on args(0).
def main(args: Array[String]) : Unit = args.headOption match {
  case Some(class_name) => compile_and_run(class_name)
  case None => Console.err.println("usage: amm fun.scala <name>")
}
| 644 | 208 | |
| 209 | ||
| 649 | 210 | } |