// A Small Compiler for the WHILE Language
// (stub for including arrays)
// the abstract syntax trees
// Base class of all statement nodes.
abstract class Stmt
// Base class of all arithmetic-expression nodes.
abstract class AExp
// Base class of all boolean-expression nodes.
abstract class BExp
// A block is a list of statements.
type Block = List[Stmt]
// statements
// The no-op statement.
case object Skip extends Stmt
// Conditional: a is the condition, bl1 the then-block, bl2 the else-block.
case class If(a: BExp, bl1: Block, bl2: Block) extends Stmt
// Loop: bl is repeated while b holds.
case class While(b: BExp, bl: Block) extends Stmt
// Assignment of the value of a to the variable named s.
case class Assign(s: String, a: AExp) extends Stmt
// Array assignment s[a1] := a2.
case class AssignA(s: String, a1: AExp, a2: AExp) extends Stmt
case class Write(s: String) extends Stmt // writes out a variable
// Declaration of an array named s with n elements.
// NOTE(review): this name hides scala.Array wherever these definitions are in scope.
case class Array(s: String, n: Int) extends Stmt
// arithmetic expressions
// Reference to the variable named s.
case class Var(s: String) extends AExp
// Integer literal.
case class Num(i: Int) extends AExp
// Binary arithmetic operation; o is the operator symbol ("+", "-" or "*" are compiled).
case class Aop(o: String, a1: AExp, a2: AExp) extends AExp
// Array read s[a1].
case class Ref(s: String, a1: AExp) extends AExp
// boolean expressions
case object True extends BExp
case object False extends BExp
// Comparison of two arithmetic expressions; o is the operator symbol ("=", "!=" or "<" are compiled).
case class Bop(o: String, a1: AExp, a2: AExp) extends BExp
// compiler headers needed for the JVM
// (contains an init method, as well as methods for read and write)
val beginning = """
.class public XXX.XXX
.super java/lang/Object
.method public <init>()V
invokenonvirtual java/lang/Object/<init>()V
.end method
.method public static write(I)V
.limit locals 1
.limit stack 2
getstatic java/lang/System/out Ljava/io/PrintStream;
iload 0
invokevirtual java/io/PrintStream/print(C)V
.end method
.method public static main([Ljava/lang/String;)V
.limit locals 200
.limit stack 200
val ending = """
.end method
println("Start compilation")
// for generating new labels
// Running counter behind Fresh; starts at -1 so that the first label gets suffix 0.
var counter = -1

// Returns a new label of the form "<x>_<k>", where k is the next counter value.
// Side effect: increments `counter`, so successive calls never return the same label.
def Fresh(x: String) : String = {
  counter += 1
  s"${x}_${counter}"
}
// environments and instructions
type Env = Map[String, String]
type Instrs = List[String]
// arithmetic expression compilation
// Translates an arithmetic expression into a list of JVM (Jasmin) instructions.
//   a   - the expression to translate
//   env - maps variable and array names to the local-variable index used in
//         iload/aload instructions
// Operands are emitted left to right, followed by the operator instruction.
// A name missing from env makes env(s) throw; an Aop whose operator is not
// "+", "-" or "*" is not matched by any case (MatchError).
def compile_aexp(a: AExp, env : Env) : Instrs = a match {
  case Num(i) => List(s"ldc ${i}\n")
  case Var(s) => List(s"iload ${env(s)}\n")
  case Aop("+", a1, a2) =>
    compile_aexp(a1, env) ++ compile_aexp(a2, env) ++ List("iadd\n")
  case Aop("-", a1, a2) =>
    compile_aexp(a1, env) ++ compile_aexp(a2, env) ++ List("isub\n")
  case Aop("*", a1, a2) =>
    compile_aexp(a1, env) ++ compile_aexp(a2, env) ++ List("imul\n")
  case Ref(s, a1) =>
    // array reference first, then the index, then the element load
    List(s"aload ${env(s)}\n") ++ compile_aexp(a1, env) ++ List("iaload \n")
}
// boolean expression compilation
// Translates a boolean expression into JVM (Jasmin) instructions that jump to
// the label `jmp` when the condition does NOT hold and fall through otherwise.
//   b   - the condition
//   env - variable environment passed on to compile_aexp
//   jmp - label to branch to when the condition is false
// Each comparison therefore emits the negated branch (e.g. "=" emits if_icmpne).
// A Bop whose operator is not "=", "!=" or "<" is not matched (MatchError).
def compile_bexp(b: BExp, env : Env, jmp: String) : Instrs = b match {
  case True => Nil
  case False => List(s"goto ${jmp}\n")
  case Bop("=", a1, a2) =>
    compile_aexp(a1, env) ++ compile_aexp(a2, env) ++ List(s"if_icmpne ${jmp}\n")
  case Bop("!=", a1, a2) =>
    compile_aexp(a1, env) ++ compile_aexp(a2, env) ++ List(s"if_icmpeq ${jmp}\n")
  case Bop("<", a1, a2) =>
    compile_aexp(a1, env) ++ compile_aexp(a2, env) ++ List(s"if_icmpge ${jmp}\n")
}
// statement compilation
def compile_stmt(s: Stmt, env: Env) : (Instrs, Env) = s match {
case Skip => (Nil, env)
case Assign(x, a) => {
val index = if (env.isDefinedAt(x)) env(x) else
(compile_aexp(a, env) ++
List("istore " + index + "\n"), env + (x -> index))
case If(b, bl1, bl2) => {
val if_else = Fresh("If_else")
val if_end = Fresh("If_end")
val (instrs1, env1) = compile_block(bl1, env)
val (instrs2, env2) = compile_block(bl2, env1)
(compile_bexp(b, env, if_else) ++
instrs1 ++
List("goto " + if_end + "\n") ++
List("\n" + if_else + ":\n\n") ++
instrs2 ++
List("\n" + if_end + ":\n\n"), env2)
case While(b, bl) => {
val loop_begin = Fresh("Loop_begin")
val loop_end = Fresh("Loop_end")
val (instrs1, env1) = compile_block(bl, env)
(List("\n" + loop_begin + ":\n\n") ++
compile_bexp(b, env, loop_end) ++
instrs1 ++
List("goto " + loop_begin + "\n") ++
List("\n" + loop_end + ":\n\n"), env1)
case Write(x) =>
(List("iload " + env(x) + "\n" +
"invokestatic XXX/XXX/write(I)V\n"), env)
case Array(s, n) => {
val index = if (env.isDefinedAt(s)) throw new Exception("Array already defined") else
148 |
149 |
150 |
151 |
case AssignA(s, a1, a2) => {
val index = if (env.isDefinedAt(s)) env(s) else
throw new Exception("Array not yet defined")
(List("aload " + index + "\n") ++
compile_aexp(a1, env) ++
158 |
161 |
// compilation of a block (i.e. list of instructions)
case Nil => (Nil, env)
case s::bl => {
val (instrs1, env1) = compile_stmt(s, env)
val (instrs2, env2) = compile_block(bl, env1)
(instrs1 ++ instrs2, env2)
169 |
// main compilation function for blocks
// Compiles a whole program to Jasmin assembly text.
//   bl         - the program, compiled starting from an empty environment
//   class_name - substituted for every literal "XXX" in the generated text
// Returns `beginning`, the program's instructions and `ending` concatenated.
def compile(bl: Block, class_name: String) : String = {
  val instructions = compile_block(bl, Map.empty)._1
  val assembly = beginning ++ instructions.mkString ++ ending
  // String.replace substitutes every literal occurrence (no regex), which is
  // what the deprecated replaceAllLiterally did.
  assembly.replace("XXX", class_name)
}
// compiling and running files
// JVM files can be assembled with
// java -jar jvm/jasmin-2.4/jasmin.jar fib.j
// and started with
187 |
191 |
import scala.util._
import scala.sys.process._
import scala.io
def compile_tofile(bl: Block, class_name: String) = {
val output = compile(bl, class_name)
val fw = new java.io.FileWriter(class_name + ".j")
// Writes the Jasmin file for `bl` via compile_tofile and then assembles it
// with the jasmin jar, printing a progress line after each step.
//   bl         - the program to compile
//   class_name - base name of the generated ".j" file
def compile_all(bl: Block, class_name: String) : Unit = {
  compile_tofile(bl, class_name)
  println("compiled ")
  // `!!` runs the command, waits for it and throws if the exit code is
  // non-zero; the captured output is not used.
  s"java -jar jvm/jasmin-2.4/jasmin.jar ${class_name}.j".!!
  println("assembled ")
}
// Runs `code` i times and returns the average wall-clock time per run in seconds.
//   i    - number of repetitions; with i = 0 the result is a floating-point
//          division by zero, not a meaningful time
//   code - by-name block, re-evaluated on every repetition
def time_needed[T](i: Int, code: => T) : Double = {
  val started = System.nanoTime()
  (1 to i).foreach(_ => code)
  val elapsedNanos = System.nanoTime() - started
  elapsedNanos / (i * 1.0e9)
}
// Compiles and assembles `bl` via compile_all, then runs the resulting class
// with `java` and prints the time that run took.
//   bl         - the program to compile
//   class_name - used both as the directory and the class to start
def compile_run(bl: Block, class_name: String) : Unit = {
  println("Start compilation")
  compile_all(bl, class_name)
  val command = "java " + class_name + "/" + class_name
  // command.! is passed by name, so the process is started inside time_needed
  println("Time: " + time_needed(1, command.!))
}
// Fibonacci numbers as a test-case
val fib_test =
List(Assign("n", Num(10)), // n := 10;
Assign("minus1",Num(0)), // minus1 := 0;
Assign("temp",Num(0)), // temp := 0;
While(Bop("<",Num(0),Var("n")), // while n > 0 do {
List(Assign("temp",Var("minus2")), // temp := minus2;
233 |
234 |
235 |
236 |
237 |
// Array test-case: declares two arrays, stores one element in each,
// reads each element back into x and writes x.
val arr_test =
List(Array("a", 10), // a[10]
Array("b", 2), // b[2]
AssignA("a", Num(0), Num(10)), // a[0] := 10
Assign("x", Ref("a", Num(0))), // x := a[0]
Write("x"), // write x
AssignA("b", Num(1), Num(5)), // b[1] := 5
Assign("x", Ref("b", Num(1))), // x := b[1]
Write("x")) // write x
252 |
253 |
255 |
// Parser Combinators
258 |
import scala.language.implicitConversions
import scala.language.reflectiveCalls
262 |
abstract class Parser[I <% Seq[_], T] {
def parse(ts: I): Set[(T, I)]
266 |
269 |
def parse(sb: I) =
273 |
281 |
def parse(sb: I) =
282 |
for ((head, tail) <- p.parse(sb)) yield (f(head), tail)
283 |
284 |
285 |
286 |
import scala.util.matching.Regex
// Parser that matches the regular expression `reg` at the start of the input.
// On a match it returns one result, (matched text, remaining input);
// otherwise it returns the empty set.
case class RegexParser(reg: Regex) extends Parser[String, String] {
  def parse(sb: String) : Set[(String, String)] =
    reg.findPrefixMatchOf(sb) match {
      case Some(m) => Set((m.matched, m.after.toString))
      case None => Set()
    }
}
293 |
// Parser for the literal string s; the string is regex-quoted so that
// characters such as "(" or "+" are matched verbatim.
def StringParser(s: String) : RegexParser = RegexParser(Regex.quote(s).r)
295 |
296 |
// Implicit conversion that lets a plain string be used where a parser is
// expected; the result type is declared explicitly, as recommended for implicits.
implicit def string2parser(s : String) : RegexParser = StringParser(s)
298 |
// Adds combinator syntax to any parser p:
//   p | q    builds an AltParser from p and q
//   p ==> f  builds a FunParser from p and the function f
//   p ~ q    builds a SeqParser from p and q
// q and f are taken by name, which allows grammar rules to refer to each
// other recursively. The result is an anonymous structural type, hence the
// reflectiveCalls import in this file.
implicit def ParserOps[I<% Seq[_], T](p: Parser[I, T]) = new {
  def | (q : => Parser[I, T]) = new AltParser[I, T](p, q)
  def ==>[S] (f: => T => S) = new FunParser[I, T, S](p, f)
  def ~[S] (q : => Parser[I, S]) = new SeqParser[I, T, S](p, q)
}
304 |
// Adds the same combinator syntax (|, ==>, ~) directly to strings, so that a
// grammar rule may start with a string literal. The string s, and a string
// right-hand side r, are turned into parsers by the implicit string2parser
// conversion.
implicit def StringOps(s: String) = new {
  def | (q : => Parser[String, String]) = new AltParser[String, String](s, q)
  def | (r: String) = new AltParser[String, String](s, r)
  def ==>[S] (f: => String => S) = new FunParser[String, String, S](s, f)
  def ~[S](q : => Parser[String, S]) =
    new SeqParser[String, String, S](s, q)
  def ~ (r: String) =
    new SeqParser[String, String, String](s, r)
}
314 |
315 |
// Parser for a non-empty run of decimal digits, converted to an Int.
// NOTE(review): toInt throws NumberFormatException for digit strings beyond the Int range.
val NumParser = RegexParser("[0-9]+".r) ==> (s => s.toInt : Int)
// Parser for identifiers: a lower-case letter followed by lower-case letters
// or digits. The character class previously read "[a-z,0-9]", which also
// accepted a literal comma as part of an identifier.
val IdParser = RegexParser("[a-z][a-z0-9]*".r)
318 |
319 |
320 |
321 |
// Grammar Rules
322 |
// Arithmetic expressions: a term, optionally followed by "+" or "-" and
// another expression.
// NOTE(review): the rule recurses on the right, so "a - b - c" is parsed as
// "a - (b - c)".
lazy val AExp: Parser[String, AExp] =
  (Te ~ "+" ~ AExp) ==> { case ((x, _), z) => Aop("+", x, z):AExp } |
  (Te ~ "-" ~ AExp) ==> { case ((x, _), z) => Aop("-", x, z):AExp } | Te
// Terms: a factor, optionally followed by "*" and another term.
lazy val Te: Parser[String, AExp] =
  (Fa ~ "*" ~ Te) ==> { case ((x, _), z) => Aop("*", x, z):AExp } | Fa
// Factors: a parenthesised expression, an array read id[expr], a variable
// or a number. The array-read alternative is listed before the plain
// variable alternative.
lazy val Fa: Parser[String, AExp] =
  ("(" ~ AExp ~ ")") ==> { case ((_, y), _) => y } |
  (IdParser ~ "[" ~ AExp ~ "]") ==> { case (((x, _), y), _) => Ref(x, y) } |
  IdParser ==> Var |
  NumParser ==> Num
333 |
334 |
// boolean expressions
// Boolean expressions: comparisons of two arithmetic expressions, the
// constants true/false, or a parenthesised boolean expression.
// "a > b" is represented as Bop("<", b, a), so only "=", "!=" and "<" reach
// the code generator.
lazy val BExp: Parser[String, BExp] =
  (AExp ~ "=" ~ AExp) ==> { case ((x, _), z) => Bop("=", x, z):BExp } |
  (AExp ~ "!=" ~ AExp) ==> { case ((x, _), z) => Bop("!=", x, z):BExp } |
  (AExp ~ "<" ~ AExp) ==> { case ((x, _), z) => Bop("<", x, z):BExp } |
  (AExp ~ ">" ~ AExp) ==> { case ((x, _), z) => Bop("<", z, x):BExp } |
  ("true" ==> ((_) => True:BExp )) |
  ("false" ==> ((_) => False:BExp )) |
  ("(" ~ BExp ~ ")") ==> { case ((_, y), _) => y}
343 |
// Single statements: skip, assignment, array assignment, if-then-else,
// while-do, array declaration ("new id[num]") and write.
// The nested tuple patterns mirror the left-nested results of `~`; only the
// components that carry information are bound.
lazy val Stmt: Parser[String, Stmt] =
  ("skip" ==> (_ => Skip: Stmt)) |
  (IdParser ~ ":=" ~ AExp) ==> { case ((x, _), z) => Assign(x, z): Stmt } |
  (IdParser ~ "[" ~ AExp ~ "]" ~ ":=" ~ AExp) ==> {
    case (((((x, _), z), _), _), u) => AssignA(x, z, u): Stmt } |
  ("if" ~ BExp ~ "then" ~ Block ~ "else" ~ Block) ==>
    { case (((((_, y), _), u), _), w) => If(y, u, w): Stmt } |
  ("while" ~ BExp ~ "do" ~ Block) ==> { case (((_, y), _), w) => While(y, w) } |
  ("new" ~ IdParser ~ "[" ~ NumParser ~ "]") ==> { case ((((_, y), _), u), _) => Array(y, u) } |
  ("write" ~ IdParser) ==> { case (_, y) => Write(y) }
354 |
// Statement sequences: one or more statements separated by ";".
lazy val Stmts: Parser[String, Block] =
  (Stmt ~ ";" ~ Stmts) ==> { case ((x, _), z) => x :: z : Block } |
  (Stmt ==> ((s) => List(s) : Block))
358 |
359 |
// Blocks: either a brace-enclosed statement sequence or a single statement,
// which is wrapped into a one-element list.
lazy val Block: Parser[String, Block] =
  ("{" ~ Stmts ~ "}") ==> { case ((_, y), _) => y} |
  (Stmt ==> (s => List(s)))
363 |
364 |
365 |
366 |
367 |
368 |
369 |
370 |
371 |
// Fibonacci program in concrete WHILE syntax. All whitespace is removed
// before parsing, so the layout below is for readability only.
val fib = """
   n := 10;
   minus1 := 0;
   minus2 := 1;

   while (n > 0) do {
          temp := minus2;
          minus2 := minus1 + minus2;
          minus1 := temp;
          n := n - 1};
   result := minus2;
   write result
   """.replaceAll("\\s+", "")
385 |
386 |
val fib_prog = Stmts.parse_all(fib).toList
387 |
//compile_run(fib_prog.head, "fib")
388 |
389 |
390 |
// BF
391 |
392 |
// simple instructions
// Translates one BF command character into WHILE source text.
// Characters that are not BF commands (and ',', which is not supported)
// translate to the empty string.
def instr(c: Char) : String = c match {
  case '>' => "ptr := ptr + 1;"
  case '<' => "ptr := ptr - 1;"
  case '+' => "field[ptr] := field[ptr] + 1;"
  case '-' => "field[ptr] := field[ptr] - 1;"
  case '.' => "x := field[ptr]; write x;"
  //case ',' => "XXX" // "ptr = getchar();\n"
  case '[' => "while (field[ptr] != 0) do {"
  // "skip" gives the loop body a final statement after the trailing ";"
  case ']' => "skip};"
  case _ => ""
}
404 |
405 |
def instrs(prog: String) : String =
406 |
407 |
408 |
// Run-length encodes cs onto the accumulator acc.
//   cs  - characters still to be processed
//   acc - runs found so far, most recent run first
// Returns the runs in REVERSE order of occurrence; each pair is
// (character, length of the run). Annotated as tail-recursive so that long
// programs cannot overflow the stack.
@scala.annotation.tailrec
def splice(cs: List[Char], acc: List[(Char, Int)]) : List[(Char, Int)] = cs match {
  case Nil => acc
  case c :: rest => acc match {
    // same character as the current run: extend it
    case (d, n) :: done if c == d => splice(rest, (c, n + 1) :: done)
    // first character overall, or a different one: start a new run
    case _ => splice(rest, (c, 1) :: acc)
  }
}

// Run-length encodes the string s, runs in order of occurrence.
def spl(s: String) = splice(s.toList, Nil).reverse
418 |
// Translates a run of n identical BF command characters into WHILE source text.
//   c - the BF command character
//   n - length of the run
// Pointer moves and cell updates are folded into one statement with operand
// n; output and brackets are repeated n times. The '.' case previously
// emitted a single write regardless of n, so a run such as ".." printed only once.
// Characters that are not BF commands (and ',', which is not supported)
// translate to the empty string.
def instr2(c: Char, n: Int) : String = c match {
  case '>' => "ptr := ptr + " + n.toString + ";"
  case '<' => "ptr := ptr - " + n.toString + ";"
  case '+' => "field[ptr] := field[ptr] + " + n.toString + ";"
  case '-' => "field[ptr] := field[ptr] - " + n.toString + ";"
  case '.' => "x := field[ptr]; write x;" * n
  //case ',' => "*ptr = getchar();\n" * n
  case '[' => "while (field[ptr] != 0) do {" * n
  case ']' => "skip};" * n
  case _ => ""
}
430 |
// Translates a whole BF program to WHILE source text: the program is
// run-length encoded with spl and each run is translated with instr2.
def instrs2(prog: String) : String =
  (for ((c, n) <- spl(prog)) yield instr2(c, n)).mkString
433 |
434 |
435 |
def bf_str(prog: String) : String = {
436 |
"\n" ++
437 |
//"new field[30000];\n" ++
438 |
"ptr := 15000;" ++
439 |
instrs2(prog) ++
440 |
441 |
442 |
// Translates the BF program `prog` to WHILE, parses it, and compiles and runs
// it under the class name `name`, printing a progress line before each phase.
//   prog - BF source text
//   name - class name handed to compile_run
// Throws NoSuchElementException if parsing yields no result.
def bf_run(prog: String, name: String) = {
  println("BF processing start")
  val bf_string = bf_str(prog).replaceAll("\\s", "")
  println(s"BF parsing start (string length ${bf_string.length})")
  // Same exception type as the former bare `.head`, but with a message that
  // names the actual problem.
  val bf_prog = Stmts.parse_all(bf_string).toList.headOption.getOrElse(
    throw new NoSuchElementException("BF program could not be parsed as a WHILE program"))
  println("BF Compile start")
  // the 30000-element array `field` is declared ahead of the translated program
  compile_run(Array("field", 30000) :: bf_prog, name)
}
451 |
452 |
453 |
454 |
val bf1 = """++++++++[>+>++++<<-]>++>>+<[-[>>+<<-]+>>]>+[-<<<[
455 |
456 |
457 |
458 |
bf_run(bf1, "sier")
459 |
460 |
461 |
..+++.>>.<-.<.+++.------.--------.>>+.>++.""", "hello")
462 |
463 |
464 |
465 |
466 |
467 |
468 |
469 |
470 |
471 |
472 |
473 |
[-]]<<[>>+>+<<<-]>>>[<<<+>>>-]<<[<+>-]>[<+>-]<<<-]""", "fibs")