cws/cw05.tex
author Christian Urban <christian.urban@kcl.ac.uk>
Fri, 24 Oct 2025 10:45:17 +0100
changeset 1017 b0d44eb1ecc7
parent 992 c3dd3a98f919
permissions -rw-r--r--
updated
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
630
9b1c15c3eb6f updated
Christian Urban <urbanc@in.tum.de>
parents: 567
diff changeset
     1
% !TEX program = xelatex
200
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
     2
\documentclass{article}
299
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 298
diff changeset
     3
\usepackage{../style}
865
bc2a862a00d4 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 858
diff changeset
     4
\usepackage{../graphicss}
216
f5ec7c597c5b updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 214
diff changeset
     5
\usepackage{../langs}
873
a25da86f7c8c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 868
diff changeset
     6
\definecolor{navyblue}{rgb}{0.0, 0.0, 0.5}
a25da86f7c8c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 868
diff changeset
     7
\definecolor{pansypurple}{rgb}{0.47, 0.09, 0.29}
200
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
     8
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
     9
\begin{document}
873
a25da86f7c8c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 868
diff changeset
    10
a25da86f7c8c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 868
diff changeset
    11
959
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    12
%\color{pansypurple}
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    13
%\section*{RESIT / REPLACEMENT}
917
89e05a230d2d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 905
diff changeset
    14
959
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    15
%{\bf
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    16
%The resit / replacement task is essentially CW5 (listed below) with
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    17
%the exception that the lexer and parser is already provided. The
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    18
%parser will generate an AST (see file \texttt{fun\_llvm.sc}). Your task
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    19
%is to generate an AST for the K-intermediate language and supply
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    20
%sufficient type annotations such that you can generate valid code for
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    21
%the LLVM-IR. The submission deadline is 4th August at 16:00. At the
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    22
%deadline, please send me an email containing a zip-file with your
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    23
%files.
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    24
%Feel free to reuse the files I have uploaded on KEATS (especially
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    25
%the files generating simple LLVM-IR code). Of help might also be the
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    26
%videos of Week~10.\bigskip
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    27
%
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    28
%\noindent
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    29
%Good Luck!}\smallskip\\
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    30
%\noindent
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    31
%Christian
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    32
%\color{black}
873
a25da86f7c8c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 868
diff changeset
    33
200
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
    34
836
a3418ee8c404 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 821
diff changeset
    35
\section*{Coursework 5}
200
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
    36
722
14914b57e207 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 719
diff changeset
    37
14914b57e207 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 719
diff changeset
    38
989
aa976b429904 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 988
diff changeset
    39
\noindent This coursework is worth 20\% and is due on \cwFIVE{} at
877
43460c7b2010 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 875
diff changeset
    40
16:00. You are asked to implement a compiler targeting the LLVM-IR.
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
    41
Be aware that this CW needs some material about the LLVM-IR
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
    42
that has not been shown in the lectures and your own experiments
959
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    43
and research might be required. You can find information about the LLVM-IR at
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
    44
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
    45
\begin{itemize}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
    46
\item \url{https://bit.ly/3rheZYr}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
    47
\item \url{https://llvm.org/docs/LangRef.html}  
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
    48
\end{itemize}  
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
    49
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
    50
\noindent
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
    51
You can do the implementation of your compiler in any programming
748
383f2a5952ce updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 722
diff changeset
    52
language you like, but you need to submit the source code with which
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
    53
you generated the LLVM-IR files, otherwise a mark of 0\% will be
853
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
    54
awarded. You are asked to submit the code of your compiler, but also
858
13a6eb21706b updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 857
diff changeset
    55
the generated \texttt{.ll} files. No PDF is needed for this
13a6eb21706b updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 857
diff changeset
    56
coursework.  You should use the lexer and parser from the previous
13a6eb21706b updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 857
diff changeset
    57
courseworks, but you need to make some modifications to them for the
13a6eb21706b updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 857
diff changeset
    58
`typed' version of the Fun-language. I will award up to 5\% if a lexer
959
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    59
and a parser are correctly implemented.
853
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
    60
959
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    61
%At the end, please package
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    62
%everything(!) in a zip-file that creates a directory with the name
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    63
%
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    64
%\begin{center}
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    65
%\texttt{YournameYourFamilyname}
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    66
%\end{center}
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    67
%
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    68
%\noindent
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    69
%on my end.
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    70
You will be marked according to the input files
855
1c0a684567d7 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 853
diff changeset
    71
1c0a684567d7 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 853
diff changeset
    72
\begin{itemize}
987
ad5ad452223c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 959
diff changeset
    73
\item\href{https://cflmark.nms.kcl.ac.uk/hg/afl-material/raw-file/tip/progs/sqr.fun}{sqr.fun}  
ad5ad452223c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 959
diff changeset
    74
\item\href{https://cflmark.nms.kcl.ac.uk/hg/afl-material/raw-file/tip/progs/fact.fun}{fact.fun}
ad5ad452223c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 959
diff changeset
    75
\item\href{https://cflmark.nms.kcl.ac.uk/hg/afl-material/raw-file/tip/progs/mand.fun}{mand.fun}
ad5ad452223c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 959
diff changeset
    76
\item\href{https://cflmark.nms.kcl.ac.uk/hg/afl-material/raw-file/tip/progs/mand2.fun}{mand2.fun}
ad5ad452223c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 959
diff changeset
    77
\item\href{https://cflmark.nms.kcl.ac.uk/hg/afl-material/raw-file/tip/progs/hanoi.fun}{hanoi.fun}   
855
1c0a684567d7 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 853
diff changeset
    78
\end{itemize}  
1c0a684567d7 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 853
diff changeset
    79
1c0a684567d7 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 853
diff changeset
    80
\noindent
959
64ec1884d860 updated and added pascal.while file
Christian Urban <christian.urban@kcl.ac.uk>
parents: 943
diff changeset
    81
which are uploaded to KEATS and GitHub.
200
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
    82
750
e93a9e74ca8e updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 748
diff changeset
    83
\subsection*{Disclaimer\alert}
358
b3129cff41e9 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 333
diff changeset
    84
750
e93a9e74ca8e updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 748
diff changeset
    85
It should be understood that the work you submit represents your own
e93a9e74ca8e updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 748
diff changeset
    86
effort. You have not copied from anyone else. An exception is the
e93a9e74ca8e updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 748
diff changeset
    87
Scala code I showed during the lectures or uploaded to KEATS, which
992
c3dd3a98f919 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 989
diff changeset
    88
you can use. You can also use your own code from CW~1 --
987
ad5ad452223c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 959
diff changeset
    89
CW~4. %But do not
ad5ad452223c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 959
diff changeset
    90
%be tempted to ask Github Copilot for help or do any other
ad5ad452223c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 959
diff changeset
    91
%shenanigans like this!
200
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
    92
299
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 298
diff changeset
    93
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
    94
\subsection*{Task}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
    95
992
c3dd3a98f919 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 989
diff changeset
    96
The goal is to lex and parse five Fun-programs, including the
853
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
    97
Mandelbrot program shown in Figure~\ref{mand}, and generate
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
    98
corresponding code for the LLVM-IR. Unfortunately the calculations for
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
    99
the Mandelbrot Set require floating point arithmetic and therefore we
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   100
cannot be as simple-minded about types as we have been so far
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   101
(remember the LLVM-IR is a fully-typed language and needs to know the
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   102
exact types of each expression). The idea is to deal appropriately
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   103
with three types, namely \texttt{Int}, \texttt{Double} and
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   104
\texttt{Void} (they are represented in the LLVM-IR as \texttt{i32},
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   105
\texttt{double} and \texttt{void}). You need to extend the lexer and
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   106
parser accordingly in order to deal with type annotations. The
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   107
Fun-language includes global constants, such as
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   108
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   109
\begin{lstlisting}[numbers=none]
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   110
  val Ymin: Double = -1.3;
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   111
  val Maxiters: Int = 1000;
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   112
\end{lstlisting}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   113
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   114
\noindent
858
13a6eb21706b updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 857
diff changeset
   115
where you can assume that they are `normal' identifiers, just
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   116
starting with a capital letter---all other identifiers should have
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   117
lower-case letters. Function definitions can take arguments of
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   118
type \texttt{Int} or \texttt{Double}, and need to specify a return
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   119
type, which can be \texttt{Void}, for example
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   120
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   121
\begin{lstlisting}[numbers=none]
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   122
  def foo(n: Int, x: Double) : Double = ...
853
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   123
  def id(n: Int) : Int = ...
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   124
  def bar() : Void = ...
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   125
\end{lstlisting}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   126
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   127
\noindent
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   128
The idea is to record all typing information that is given
853
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   129
in the Fun-program, but then delay any further type inference until
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   130
after the CPS-translation. That means the parser should
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   131
generate ASTs given by the Scala datatypes:
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   132
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   133
\begin{lstlisting}[numbers=none,language=Scala]
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   134
abstract class Exp 
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   135
abstract class BExp  
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   136
abstract class Decl 
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   137
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   138
case class Def(name: String, args: List[(String, String)],
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   139
               ty: String, body: Exp) extends Decl
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   140
case class Main(e: Exp) extends Decl
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   141
case class Const(name: String, v: Int) extends Decl
868
8fb3b6d3be70 updated to Doubles trhoughout
Christian Urban <christian.urban@kcl.ac.uk>
parents: 865
diff changeset
   142
case class FConst(name: String, x: Double) extends Decl
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   143
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   144
case class Call(name: String, args: List[Exp]) extends Exp
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   145
case class If(a: BExp, e1: Exp, e2: Exp) extends Exp
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   146
case class Var(s: String) extends Exp
853
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   147
case class Num(i: Int) extends Exp     // integer numbers
868
8fb3b6d3be70 updated to Doubles trhoughout
Christian Urban <christian.urban@kcl.ac.uk>
parents: 865
diff changeset
   148
case class FNum(i: Double) extends Exp  // floating numbers
857
2b11eb06af76 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 855
diff changeset
   149
case class ChConst(c: Int) extends Exp // char constants
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   150
case class Aop(o: String, a1: Exp, a2: Exp) extends Exp
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   151
case class Sequence(e1: Exp, e2: Exp) extends Exp
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   152
case class Bop(o: String, a1: Exp, a2: Exp) extends BExp
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   153
\end{lstlisting}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   154
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   155
\noindent
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   156
This datatype distinguishes whether the global constant is an integer
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   157
constant or floating constant. Also a function definition needs to
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   158
record the return type of the function, namely the argument
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   159
\texttt{ty} in \texttt{Def}, and the arguments consist of pairs of
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   160
identifier names and types (\texttt{Int} or \texttt{Double}). The hard
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   161
part of the CW is to design the K-intermediate language and infer all
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   162
necessary types in order to generate LLVM-IR code. You can check
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   163
your LLVM-IR code by running it with the interpreter \texttt{lli}.
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   164
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   165
\begin{figure}[t]
857
2b11eb06af76 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 855
diff changeset
   166
\lstinputlisting[language=Scala]{../cwtests/cw05/mand.fun}
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   167
\caption{The Mandelbrot program in the `typed' Fun-language.\label{mand}}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   168
\end{figure}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   169
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   170
\begin{figure}[t]
943
5365ef60707e updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 917
diff changeset
   171
\includegraphics[scale=0.35]{../solutions/cw5/out.png}
865
bc2a862a00d4 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 858
diff changeset
   172
\caption{ASCII output of the Mandelbrot program.\label{mand2}}
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   173
\end{figure}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   174
853
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   175
Also note that the second version of the Mandelbrot program and also
858
13a6eb21706b updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 857
diff changeset
   176
the Tower of Hanoi program use character constants, like \texttt{'a'},
853
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   177
\texttt{'1'}, \texttt{'$\backslash$n'} and so on. When they are tokenised,
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   178
such characters should be interpreted as the corresponding ASCII code (an
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   179
integer), such that we can use them in calculations like \texttt{'a' + 10}
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   180
where the result should be 107. As usual, the character \texttt{'$\backslash$n'} is the
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   181
ASCII code 10.
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   182
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   183
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   184
\subsection*{LLVM-IR}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   185
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   186
There are some subtleties in the LLVM-IR you need to be aware of:
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   187
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   188
\begin{itemize}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   189
\item \textbf{Global constants}: While global constants such as
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   190
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   191
\begin{lstlisting}[numbers=none]  
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   192
val Max : Int = 10;
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   193
\end{lstlisting}
200
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   194
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   195
\noindent
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   196
can be easily defined in the LLVM-IR as follows
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   197
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   198
\begin{lstlisting}[numbers=none]  
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   199
@Max = global i32 10
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   200
\end{lstlisting}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   201
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   202
\noindent
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   203
they cannot easily be referenced. If you want to use
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   204
this constant then you need to generate code such as
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   205
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   206
\begin{lstlisting}[numbers=none]  
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   207
%tmp_22 = load i32, i32* @Max
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   208
\end{lstlisting}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   209
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   210
\noindent
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   211
first, which treats \texttt{@Max} as an Integer-pointer (type
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   212
\texttt{i32*}) that needs to be loaded into a local variable,
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   213
here \texttt{\%tmp\_22}.
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   214
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   215
\item \textbf{Void-Functions}: While integer and double functions
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   216
  can easily be called and their results can be allocated to a
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   217
  temporary variable:
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   218
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   219
  \begin{lstlisting}[numbers=none]  
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   220
   %tmp_23 = call i32 @sqr (i32 %n)
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   221
  \end{lstlisting}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   222
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   223
  void-functions cannot be allocated to a variable. They need to be
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   224
  called just as
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   225
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   226
  \begin{lstlisting}[numbers=none]  
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   227
  call void @print_int (i32 %tmp_23)
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   228
\end{lstlisting}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   229
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   230
\item \textbf{Floating-Point Operations}: While integer operations
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   231
  are specified in the LLVM-IR as
201
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 200
diff changeset
   232
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   233
  \begin{lstlisting}[numbers=none,language=Scala]
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   234
  def compile_op(op: String) = op match {
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   235
    case "+" => "add i32 "
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   236
    case "*" => "mul i32 "
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   237
    case "-" => "sub i32 "
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   238
    case "==" => "icmp eq i32 "
853
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   239
    case "!=" => "icmp ne i32 "
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   240
    case "<=" => "icmp sle i32 " // signed less or equal
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   241
    case "<"  => "icmp slt i32 " // signed less than
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   242
  }\end{lstlisting}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   243
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   244
  the corresponding operations on doubles are
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   245
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   246
  \begin{lstlisting}[numbers=none,language=Scala]
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   247
  def compile_dop(op: String) = op match {
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   248
    case "+" => "fadd double "
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   249
    case "*" => "fmul double "
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   250
    case "-" => "fsub double "
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   251
    case "==" => "fcmp oeq double "
853
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   252
    case "!=" => "fcmp one double "
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   253
    case "<=" => "fcmp ole double "   
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   254
    case "<"  => "fcmp olt double "   
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   255
  }\end{lstlisting}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   256
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   257
\item \textbf{Typing}: In order to leave the CPS-translations
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   258
  as is, it makes sense to defer the full type-inference to the
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   259
  K-intermediate-language. For this it is good to define
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   260
  the \texttt{KVar} constructor as
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   261
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   262
\begin{lstlisting}[numbers=none,language=Scala]  
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   263
case class KVar(s: String, ty: Ty = "UNDEF") extends KVal\end{lstlisting}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   264
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   265
  where first a default type, for example \texttt{UNDEF}, is
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   266
  given. Then you need to define two typing functions
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   267
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   268
  \begin{lstlisting}[numbers=none,language=Scala]  
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   269
    def typ_val(v: KVal, ts: TyEnv) = ???
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   270
    def typ_exp(a: KExp, ts: TyEnv) = ???
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   271
  \end{lstlisting}
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   272
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   273
  Both functions require a typing-environment that updates
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   274
  the information about what type each variable, operation
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   275
  and so on receives. Once the types are inferred, the
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   276
  LLVM-IR code can be generated. Since we are dealing only
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   277
  with simple first-order functions, nothing on the scale
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   278
  of the `Hindley-Milner' typing-algorithm is needed. I suggest
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   279
  to just look at what data is available and generate all
836
a3418ee8c404 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 821
diff changeset
   280
  missing information by ``simple means''\ldots rather than
a3418ee8c404 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 821
diff changeset
   281
  looking at the literature which solves the problem
a3418ee8c404 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 821
diff changeset
   282
  with much heavier machinery.
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   283
987
ad5ad452223c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 959
diff changeset
   284
\item \textbf{Built-In Functions}: The `prelude' comes
ad5ad452223c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 959
diff changeset
   285
  with several built-in functions: \texttt{new\_line()},
853
568671822d52 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 836
diff changeset
   286
  \texttt{skip}, \texttt{print\_int(n)}, \texttt{print\_space()},
987
ad5ad452223c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 959
diff changeset
   287
  \texttt{print\_star()} as well as \texttt{print\_char(n)}. You 
ad5ad452223c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 959
diff changeset
   288
  can find the `prelude' for
ad5ad452223c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 959
diff changeset
   289
  example in the file \texttt{sqr.ll}. When printing strings, you 
ad5ad452223c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 959
diff changeset
   290
  can assume programs only contain string \emph{constants} (see
ad5ad452223c updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 959
diff changeset
   291
  for example \texttt{sqr.fun} and \texttt{hanoi.fun}).
820
7fd1f611c21d updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 752
diff changeset
   292
\end{itemize}  
205
0b59588d28d2 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 204
diff changeset
   293
200
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   294
\end{document}
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   295
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   296
%%% Local Variables: 
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   297
%%% mode: latex
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   298
%%% TeX-master: t
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   299
%%% End: