pep-material: cws/cw05.tex@21c69dc3dbf7 (annotated)

251 3dd550b9b0e3 updated Christian Urban <urbanc@in.tum.de> parents: 247 diff changeset	1	% !TEX program = xelatex
6 aae256985251 updated Christian Urban <urbanc@in.tum.de> parents: diff changeset	2	\documentclass{article}
62 2151c77e1e24 updated Christian Urban <urbanc@in.tum.de> parents: 6 diff changeset	3	\usepackage{../style}
78 85f2f75abeeb updated Christian Urban <urbanc@in.tum.de> parents: 75 diff changeset	4	\usepackage{../langs}
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	5	\usepackage{disclaimer}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	6	\usepackage{tikz}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	7	\usepackage{pgf}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	8	\usepackage{pgfplots}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	9	\usepackage{stackengine}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	10	%% \usepackage{accents}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	11	\newcommand\barbelow[1]{\stackunder[1.2pt]{#1}{\raisebox{-4mm}{\boldmath$\uparrow$}}}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	12
6 aae256985251 updated Christian Urban <urbanc@in.tum.de> parents: diff changeset	13
aae256985251 updated Christian Urban <urbanc@in.tum.de> parents: diff changeset	14	\begin{document}
aae256985251 updated Christian Urban <urbanc@in.tum.de> parents: diff changeset	15
241 c650a91db720 updated Christian Urban <urbanc@in.tum.de> parents: 237 diff changeset	16	\section*{Coursework 10 (Scala)}
6 aae256985251 updated Christian Urban <urbanc@in.tum.de> parents: diff changeset	17
229 5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	18	This coursework is worth 10\%. It is about a small programming
5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	19	language called brainf***. The first part is due on 13 December at
5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	20	11pm; the second, more advanced part, is due on 20 December at
5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	21	11pm.\bigskip
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	22
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	23	\IMPORTANT{}
62 2151c77e1e24 updated Christian Urban <urbanc@in.tum.de> parents: 6 diff changeset	24
2151c77e1e24 updated Christian Urban <urbanc@in.tum.de> parents: 6 diff changeset	25	\noindent
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	26	Also note that the running time of each part will be restricted to a
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	27	maximum of 30 seconds on my laptop.
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	28
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	29	\DISCLAIMER{}
86 f8a781322499 updated Christian Urban <urbanc@in.tum.de> parents: 79 diff changeset	30
230 bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	31	\subsection*{Reference Implementation}
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	32
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	33	As usual, this Scala assignment comes with a reference implementation in the form of
241 c650a91db720 updated Christian Urban <urbanc@in.tum.de> parents: 237 diff changeset	34	two \texttt{jar}-files. You can download them from KEATS. They allow you to run any
230 bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	35	test cases on your own computer. For example you can call Scala on the command line with the
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	36	option \texttt{-cp bf.jar} and then query any function from the
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	37	\texttt{bf.scala} template file. You have to
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	38	prefix the calls with \texttt{CW10a} and \texttt{CW10b}, respectively. For example
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	39
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	40
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	41	\begin{lstlisting}[language={},xleftmargin=1mm,numbers=none,basicstyle=\ttfamily\small]
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	42	$ scala -cp bf.jar
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	43	scala> import CW10a._
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	44	scala> run(load_bff("sierpinski.bf"))
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	45	*
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	46	* *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	47	* *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	48	* * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	49	* *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	50	* * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	51	* * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	52	* * * * * * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	53	* *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	54	* * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	55	* * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	56	* * * * * * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	57	* * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	58	* * * * * * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	59	* * * * * * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	60	* * * * * * * * * * * * * * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	61	* *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	62	* * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	63	* * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	64	* * * * * * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	65	* * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	66	* * * * * * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	67	* * * * * * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	68	* * * * * * * * * * * * * * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	69	* * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	70	* * * * * * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	71	* * * * * * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	72	* * * * * * * * * * * * * * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	73	* * * * * * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	74	* * * * * * * * * * * * * * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	75	* * * * * * * * * * * * * * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	76	* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * *
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	77	\end{lstlisting}%$
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	78
6 aae256985251 updated Christian Urban <urbanc@in.tum.de> parents: diff changeset	79
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	80
229 5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	81	\subsection*{Part 1 (6 Marks)}
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	82
229 5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	83	Coming from Java or C++, you might think Scala is a rather esoteric
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	84	programming language. But remember, some serious companies have built
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	85	their business on
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	86	Scala.\footnote{\url{https://en.wikipedia.org/wiki/Scala_(programming_language)\#Companies}}
230 bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	87	I claim functional programming is not a fad. And there are far, far
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	88	more esoteric languages out there. One is called \emph{brainf***}. You
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	89	are asked in this part to implement an interpreter for
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	90	this language.
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	91
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	92	Urban M\"uller developed brainf*** in 1993. A close relative of this
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	93	language was already introduced in 1964 by Corrado B\"ohm, an Italian
229 5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	94	computer pioneer. The main feature of brainf*** is its minimalistic
5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	95	set of instructions---just 8 instructions in total and all of which
5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	96	are single characters. Despite the minimalism, this language has been
5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	97	shown to be Turing complete\ldots{}if this doesn't ring any bell with
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	98	you: it roughly means that every(!) algorithm can, in principle,
229 5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	99	be implemented in brainf***. It just takes a lot of determination and
5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	100	quite a lot of memory resources. Some relatively sophisticated sample
5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	101	programs in brainf*** are given in the file \texttt{bf.scala}, including
247 50a3b874008a updated Christian Urban <urbanc@in.tum.de> parents: 241 diff changeset	102	a brainf*** program for the Sierpinski triangle and the Mandelbrot set.
50a3b874008a updated Christian Urban <urbanc@in.tum.de> parents: 241 diff changeset	103	There seems to be even a dedicated Windows IDE for bf programs, though
50a3b874008a updated Christian Urban <urbanc@in.tum.de> parents: 241 diff changeset	104	I am not sure whether this is just an elaborate April fools' joke---judge
50a3b874008a updated Christian Urban <urbanc@in.tum.de> parents: 241 diff changeset	105	yourself:
50a3b874008a updated Christian Urban <urbanc@in.tum.de> parents: 241 diff changeset	106
50a3b874008a updated Christian Urban <urbanc@in.tum.de> parents: 241 diff changeset	107	\begin{center}
50a3b874008a updated Christian Urban <urbanc@in.tum.de> parents: 241 diff changeset	108	\url{https://www.microsoft.com/en-us/p/brainf-ck/9nblgggzhvq5}
50a3b874008a updated Christian Urban <urbanc@in.tum.de> parents: 241 diff changeset	109	\end{center}
50a3b874008a updated Christian Urban <urbanc@in.tum.de> parents: 241 diff changeset	110
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	111
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	112	\noindent
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	113	As mentioned above, brainf*** has 8 single-character commands, namely
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	114	\texttt{'>'}, \texttt{'<'}, \texttt{'+'}, \texttt{'-'}, \texttt{'.'},
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	115	\texttt{','}, \texttt{'['} and \texttt{']'}. Every other character is
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	116	considered a comment. Brainf*** operates on memory cells containing
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	117	integers. For this it uses a single memory pointer that points at each
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	118	stage to one memory cell. This pointer can be moved forward by one
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	119	memory cell by using the command \texttt{'>'}, and backward by using
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	120	\texttt{'<'}. The commands \texttt{'+'} and \texttt{'-'} increase,
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	121	respectively decrease, by 1 the content of the memory cell to which
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	122	the memory pointer currently points. The commands for input/output
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	123	are \texttt{','} and \texttt{'.'}. Output works by reading the content
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	124	of the memory cell to which the memory pointer points and printing
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	125	it out as an ASCII character. Input works the other way, taking some
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	126	user input and storing it in the cell to which the memory pointer
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	127	points. The commands \texttt{'['} and \texttt{']'} are looping
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	128	constructs. Everything in between \texttt{'['} and \texttt{']'} is
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	129	repeated until a counter (memory cell) reaches zero. A typical
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	130	program in brainf*** looks as follows:
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	131
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	132	\begin{center}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	133	\begin{verbatim}
230 bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	134	++++++++[>++++[>++>+++>+++>+<<<<-]>+>+>->>+[<]<-]>>.>---.++
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	135	+++++..+++.>>.<-.<.+++.------.--------.>>+.>++.
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	136	\end{verbatim}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	137	\end{center}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	138
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	139	\noindent
230 bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	140	This one prints out Hello World\ldots{}obviously ;o)
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	141
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	142	\subsubsection*{Tasks (file bf.scala)}
109 293ea84d82ca updated Christian Urban <urbanc@in.tum.de> parents: 105 diff changeset	143
293ea84d82ca updated Christian Urban <urbanc@in.tum.de> parents: 105 diff changeset	144	\begin{itemize}
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	145	\item[(1)] Write a function that takes a filename (a string) as an argument
229 5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	146	and requests the corresponding file from disk. It returns the
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	147	content of the file as a string. If the file does not exist,
229 5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	148	the function should return the empty string.\\
5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	149	\mbox{}\hfill[1 Mark]
5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	150
5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	151	\item[(2)] Brainf*** memory is represented by a \texttt{Map} from
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	152	integers to integers. The empty memory is represented by
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	153	\texttt{Map()}, that is nothing is stored in the
229 5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	154	memory; \texttt{Map(0 -> 1, 2 -> 3)} stores \texttt{1} at
5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	155	memory location \texttt{0}, and at \texttt{2} it stores \texttt{3}. The
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	156	convention is that if we query the memory at a location that is
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	157	\emph{not} defined in the \texttt{Map}, we return \texttt{0}. Write
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	158	a function, \texttt{sread}, that takes a memory (a \texttt{Map}) and
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	159	a memory pointer (an \texttt{Int}) as arguments, and `safely' reads the
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	160	corresponding memory location. If the \texttt{Map} is not defined at
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	161	the memory pointer, \texttt{sread} returns \texttt{0}.
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	162
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	163	Write another function \texttt{write}, which takes a memory, a
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	164	memory pointer and an integer value as arguments and updates the
db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	165	\texttt{Map} with the value at the given memory location. As usual,
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	166	the \texttt{Map} is not updated `in-place' but a new map is created
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	167	with the same data, except the new value is stored at the given memory
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	168	pointer.\hfill[1 Mark]
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	169
229 5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	170	\item[(3)] Write two functions, \texttt{jumpRight} and
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	171	\texttt{jumpLeft}, that are needed to implement the loop constructs
db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	172	in brainf***. They take a program (a \texttt{String}) and a program
db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	173	counter (an \texttt{Int}) as arguments and move right (respectively
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	174	left) in the string in order to find the \textbf{matching}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	175	opening/closing bracket. For example, given the following program
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	176	with the program counter indicated by an arrow:
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	177
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	178	\begin{center}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	179	\texttt{--[\barbelow{.}.+>--],>,++}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	180	\end{center}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	181
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	182	then the matching closing bracket is in 9th position (counting from 0) and
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	183	\texttt{jumpRight} is supposed to return the position just after this
109 293ea84d82ca updated Christian Urban <urbanc@in.tum.de> parents: 105 diff changeset	184
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	185	\begin{center}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	186	\texttt{--[..+>--]\barbelow{,}>,++}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	187	\end{center}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	188
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	189	meaning it jumps to after the loop. Similarly, if you are in 8th position,
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	190	then \texttt{jumpLeft} is supposed to jump to just after the opening
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	191	bracket (that is jumping to the beginning of the loop):
109 293ea84d82ca updated Christian Urban <urbanc@in.tum.de> parents: 105 diff changeset	192
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	193	\begin{center}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	194	\texttt{--[..+>-\barbelow{-}],>,++}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	195	\qquad$\stackrel{\texttt{jumpLeft}}{\longrightarrow}$\qquad
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	196	\texttt{--[\barbelow{.}.+>--],>,++}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	197	\end{center}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	198
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	199	Unfortunately we have to take into account that there might be
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	200	other opening and closing brackets on the `way' to find the
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	201	matching bracket. For example in the brainf*** program
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	202
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	203	\begin{center}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	204	\texttt{--[\barbelow{.}.[+>]--],>,++}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	205	\end{center}
109 293ea84d82ca updated Christian Urban <urbanc@in.tum.de> parents: 105 diff changeset	206
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	207	we do not want to return the index for the \texttt{'-'} in the 9th
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	208	position, but the program counter for \texttt{','} in 12th
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	209	position. The easiest way to find out whether a bracket is matched is by
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	210	using levels (which are the third argument in \texttt{jumpRight} and
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	211	\texttt{jumpLeft}). In case of \texttt{jumpRight} you increase the
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	212	level by one whenever you find an opening bracket and decrease by
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	213	one for a closing bracket. Then in \texttt{jumpRight} you are looking
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	214	for the closing bracket on level \texttt{0}. For \texttt{jumpLeft} you
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	215	do the opposite. In this way you can find \textbf{matching} brackets
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	216	in strings such as
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	217
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	218	\begin{center}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	219	\texttt{--[\barbelow{.}.[[-]+>[.]]--],>,++}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	220	\end{center}
109 293ea84d82ca updated Christian Urban <urbanc@in.tum.de> parents: 105 diff changeset	221
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	222	for which \texttt{jumpRight} should produce the position:
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	223
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	224	\begin{center}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	225	\texttt{--[..[[-]+>[.]]--]\barbelow{,}>,++}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	226	\end{center}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	227
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	228	It is also possible that the position returned by \texttt{jumpRight} or
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	229	\texttt{jumpLeft} is outside the string in cases where there are
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	230	no matching brackets. For example
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	231
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	232	\begin{center}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	233	\texttt{--[\barbelow{.}.[[-]+>[.]]--,>,++}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	234	\qquad$\stackrel{\texttt{jumpRight}}{\longrightarrow}$\qquad
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	235	\texttt{--[..[[-]+>[.]]--,>,++\barbelow{\;\phantom{+}}}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	236	\end{center}
229 5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	237	\hfill[2 Marks]
109 293ea84d82ca updated Christian Urban <urbanc@in.tum.de> parents: 105 diff changeset	238
293ea84d82ca updated Christian Urban <urbanc@in.tum.de> parents: 105 diff changeset	239
230 bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	240	\item[(4)] Write a recursive function \texttt{compute} that runs a
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	241	brainf*** program. It takes a program, a program counter, a memory
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	242	pointer and a memory as arguments. If the program counter is outside
230 bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	243	the program string, the execution stops and \texttt{compute} returns the
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	244	memory. If the program counter is inside the string, it reads the
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	245	corresponding character and updates the program counter \texttt{pc},
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	246	memory pointer \texttt{mp} and memory \texttt{mem} according to the
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	247	rules shown in Figure~\ref{comms}. It then calls recursively
230 bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	248	\texttt{compute} with the updated data. The most convenient way to
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	249	implement the brainf*** rules in Scala is to use pattern-matching
bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	250	and to calculate a triple consisting of the updated \texttt{pc},
229 5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	251	\texttt{mp} and \texttt{mem}.
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	252
230 bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	253	Write another function \texttt{run} that calls \texttt{compute} with a
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	254	given brainf*** program and memory, and the program counter and memory pointer
230 bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	255	set to~$0$. Like \texttt{compute}, it returns the memory after the execution
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	256	of the program finishes. You can test your brainf**k interpreter with the
229 5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	257	Sierpinski triangle or the Hello world programs (they seem to be particularly
5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	258	useful for debugging purposes), or have a look at
109 293ea84d82ca updated Christian Urban <urbanc@in.tum.de> parents: 105 diff changeset	259
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	260	\begin{center}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	261	\url{https://esolangs.org/wiki/Brainfuck}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	262	\end{center}\hfill[2 Marks]
109 293ea84d82ca updated Christian Urban <urbanc@in.tum.de> parents: 105 diff changeset	263
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	264	\begin{figure}[p]
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	265	\begin{center}
230 bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	266	\begin{tabular}{|@{\hspace{0.5mm}}p{0.8cm}|l|}
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	267	\hline
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	268	\hfill\texttt{'>'} & \begin{tabular}[t]{@{}l@{\hspace{2mm}}l@{}}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	269	$\bullet$ & $\texttt{pc} + 1$\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	270	$\bullet$ & $\texttt{mp} + 1$\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	271	$\bullet$ & \texttt{mem} unchanged
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	272	\end{tabular}\\\hline
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	273	\hfill\texttt{'<'} & \begin{tabular}[t]{@{}l@{\hspace{2mm}}l@{}}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	274	$\bullet$ & $\texttt{pc} + 1$\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	275	$\bullet$ & $\texttt{mp} - 1$\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	276	$\bullet$ & \texttt{mem} unchanged
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	277	\end{tabular}\\\hline
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	278	\hfill\texttt{'+'} & \begin{tabular}[t]{@{}l@{\hspace{2mm}}l@{}}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	279	$\bullet$ & $\texttt{pc} + 1$\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	280	$\bullet$ & $\texttt{mp}$ unchanged\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	281	$\bullet$ & \texttt{mem} updated with \texttt{mp -> mem(mp) + 1}\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	282	\end{tabular}\\\hline
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	283	\hfill\texttt{'-'} & \begin{tabular}[t]{@{}l@{\hspace{2mm}}l@{}}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	284	$\bullet$ & $\texttt{pc} + 1$\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	285	$\bullet$ & $\texttt{mp}$ unchanged\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	286	$\bullet$ & \texttt{mem} updated with \texttt{mp -> mem(mp) - 1}\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	287	\end{tabular}\\\hline
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	288	\hfill\texttt{'.'} & \begin{tabular}[t]{@{}l@{\hspace{2mm}}l@{}}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	289	$\bullet$ & $\texttt{pc} + 1$\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	290	$\bullet$ & $\texttt{mp}$ and \texttt{mem} unchanged\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	291	$\bullet$ & print out \,\texttt{mem(mp)} as a character\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	292	\end{tabular}\\\hline
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	293	\hfill\texttt{','} & \begin{tabular}[t]{@{}l@{\hspace{2mm}}l@{}}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	294	$\bullet$ & $\texttt{pc} + 1$\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	295	$\bullet$ & $\texttt{mp}$ unchanged\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	296	$\bullet$ & \texttt{mem} updated with \texttt{mp -> \textrm{input}}\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	297	\multicolumn{2}{@{}l}{the input is given by \texttt{Console.in.read().toByte}}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	298	\end{tabular}\\\hline
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	299	\hfill\texttt{'['} & \begin{tabular}[t]{@{}l@{\hspace{2mm}}l@{}}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	300	\multicolumn{2}{@{}l}{if \texttt{mem(mp) == 0} then}\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	301	$\bullet$ & $\texttt{pc = jumpRight(prog, pc + 1, 0)}$\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	302	$\bullet$ & $\texttt{mp}$ and \texttt{mem} unchanged\medskip\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	303	\multicolumn{2}{@{}l}{otherwise if \texttt{mem(mp) != 0} then}\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	304	$\bullet$ & $\texttt{pc} + 1$\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	305	$\bullet$ & $\texttt{mp}$ and \texttt{mem} unchanged\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	306	\end{tabular}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	307	\\\hline
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	308	\hfill\texttt{']'} & \begin{tabular}[t]{@{}l@{\hspace{2mm}}l@{}}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	309	\multicolumn{2}{@{}l}{if \texttt{mem(mp) != 0} then}\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	310	$\bullet$ & $\texttt{pc = jumpLeft(prog, pc - 1, 0)}$\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	311	$\bullet$ & $\texttt{mp}$ and \texttt{mem} unchanged\medskip\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	312	\multicolumn{2}{@{}l}{otherwise if \texttt{mem(mp) == 0} then}\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	313	$\bullet$ & $\texttt{pc} + 1$\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	314	$\bullet$ & $\texttt{mp}$ and \texttt{mem} unchanged\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	315	\end{tabular}\\\hline
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	316	any other char & \begin{tabular}[t]{@{}l@{\hspace{2mm}}l@{}}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	317	$\bullet$ & $\texttt{pc} + 1$\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	318	$\bullet$ & \texttt{mp} and \texttt{mem} unchanged
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	319	\end{tabular}\\
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	320	\hline
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	321	\end{tabular}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	322	\end{center}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	323	\caption{The rules for how commands in the brainf*** language update the program counter \texttt{pc},
230 bebe34c975a8 updated Christian Urban <urbanc@in.tum.de> parents: 229 diff changeset	324	the memory pointer \texttt{mp} and the memory \texttt{mem}.\label{comms}}
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	325	\end{figure}
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	326	\end{itemize}\bigskip
22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	327
233 38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	328	\newpage
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	329
229 5549016ab10f updated Christian Urban <urbanc@in.tum.de> parents: 221 diff changeset	330	\subsection*{Part 2 (4 Marks)}
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	331
233 38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	332	I am sure you agree that while it is fun to look at bf-programs, like the
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	333	Sierpinski triangle or the Mandelbrot program, being interpreted, it
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	334	is much more fun to write a compiler for the bf-language.
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	335
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	336
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	337	\subsubsection*{Tasks (file bfc.scala)}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	338
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	339	\begin{itemize}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	340	\item[(5)] Compilers in general attempt to make programs run
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	341	faster by precomputing as much information as possible
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	342	before running the program. In our case we can precompute the
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	343	addresses where we need to jump at the beginning and end of
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	344	loops.
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	345
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	346	For this write a function \texttt{jtable} that precomputes the ``jump
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	347	table'' for a bf-program. This function takes a bf-program
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	348	as an argument and returns a \texttt{Map[Int, Int]}. The
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	349	purpose of this Map is to record, for every pc-position
db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	350	that points to a '\texttt{[}' or a '\texttt{]}',
db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	351	the pc-position we need to jump to next.
233 38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	352
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	353	For example for the program
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	354
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	355	\begin{center}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	356	\texttt{+++++[->++++++++++<]>--<+++[->>++++++++++}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	357	\texttt{<<]>>++<<----------[+>.>.<+<]}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	358	\end{center}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	359
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	360	we obtain the Map (note the precise numbers might differ depending on white
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	361	spaces etc.~in the bf-program):
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	362
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	363	\begin{center}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	364	\texttt{Map(69 -> 61, 5 -> 20, 60 -> 70, 27 -> 44, 43 -> 28, 19 -> 6)}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	365	\end{center}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	366
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	367	This Map states that for the '\texttt{[}' on position 5, we need to
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	368	jump to position 20, which is just after the corresponding '\texttt{]}'.
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	369	Similarly, for the '\texttt{]}' on position 19, we need to jump to
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	370	position 6, which is just after the '\texttt{[}' on position 5, and so
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	371	on. The idea is to not calculate this information each time
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	372	we hit a bracket, but just look up this information in the
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	373	\texttt{jtable}.
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	374
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	375	Then adapt the \texttt{compute} and \texttt{run} functions
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	376	from Part 1 in order to take advantage of the information
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	377	stored in the \texttt{jtable}. This means whenever \texttt{jumpLeft}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	378	or \texttt{jumpRight} was called previously, you should look
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	379	up the jump address in the \texttt{jtable}. Feel free to reuse
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	380	the functions \texttt{jumpLeft} and \texttt{jumpRight} for
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	381	calculating the \texttt{jtable}.\hfill{[1 Mark]}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	382
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	383	\item[(6)] Compilers try to eliminate any ``dead'' code that could
db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	384	slow down programs and also perform what is often called
db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	385	\emph{peephole
db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	386	optimisations}.\footnote{\url{https://en.wikipedia.org/wiki/Peephole_optimization}}
db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	387	For the latter consider that it is difficult for compilers to
241 c650a91db720 updated Christian Urban <urbanc@in.tum.de> parents: 237 diff changeset	388	comprehend what is intended with whole programs, but they are very good
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	389	at finding out what small snippets of code do, and then try to
db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	390	generate faster code for such snippets.
233 38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	391
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	392	In our case, dead code is everything that is not a bf-command.
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	393	Therefore write a function \texttt{optimise} which deletes such
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	394	dead code from a bf-program. Moreover this function should replace every substring
233 38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	395	of the form \pcode{[-]} by a new command \texttt{0}.
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	396	The idea is that the loop \pcode{[-]} just resets the
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	397	memory at the current location to 0. It is more efficient
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	398	to do this in a single step, rather than stepwise in a loop as in
233 38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	399	the original bf-programs.
218 22705d22c105 updated Christian Urban <urbanc@in.tum.de> parents: 111 diff changeset	400
233 38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	401	In the extended \texttt{compute3} and \texttt{run3} functions you should
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	402	implement this command by writing 0 to \pcode{mem(mp)}, that is use
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	403	\pcode{write(mem, mp, 0)} as the rule for the command \texttt{0}.
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	404	The easiest way to modify a string in this way is to use the regular
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	405	expression \pcode{"""[^<>+-.,\\[\\]]"""}, which recognises everything that is
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	406	not a bf-command. Similarly, the
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	407	regular expression \pcode{"""\\[-\\]"""} finds all occurrences of \pcode{[-]}. By using the Scala method \pcode{.replaceAll} you can replace substrings
db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	408	with new strings.\\
db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	409	\mbox{}\hfill{[1 Mark]}
233 38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	410
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	411	\item[(7)] Finally, real compilers try to take advantage of CPUs which often
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	412	provide complex operations in hardware that can combine many smaller
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	413	instructions into a single faster instruction.
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	414
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	415	In our case we can optimise the several single increments performed at a
233 38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	416	memory cell, for example \pcode{++++}, by a single ``increment by
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	417	4''. For this optimisation we just have to make sure these single
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	418	increments are all next to each other. Similar optimisations should apply
233 38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	419	for the bf-commands \pcode{-}, \pcode{<} and
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	420	\pcode{>}, which can all be replaced by extended versions that take
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	421	the amount of the increment (decrement) into account. We will do
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	422	this by introducing two-character bf-commands. For example
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	423
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	424	\begin{center}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	425	\begin{tabular}{l|l}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	426	original bf-cmds & replacement\\
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	427	\hline
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	428	\pcode{+} & \pcode{+A}\\
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	429	\pcode{++} & \pcode{+B}\\
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	430	\pcode{+++} & \pcode{+C}\\
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	431	\ldots{} & \ldots{}\\
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	432	\pcode{+++....++} & \pcode{+Z}\\
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	433	\hspace{5mm}(these are 26 \pcode{+}'s)\\
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	434	\end{tabular}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	435	\end{center}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	436
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	437
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	438	If there are more
db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	439	than 26 \pcode{+}'s in a row, then more than one ``two-character''
233 38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	440	bf-command needs to be generated (the idea is that more than
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	441	26 copies of a single bf-command in a row is a rare occurrence in
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	442	actual bf-programs). Similar replacements apply
db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	443	for \pcode{-}, \pcode{<} and \pcode{>}, but
db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	444	all other bf-commands should be unaffected by this
233 38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	445	change.
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	446
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	447	For this write a function \texttt{combine} which replaces sequences
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	448	of repeated increment and decrement commands by appropriate
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	449	two-character commands. In the functions \pcode{compute4} and
233 38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	450	\pcode{run4}, the ``combine'' and the optimisation from (6) should
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	451	be performed. Make sure that when a two-character bf-command is
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	452	encountered you increase the \pcode{pc}-counter by two in
237 db4d2fcd8063 updated Christian Urban <urbanc@in.tum.de> parents: 234 diff changeset	453	order to progress to the next command. For example
233 38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	454
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	455	\begin{center}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	456	\pcode{combine(optimise(load_bff("benchmark.bf")))}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	457	\end{center}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	458
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	459	generates the improved program
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	460
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	461	\begin{center}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	462	\pcode{>A+B[<A+M>A-A]<A[[}\hspace{3mm}\ldots{}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	463	\end{center}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	464
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	465	for the original benchmark program
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	466
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	467	\begin{center}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	468	\pcode{>++[<+++++++++++++>-]<[[}\hspace{3mm}\ldots
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	469	\end{center}
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	470
241 c650a91db720 updated Christian Urban <urbanc@in.tum.de> parents: 237 diff changeset	471	As you can see, the compiler bets on saving a lot of time on the
c650a91db720 updated Christian Urban <urbanc@in.tum.de> parents: 237 diff changeset	472	\pcode{+B} and \pcode{+M} steps so that the optimisation is
233 38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	473	worthwhile overall (of course for the \pcode{>A}'s and so on, the compiler incurs a
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	474	penalty). Luckily, after you have performed all
38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	475	optimisations in (5)--(7), you can expect that the
234 c51305a2217f updated Christian Urban <urbanc@in.tum.de> parents: 233 diff changeset	476	\pcode{benchmark.bf} program runs four to five times faster.
c51305a2217f updated Christian Urban <urbanc@in.tum.de> parents: 233 diff changeset	477	You can also test whether your compiler produces the correct result
c51305a2217f updated Christian Urban <urbanc@in.tum.de> parents: 233 diff changeset	478	by for example testing
c51305a2217f updated Christian Urban <urbanc@in.tum.de> parents: 233 diff changeset	479
c51305a2217f updated Christian Urban <urbanc@in.tum.de> parents: 233 diff changeset	480	\begin{center}
c51305a2217f updated Christian Urban <urbanc@in.tum.de> parents: 233 diff changeset	481	\pcode{run(load_bff("sierpinski.bf")) == run4(load_bff("sierpinski.bf"))}
c51305a2217f updated Christian Urban <urbanc@in.tum.de> parents: 233 diff changeset	482	\end{center}
c51305a2217f updated Christian Urban <urbanc@in.tum.de> parents: 233 diff changeset	483
c51305a2217f updated Christian Urban <urbanc@in.tum.de> parents: 233 diff changeset	484	which should return true for all the different compiler stages. \\
c51305a2217f updated Christian Urban <urbanc@in.tum.de> parents: 233 diff changeset	485	\mbox{}\hfill{[2 Marks]}
233 38ea26f227af updated Christian Urban <urbanc@in.tum.de> parents: 230 diff changeset	486	\end{itemize}
6 aae256985251 updated Christian Urban <urbanc@in.tum.de> parents: diff changeset	487
aae256985251 updated Christian Urban <urbanc@in.tum.de> parents: diff changeset	488	\end{document}
aae256985251 updated Christian Urban <urbanc@in.tum.de> parents: diff changeset	489
68 8da9e0c16194 updated Christian Urban <urbanc@in.tum.de> parents: 62 diff changeset	490
6 aae256985251 updated Christian Urban <urbanc@in.tum.de> parents: diff changeset	491	%%% Local Variables:
aae256985251 updated Christian Urban <urbanc@in.tum.de> parents: diff changeset	492	%%% mode: latex
aae256985251 updated Christian Urban <urbanc@in.tum.de> parents: diff changeset	493	%%% TeX-master: t
aae256985251 updated Christian Urban <urbanc@in.tum.de> parents: diff changeset	494	%%% End:

author	Christian Urban <urbanc@in.tum.de>
	Sat, 02 Feb 2019 13:35:07 +0000 (2019-02-02)
changeset 262	21c69dc3dbf7
parent 251	3dd550b9b0e3
child 268	e43f7e92ba26
permissions	-rw-r--r--