| author | Christian Urban <christian.urban@kcl.ac.uk> | 
| Sun, 01 Oct 2023 12:04:51 +0100 | |
| changeset 932 | c54e0c472891 | 
| parent 918 | 19a5d332cb49 | 
| child 933 | 4d9674598682 | 
| permissions | -rw-r--r-- | 
| 630 | 1 | % !TEX program = xelatex | 
| 178 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 2 | \documentclass{article}
 | 
| 275 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 3 | \usepackage{../style}
 | 
| 216 
f5ec7c597c5b
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
200diff
changeset | 4 | \usepackage{../langs}
 | 
| 918 | 5 | \usepackage[normalem]{ulem}
 | 
| 178 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 6 | |
| 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 7 | \begin{document}
 | 
| 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 8 | |
| 748 | 9 | \section*{Coursework 2}
 | 
| 198 
f54972b0f641
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
182diff
changeset | 10 | |
| 835 | 11 | \noindent This coursework is worth 10\% and is due on \cwTWO{} at
 | 
| 877 | 12 | 16:00. You are asked to implement the Sulzmann \& Lu lexer for the | 
| 748 | 13 | WHILE language. You can do the implementation in any programming | 
| 14 | language you like, but you need to submit the source code with which | |
| 15 | you answered the questions, otherwise a mark of 0\% will be | |
| 918 | 16 | awarded. You need to submit your written | 
| 17 | answers as pdf---see attached questionnaire. Code should be sent as code. If you use | |
| 18 | Scala in your code, a good place to start is the file \texttt{re3.sc}
 | |
| 19 | that is uploaded to Github. | |
| 180 
50e8dcd95ae3
added cw
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
179diff
changeset | 20 | |
| 750 | 21 | \subsection*{Disclaimer\alert}
 | 
| 178 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 22 | |
| 358 
b3129cff41e9
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
333diff
changeset | 23 | It should be understood that the work you submit represents | 
| 918 | 24 | your own effort. You have not copied from anyone else | 
| 25 | including CoPilot, ChatGPT \& Co. An | |
| 363 
0d6deecdb2eb
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
358diff
changeset | 26 | exception is the Scala code from KEATS and the code I showed | 
| 419 
4110ab35e5d8
updated courseworks
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
396diff
changeset | 27 | during the lectures, which you can both freely use. You can | 
| 918 | 28 | also use your own code from CW~1. | 
| 29 | %But do not | |
| 30 | %be tempted to ask Github Copilot for help or do any other | |
| 31 | %shenanigans like this! | |
| 178 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 32 | |
| 419 
4110ab35e5d8
updated courseworks
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
396diff
changeset | 33 | \subsection*{Question 1}
 | 
| 178 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 34 | |
| 419 
4110ab35e5d8
updated courseworks
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
396diff
changeset | 35 | To implement a lexer for the WHILE language, you first | 
| 358 
b3129cff41e9
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
333diff
changeset | 36 | need to design the appropriate regular expressions for the | 
| 748 | 37 | following eleven syntactic entities: | 
| 178 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 38 | |
| 180 
50e8dcd95ae3
added cw
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
179diff
changeset | 39 | \begin{enumerate}
 | 
| 
50e8dcd95ae3
added cw
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
179diff
changeset | 40 | \item keywords are | 
| 
50e8dcd95ae3
added cw
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
179diff
changeset | 41 | |
| 748 | 42 | \begin{center}
 | 
| 275 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 43 | \texttt{while}, 
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 44 | \texttt{if}, 
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 45 | \texttt{then}, 
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 46 | \texttt{else}, 
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 47 | \texttt{do}, 
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 48 | \texttt{for}, 
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 49 | \texttt{to}, 
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 50 | \texttt{true}, 
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 51 | \texttt{false}, 
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 52 | \texttt{read}, 
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 53 | \texttt{write},
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 54 | \texttt{skip}
 | 
| 748 | 55 | \end{center} 
 | 
| 180 
50e8dcd95ae3
added cw
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
179diff
changeset | 56 | |
| 748 | 57 | \item operators are: | 
| 275 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 58 | \texttt{+}, 
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 59 | \texttt{-}, 
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 60 | \texttt{*}, 
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 61 | \texttt{\%},
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 62 | \texttt{/},
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 63 | \texttt{==}, 
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 64 | \texttt{!=}, 
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 65 | \texttt{>}, 
 | 
| 748 | 66 | \texttt{<},
 | 
| 67 | \texttt{<=}, 
 | |
| 68 | \texttt{>=},
 | |
| 275 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 69 | \texttt{:=},
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 70 | \texttt{\&\&},
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 71 | \texttt{||}
 | 
| 748 | 72 | |
| 73 | \item letters are uppercase and lowercase | |
| 180 
50e8dcd95ae3
added cw
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
179diff
changeset | 74 | |
| 748 | 75 | \item symbols are letters plus the characters | 
| 76 |   \texttt{.},
 | |
| 77 |   \texttt{\_},
 | |
| 78 |   \texttt{>},
 | |
| 79 |   \texttt{<},
 | |
| 80 |   \texttt{=},
 | |
| 81 |   \texttt{;},
 | |
| 850 | 82 |   \texttt{,} (comma),
 | 
| 833 | 83 |   \texttt{$\backslash$} and
 | 
| 748 | 84 |   \texttt{:}
 | 
| 85 | ||
| 850 | 86 | \item strings are enclosed by double quotes, like \texttt{"\ldots"}, and consist of
 | 
| 748 | 87 | symbols, whitespaces and digits | 
| 180 
50e8dcd95ae3
added cw
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
179diff
changeset | 88 | \item parentheses are \texttt{(}, \texttt{\{}, \texttt{)} and \texttt{\}}
 | 
| 
50e8dcd95ae3
added cw
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
179diff
changeset | 89 | \item there are semicolons \texttt{;}
 | 
| 447 
68769db65185
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
428diff
changeset | 90 | \item whitespaces are either \texttt{" "} (one or more) or \texttt{$\backslash$n} or
 | 
| 845 | 91 |   \texttt{$\backslash$t} or \texttt{$\backslash$r}
 | 
| 180 
50e8dcd95ae3
added cw
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
179diff
changeset | 92 | \item identifiers are letters followed by underscores \texttt{\_\!\_}, letters
 | 
| 
50e8dcd95ae3
added cw
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
179diff
changeset | 93 | or digits | 
| 396 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 94 | \item numbers are \pcode{0}, \pcode{1}, \ldots and so on; give 
 | 
| 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 95 | a regular expression that can recognise \pcode{0}, but not numbers 
 | 
| 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 96 | with leading zeroes, such as \pcode{001}
 | 
| 748 | 97 | \item comments start with \texttt{//} and contain symbols, spaces and digits until the end of the line
 | 
| 180 
50e8dcd95ae3
added cw
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
179diff
changeset | 98 | \end{enumerate}
 | 
| 178 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 99 | |
| 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 100 | \noindent | 
| 275 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 101 | You can use the basic regular expressions | 
| 178 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 102 | |
| 275 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 103 | \[ | 
| 419 
4110ab35e5d8
updated courseworks
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
396diff
changeset | 104 | \ZERO,\; \ONE,\; c,\; r_1 + r_2,\; r_1 \cdot r_2,\; r^* | 
| 275 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 105 | \] | 
| 178 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 106 | |
| 275 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 107 | \noindent | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 108 | but also the following extended regular expressions | 
| 182 
9ce2414e470e
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
181diff
changeset | 109 | |
| 
9ce2414e470e
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
181diff
changeset | 110 | \begin{center}
 | 
| 275 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 111 | \begin{tabular}{ll}
 | 
| 494 | 112 | $[c_1,c_2,\ldots,c_n]$ & a set of characters\\ | 
| 275 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 113 | $r^+$ & one or more times $r$\\ | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 114 | $r^?$ & optional $r$\\ | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 115 | $r^{\{n\}}$ & $n$-times $r$\\
 | 
| 182 
9ce2414e470e
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
181diff
changeset | 116 | \end{tabular}
 | 
| 
9ce2414e470e
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
181diff
changeset | 117 | \end{center}
 | 
| 
9ce2414e470e
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
181diff
changeset | 118 | |
| 458 | 119 | \noindent | 
| 473 | 120 | Later on you will also need the record regular expression: | 
| 458 | 121 | |
| 122 | \begin{center}
 | |
| 123 | \begin{tabular}{ll}
 | |
| 124 | $REC(x:r)$ & record regular expression\\ | |
| 125 | \end{tabular}
 | |
| 126 | \end{center}
 | |
| 127 | ||
| 396 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 128 | \noindent Try to design your regular expressions to be as | 
| 494 | 129 | small as possible. For example you should use character sets | 
| 130 | for identifiers and numbers. Feel free to use the general | |
| 131 | character constructor \textit{CFUN} introduced in CW 1.
 | |
| 275 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 132 | |
| 419 
4110ab35e5d8
updated courseworks
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
396diff
changeset | 133 | \subsection*{Question 2}
 | 
| 275 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 134 | |
| 419 
4110ab35e5d8
updated courseworks
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
396diff
changeset | 135 | Implement the Sulzmann \& Lu lexer from the lectures. For | 
| 358 
b3129cff41e9
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
333diff
changeset | 136 | this you need to implement the functions $nullable$ and $der$ | 
| 369 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 137 | (you can use your code from CW~1), as well as $mkeps$ and | 
| 358 
b3129cff41e9
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
333diff
changeset | 138 | $inj$. These functions need to be appropriately extended for | 
| 918 | 139 | the extended regular expressions from Q1. Write down in the | 
| 140 | questionnaire at the end the | |
| 369 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 141 | clauses for | 
| 275 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 142 | |
| 369 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 143 | \begin{center}
 | 
| 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 144 | \begin{tabular}{@ {}l@ {\hspace{2mm}}c@ {\hspace{2mm}}l@ {}}
 | 
| 494 | 145 | $mkeps([c_1,c_2,\ldots,c_n])$ & $\dn$ & $?$\\ | 
| 369 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 146 | $mkeps(r^+)$ & $\dn$ & $?$\\ | 
| 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 147 | $mkeps(r^?)$ & $\dn$ & $?$\\ | 
| 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 148 | $mkeps(r^{\{n\}})$             & $\dn$ & $?$\medskip\\
 | 
| 494 | 149 | $inj\, ([c_1,c_2,\ldots,c_n])\,c\,\ldots$ & $\dn$ & $?$\\ | 
| 369 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 150 | $inj\, (r^+)\,c\,\ldots$ & $\dn$ & $?$\\ | 
| 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 151 | $inj\, (r^?)\,c\,\ldots$ & $\dn$ & $?$\\ | 
| 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 152 | $inj\, (r^{\{n\}})\,c\,\ldots$             & $\dn$ & $?$\\
 | 
| 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 153 | \end{tabular}
 | 
| 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 154 | \end{center}
 | 
| 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 155 | |
| 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 156 | \noindent where $inj$ takes three arguments: a regular | 
| 396 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 157 | expression, a character and a value. Test your lexer code | 
| 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 158 | with at least the two small examples below: | 
| 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 159 | |
| 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 160 | \begin{center}
 | 
| 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 161 | \begin{tabular}{ll}
 | 
| 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 162 | regex: & string:\smallskip\\ | 
| 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 163 | $a^{\{3\}}$ & $aaa$\\
 | 
| 458 | 164 | $(a + \ONE)^{\{3\}}$ & $aa$
 | 
| 396 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 165 | \end{tabular}
 | 
| 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 166 | \end{center}
 | 
| 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 167 | |
| 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 168 | |
| 598 | 169 | \noindent Both strings should be successfully lexed by the | 
| 396 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 170 | respective regular expression, that means the lexer returns | 
| 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 171 | in both examples a value. | 
| 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 172 | |
| 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 173 | |
| 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 174 | Also add the record regular expression from the | 
| 419 
4110ab35e5d8
updated courseworks
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
396diff
changeset | 175 | lectures to your lexer and implement a function, say | 
| 396 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 176 | \pcode{env}, that returns all assignments from a value (such
 | 
| 
4cd75c619e06
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
395diff
changeset | 177 | that you can easily extract the tokens from a value).\medskip | 
| 369 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 178 | |
| 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 179 | \noindent | 
| 384 
4629448c1bd9
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
369diff
changeset | 180 | Finally give the tokens for your regular expressions from Q1 and the | 
| 369 
43c0ed473720
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
364diff
changeset | 181 | string | 
| 275 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 182 | |
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 183 | \begin{center}
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 184 | \code{"read n;"}
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 185 | \end{center} 
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 186 | |
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 187 | \noindent | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 188 | and use your \pcode{env} function to give the token sequence.
 | 
| 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 189 | |
| 333 
8890852e18b7
updated coursework
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
328diff
changeset | 190 | |
| 419 
4110ab35e5d8
updated courseworks
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
396diff
changeset | 191 | \subsection*{Question 3}
 | 
| 275 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 192 | |
| 748 | 193 | Extend your lexer from Q2 to also simplify regular expressions after | 
| 194 | each derivation step and rectify the computed values after each | |
| 419 
4110ab35e5d8
updated courseworks
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
396diff
changeset | 195 | injection. Use this lexer to tokenize the programs in | 
| 748 | 196 | Figures~\ref{fib}--\ref{collatz}. You can also find the programs on
 | 
| 197 | KEATS. Give the tokens of these programs where whitespaces are | |
| 198 | filtered out. Make sure you can tokenise \textbf{exactly} these
 | |
| 199 | programs.\bigskip | |
| 182 
9ce2414e470e
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
181diff
changeset | 200 | |
| 178 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 201 | |
| 578 | 202 | \begin{figure}[h]
 | 
| 860 | 203 | \mbox{\lstinputlisting[language=While,xleftmargin=10mm]{../cwtests/cw02/fib.while}}
 | 
| 181 
1f98d215df71
added material
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
180diff
changeset | 204 | \caption{Fibonacci program in the WHILE language.\label{fib}}
 | 
| 
1f98d215df71
added material
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
180diff
changeset | 205 | \end{figure}
 | 
| 178 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 206 | |
| 578 | 207 | \begin{figure}[h]
 | 
| 860 | 208 | \mbox{\lstinputlisting[language=While,xleftmargin=10mm]{../cwtests/cw02/loops.while}}
 | 
| 275 
618c7640cf66
updated
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
216diff
changeset | 209 | \caption{The three-nested-loops program in the WHILE language. 
 | 
| 578 | 210 | (Usually used for timing measurements.)\label{loop}}
 | 
| 181 
1f98d215df71
added material
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
180diff
changeset | 211 | \end{figure}
 | 
| 178 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 212 | |
| 659 | 213 | \begin{figure}[h]
 | 
| 860 | 214 | \mbox{\lstinputlisting[language=While,xleftmargin=10mm]{../cwtests/cw02/factors.while}}
 | 
| 659 | 215 | \caption{A program that calculates factors for numbers in the WHILE
 | 
| 216 |   language.\label{factors}}
 | |
| 217 | \end{figure}
 | |
| 218 | ||
| 748 | 219 | \begin{figure}[h]
 | 
| 220 | \mbox{\lstinputlisting[language=While,xleftmargin=10mm]{../progs/while-tests/collatz2.while}}
 | |
| 221 | \caption{A program that calculates the Collatz series for numbers
 | |
| 222 |   between 1 and 100.\label{collatz}}
 | |
| 223 | \end{figure}
 | |
| 224 | ||
| 918 | 225 | \clearpage | 
| 226 | \newpage | |
| 227 | \section*{Answers}
 | |
| 228 | ||
| 229 | \mbox{}
 | |
| 230 | ||
| 231 | \noindent | |
| 232 | \textbf{Question 2:}
 | |
| 233 | ||
| 234 | \begin{center}
 | |
| 235 |   \def\arraystretch{1.6}  
 | |
| 236 | \begin{tabular}{@ {}l@ {\hspace{2mm}}c@ {\hspace{2mm}}l@ {}}
 | |
| 237 | $mkeps([c_1,c_2,\ldots,c_n])$  & $\dn$ & \uline{\hspace{8cm}}\\
 | |
| 238 | $mkeps(r^+)$                   & $\dn$ & \uline{\hspace{8cm}}\\
 | |
| 239 | $mkeps(r^?)$                   & $\dn$ & \uline{\hspace{8cm}}\\
 | |
| 240 | $mkeps(r^{\{n\}})$             & $\dn$ & \uline{\hspace{8cm}}\bigskip\\
 | |
| 241 | $inj\, ([c_1,c_2,\ldots,c_n])\,c\,\ldots$  & $\dn$ & \uline{\hspace{8cm}}\\
 | |
| 242 | $inj\, (r^+)\,c\,\ldots$                   & $\dn$ & \uline{\hspace{8cm}}\\
 | |
| 243 | $inj\, (r^?)\,c\,\ldots$                   & $\dn$ & \uline{\hspace{8cm}}\\
 | |
| 244 | $inj\, (r^{\{n\}})\,c\,\ldots$             & $\dn$ & \uline{\hspace{8cm}}\\
 | |
| 245 | \end{tabular}
 | |
| 246 | \end{center}\bigskip
 | |
| 247 | ||
| 248 | \noindent | |
| 249 | Tokens for \code{"read n;"}\\
 | |
| 250 | ||
| 251 | \noindent | |
| 252 | \uline{\hfill}\medskip
 | |
| 253 | ||
| 254 | \noindent | |
| 255 | \uline{\hfill}\medskip
 | |
| 256 | ||
| 257 | \noindent | |
| 258 | \uline{\hfill}\medskip
 | |
| 259 | ||
| 260 | \noindent | |
| 261 | \uline{\hfill}\medskip
 | |
| 262 | ||
| 263 | ||
| 178 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 264 | \end{document}
 | 
| 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 265 | |
| 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 266 | %%% Local Variables: | 
| 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 267 | %%% mode: latex | 
| 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 268 | %%% TeX-master: t | 
| 
d36363d648e3
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 269 | %%% End: |