pep-material: changeset 498:0f1b97538ad4

Binary file cws/core_cw01.pdf has changed

--- a/cws/core_cw01.tex	Mon Nov 10 16:24:46 2025 +0000
+++ b/cws/core_cw01.tex	Thu Nov 13 17:44:58 2025 +0000
@@ -8,7 +8,7 @@
 
 \begin{document}
 
-\section*{Core Part 1 (Scala, 3 Marks)}
+\section*{Core Part 1 (Scala, 1.5 Marks)}
 
 \mbox{}\hfill\textit{``The most effective debugging tool is still careful thought,}\\
 \mbox{}\hfill\textit{coupled with judiciously placed print statements.''}\smallskip\\
@@ -62,7 +62,7 @@
 
 
 \newpage
-\subsection*{Core Part 1 (3 Marks, file collatz.scala)}
+\subsection*{Core Part 1 (1.5 Marks, file collatz.scala)}
 
 This part is about function definitions and recursion. You are asked
 to implement a Scala program that tests examples of the
@@ -118,15 +118,15 @@
   try out this function with large numbers, you should use
   \texttt{Long} as argument type, instead of \texttt{Int}.  You can
   assume this function will be called with numbers between $1$ and
-  $1$ Million. \hfill[1 Mark]
+  $1$ Million. \hfill[0.5 Marks]
 
 \item[(2)] Write a second function that takes an upper bound as
   an argument and calculates the steps for all numbers in the range from
   1 up to this bound (the bound including). It returns the maximum number of
   steps and the corresponding number that needs that many steps.  More
   precisely it returns a pair where the first component is the number
-  of steps and the second is the corresponding number. \hfill\mbox{[1
-    Mark]}
+  of steps and the second is the corresponding number. \hfill\mbox{[0.5
+    Marks]}
 
 \item[(3)] Write a function that calculates \emph{hard
     numbers} \here{https://medium.com/cantors-paradise/the-collatz-conjecture-some-shocking-results-from-180-000-iterations-7fea130d0377}
@@ -149,7 +149,7 @@
   \[113, 340, 170, \,\fbox{85}\,, 256, 128, 64, 32, 16, 8, 4, 2, 1\]
 
   The \textit{last-odd} function will only be called with numbers that are not
-  powers of 2 themselves.\hfill\mbox{[1 Mark]}
+  powers of 2 themselves.\hfill\mbox{[0.5 Mark]}
 \end{itemize}
 
 \noindent

Binary file cws/core_cw02.pdf has changed

--- a/cws/core_cw02.tex	Mon Nov 10 16:24:46 2025 +0000
+++ b/cws/core_cw02.tex	Thu Nov 13 17:44:58 2025 +0000
@@ -9,7 +9,7 @@
 
 %% should ask to lower case the words.
 
-\section*{Core Part 2 (Scala, 3 Marks)}
+\section*{Core Part 2 (Scala, 1.5 Marks)}
 
 \mbox{}\hfill\textit{``What one programmer can do in one month,}\\
 \mbox{}\hfill\textit{two programmers can do in two months.''}\smallskip\\
@@ -66,7 +66,7 @@
 
 
 \newpage
-\subsection*{Core Part 2 (3 Marks, file docdiff.scala)}
+\subsection*{Core Part 2 (1.5  Marks, file docdiff.scala)}
 
 It seems plagiarism---stealing and submitting someone
 else's code---is a serious problem at other
@@ -87,7 +87,7 @@
   \texttt{\textbackslash{}w+} for recognising words and the library function
   \texttt{findAllIn}. The function should return a document (a list of
   strings).
-  \mbox{}\hfill\mbox{[0.5 Marks]}
+  \mbox{}\hfill\mbox{[0.25 Marks]}
 
 \item[(2)] In order to compute the overlap between two documents, we
   associate each document with a \texttt{Map}. This Map represents the
@@ -108,7 +108,7 @@
   \pcode{occurrences(List("d", "b", "d", "b", "d"))}
   \end{center}
 
-  produces \pcode{Map(d -> 3, b -> 2)}.\hfill[1 Mark]
+  produces \pcode{Map(d -> 3, b -> 2)}.\hfill[0.5 Marks]
 
 \item[(3)] You can think of the Maps calculated under (2) as memory-efficient
   representations of sparse ``vectors''. In this subtask you need to
@@ -130,7 +130,7 @@
     \underbrace{1 * 3}_{"d"} \qquad = 7
   \]  
   
-  \hfill\mbox{[1 Mark]}
+  \hfill\mbox{[0.5 Marks]}
 
 \item[(4)] Implement first a function that calculates the overlap
   between two documents, say $d_1$ and $d_2$, according to the formula
@@ -147,7 +147,7 @@
   two strings, by first extracting the substrings using the clean
   function from (1)
   and then calculating the overlap of the resulting documents.\\
-  \mbox{}\hfill\mbox{[0.5 Marks]}
+  \mbox{}\hfill\mbox{[0.25 Marks]}
 \end{itemize}

Binary file cws/core_cw03.pdf has changed

--- a/cws/core_cw03.tex	Mon Nov 10 16:24:46 2025 +0000
+++ b/cws/core_cw03.tex	Thu Nov 13 17:44:58 2025 +0000
@@ -16,7 +16,7 @@
 % BF IDE
 % https://www.microsoft.com/en-us/p/brainf-ck/9nblgggzhvq5
   
-\section*{Core Part 3 (Scala, 3 Marks)}
+\section*{Core Part 3 (Scala, 2 Marks)}
 
 \mbox{}\hfill\textit{``[Google’s MapReduce] abstraction is inspired by the}\\
 \mbox{}\hfill\textit{map and reduce primitives present in Lisp and many}\\
@@ -62,7 +62,7 @@
 \bigskip
 
 
-\subsection*{Core Part (3 Marks, files postfix.scala, postfix2.scala)}
+\subsection*{Core Part (2 Marks, files postfix.scala, postfix2.scala)}
 
 The \textit{Shunting Yard Algorithm} has been developed by Edsger Dijkstra,
 an influential computer scientist who developed many well-known
@@ -159,7 +159,7 @@
   as argument and evaluates it generating an integer as result. It uses a
   stack to evaluate the postfix expression. The operators $+$, $-$, $*$
   are as usual; $/$ is division on integers, for example $7 / 3 = 2$.
-  \hfill[1 Mark]
+  \hfill[0.5 Marks]
 \end{itemize}
 
 \subsubsection*{Task (file postfix2.scala)}
@@ -171,7 +171,7 @@
   other operators are left-associative.  Left-associative operators
   are popped off if the precedence is bigger or equal, while
   right-associative operators are only popped off if the precedence is
-  bigger.\hfill[1 Marks]
+  bigger.\hfill[0.5 Marks]
 \end{itemize}
 
 \end{document}

--- a/cws/disclaimer.sty	Mon Nov 10 16:24:46 2025 +0000
+++ b/cws/disclaimer.sty	Thu Nov 13 17:44:58 2025 +0000
@@ -4,9 +4,9 @@
 \begin{itemize}
 \item #1  
 \item Make sure the files you submit can be processed by just calling\\
-  \mbox{\texttt{scala-cli compile <<filename.scala>>}} on the command line.\footnote{All
+  \mbox{\texttt{scala compile <<filename.scala>>}} on the command line.\footnote{All
     major OSes, including Windows, have a command line. So there is no
-    good reason to not download scala-cli, install it and run it on your
+    good reason to not download scala, install it and run it on your
     own computer. Just do it!} Use the
   template files provided and do not make any changes to arguments of
   functions or to any types. You are free to implement any auxiliary
@@ -37,9 +37,9 @@
 
 \begin{itemize}
 \item Make sure the files you submit can be processed by just calling\\
-  \mbox{\texttt{scala-cli compile <<filename.scala>>}} on the command line.\footnote{All
+  \mbox{\texttt{scala compile <<filename.scala>>}} on the command line.\footnote{All
     major OSes, including Windows, have a command line. So there is no
-    good reason to not download scala-cli, install it and run it on your
+    good reason to not download scala, install it and run it on your
     own computer. Just do it!} Use the
   template files provided and do not make any changes to arguments of
   functions or to any types. You are free to implement any auxiliary
@@ -71,7 +71,7 @@
 
 \begin{itemize}
 \item Make sure the files you submit can be processed by just calling\\
-  \mbox{\texttt{scala-cli compile <<filename.scala>>}} on the command line. Use the
+  \mbox{\texttt{scala compile <<filename.scala>>}} on the command line. Use the
   template file provided and do not make any changes to arguments of
   functions or to any types. You are free to implement any auxiliary
   function you might need.

Binary file cws/main_cw03.pdf has changed

--- a/cws/main_cw03.tex	Mon Nov 10 16:24:46 2025 +0000
+++ b/cws/main_cw03.tex	Thu Nov 13 17:44:58 2025 +0000
@@ -7,6 +7,8 @@
 \usepackage{pgf}
 \usepackage{pgfplots}
 \usepackage{stackengine}
+\usepackage{scalerel}
+\DeclareMathOperator*{\amp}{\scalerel*{\&}{\sum}}
 %% \usepackage{accents}
 \newcommand\barbelow[1]{\stackunder[1.2pt]{#1}{\raisebox{-4mm}{\boldmath$\uparrow$}}}
 
@@ -119,7 +121,7 @@
 % BF IDE
 % https://www.microsoft.com/en-us/p/brainf-ck/9nblgggzhvq5
   
-\section*{Main Part 3 (Scala, 7 Marks)}
+\section*{Main Part 3 (Scala, 6 Marks)}
 
 \mbox{}\hfill\textit{``Java is the most distressing thing to happen to computing since MS-DOS.''}\smallskip\\
 \mbox{}\hfill\textit{ --- Alan Kay, the inventor of object-oriented programming}\bigskip\medskip
@@ -144,7 +146,7 @@
 
 This Scala assignment comes with a reference implementation in form of
 a \texttt{jar}-file. This allows you to run any test cases on your own
-computer. For example you can call \texttt{scala-cli} on the command
+computer. For example you can call \texttt{scala} on the command
 line with the option \texttt{--extra-jars re.jar} and then query any function
 from the \texttt{re.scala} template file. As usual you have to prefix
 the calls with \texttt{M3} or import this object.  Since some tasks
@@ -155,7 +157,7 @@
 
 
 \begin{lstlisting}[xleftmargin=1mm,numbers=none,basicstyle=\ttfamily\small]
-$ scala-cli --extra-jars re.jar
+$ scala --extra-jars re.jar
 scala> import M3._  
 scala> for (i <- 0 to 5000000 by 500000) {
   println(s"$i: ${time_needed(2, matcher(EVIL, "a" * i))}")
@@ -192,9 +194,11 @@
       &   $|$ & $\ONE$      & can only match the empty string\\
       &   $|$ & $c$         & can match a single character (in this case $c$)\\
       &   $|$ & $r_1 + r_2$ & can match a string either with $r_1$ or with $r_2$\\
-  &   $|$ & $r_1\cdot r_2$ & can match the first part of a string with $r_1$ and\\
+      &   $|$ & $r_1\cdot r_2$ & can match the first part of a string with $r_1$ and\\
           &  & & then the second part with $r_2$\\
+      &   $|$ & $r_1 \,\&\, r_2$ & has to match a string with both $r_1$ and $r_2$\\
       &   $|$ & $r^*$       & can match a string with zero or more copies of $r$\\
+      &   $|$ & $r^{\{n\}}$  & can match a string with exactly n copies of $r$\\
 \end{tabular}
 \end{center}
 
@@ -204,7 +208,7 @@
 are endlessly useful for searching, editing and analysing data in all
 sorts of places (for example analysing network traffic in order to
 detect security breaches). However, you need to be fast, otherwise you
-will stumble over problems such as recently reported at
+will stumble over problems such as reported in
 
 {\small
 \begin{itemize}
@@ -231,27 +235,14 @@
   $\ZERO$ & $\mapsto$ & \texttt{ZERO}\\
   $\ONE$  & $\mapsto$ & \texttt{ONE}\\
   $c$     & $\mapsto$ & \texttt{CHAR(c)}\\
-  $\sum rs$ & $\mapsto$ & \texttt{ALTs(rs)}\\  
   $r_1 + r_2$ & $\mapsto$ & \texttt{ALT(r1, r2)} & \texttt{r1 | r2}\\
-  $\prod rs$ & $\mapsto$ & \texttt{SEQs(rs)}\\  
   $r_1 \cdot r_2$ & $\mapsto$ & \texttt{SEQ(r1, r2)} & \texttt{r1 $\sim$ r2}\\
-  $r^*$ & $\mapsto$ &  \texttt{STAR(r)} & \texttt{r.\%}
+  $r_1 \,\&\, r_2$ & $\mapsto$ & \texttt{AND(r1, r2)}\\
+  $r^*$ & $\mapsto$ &  \texttt{STAR(r)} & \texttt{r.\%}\\
+  $r^{\{n\}}$ & $\mapsto$ &  \texttt{REP(r, n)} & 
 \end{tabular}    
 \end{center}  
 
-\noindent
-The alternative regular expression comes in two versions: one is
-binary (+ / \texttt{ALT}) and the other is n-ary ($\sum$ /
-\texttt{ALTs}). The latter takes a list of regular expressions as
-argument.  In what follows we shall use $rs$ to stand for lists of
-regular expressions. When the list is empty, we shall write $\sum\,[]$;
-if it is non-empty, we sometimes write $\sum\,[r_1,..., r_n]$.
-The binary alternative can be seen as an abbreviation,
-that is $r_1 + r_2 \dn \sum\,[r_1, r_2]$. As a result we can ignore the
-binary version and only implement the n-ary alternative. Similarly
-the sequence regular expression is only implemented with lists and the
-binary version can be obtained by defining $r_1 \cdot r_2 \dn \prod\,[r_1, r_2]$.
-
 \begin{itemize}
 \item[(1)] Implement a function, called \textit{nullable}, by
   recursion over regular expressions. This function tests whether a
@@ -265,9 +256,14 @@
 $\textit{nullable}(\ZERO)$ & $\dn$ & $\textit{false}$\\
 $\textit{nullable}(\ONE)$  & $\dn$ & $\textit{true}$\\
 $\textit{nullable}(c)$     & $\dn$ & $\textit{false}$\\
-$\textit{nullable}(\sum rs)$ & $\dn$ & $\exists r \in rs.\;\textit{nullable}(r)$\\
-$\textit{nullable}(\prod rs)$ & $\dn$ & $\forall r\in rs.\;\textit{nullable}(r)$\\
+$\textit{nullable}(r_1 + r_2)$ & $\dn$ & $\textit{nullable}(r_1) \vee  \textit{nullable}(r_2)$\\
+$\textit{nullable}(r_1 \cdot r_2)$ & $\dn$ & $\textit{nullable}(r_1) \wedge  \textit{nullable}(r_2)$\\
+$\textit{nullable}(r_1 \& r_2)$ & $\dn$ & $\textit{nullable}(r_1) \wedge  \textit{nullable}(r_2)$\\
 $\textit{nullable}(r^*)$ & $\dn$ & $\textit{true}$\\
+$\textit{nullable}(r^{\{n\}})$ & $\dn$ & 
+$\begin{cases}\textit{true} & n = 0\\
+\textit{nullable}(r) & \textit{otherwise}
+\end{cases}$\\
 \end{tabular}
 \end{center}~\hfill[0.5 Marks]
 
@@ -281,131 +277,175 @@
 $\textit{der}\;c\;(\ZERO)$ & $\dn$ & $\ZERO$\\
 $\textit{der}\;c\;(\ONE)$  & $\dn$ & $\ZERO$\\
 $\textit{der}\;c\;(d)$     & $\dn$ & $\textit{if}\; c = d\;\textit{then} \;\ONE \; \textit{else} \;\ZERO$\\
-$\textit{der}\;c\;(\sum\;[r_1,..,r_n])$ & $\dn$ & $\sum\;[\textit{der}\;c\;r_1,..,\textit{der}\;c\;r_n]$\\
-$\textit{der}\;c\;(\prod\;[])$ & $\dn$ & $\ZERO$\\  
-$\textit{der}\;c\;(\prod\;r\!::\!rs)$ & $\dn$ & $\textit{if}\;\textit{nullable}(r)$\\
-      & & $\textit{then}\;(\prod\;(\textit{der}\;c\;r)\!::\!rs) + (\textit{der}\;c\;(\prod rs))$\\
-      & & $\textit{else}\;(\prod\;(\textit{der}\;c\;r)\!::\! rs)$\\
+$\textit{der}\;c\;(r_1 + r_2)$ & $\dn$ & $(\textit{der}\;c\;r_1) + (\textit{der}\;c\;r_2)$\\
+$\textit{der}\;c\;(r_1 \& r_2)$ & $\dn$ & $(\textit{der}\;c\;r_1) \,\&\, (\textit{der}\;c\;r_2)$\\
+$\textit{der}\;c\;(r_1 \cdot r_2)$ & $\dn$ & $\textit{if}\;\textit{nullable}(r_1)$\\
+      & & $\textit{then}\;(\textit{der}\;c\;r_1)\cdot r_2 \,+\, (\textit{der}\;c\;r_2)$\\
+      & & $\textit{else}\;(\textit{der}\;c\;r_1)\cdot r_2$\\
 $\textit{der}\;c\;(r^*)$ & $\dn$ & $(\textit{der}\;c\;r)\cdot (r^*)$\\
+$\textit{der}\;c\;(r^{\{n\}})$ & $\dn$ & 
+$\begin{cases}\ZERO & n = 0\\
+(der\,c\,r)\cdot (r^{\{n-1\}}) & \textit{otherwise}
+\end{cases}$\\
 \end{tabular}
 \end{center}
-\mbox{}\hfill\mbox{[1 Mark]}
+\mbox{}\hfill\mbox{[1.5 Marks]}
+
+% \item[(3)] We next want to simplify regular expressions: essentially
+%   we want to remove $\ZERO$ in regular expressions like $r + \ZERO$
+%   and $\ZERO + r$.  However, our n-ary alternative takes a list of
+%   regular expressions as argument, and we therefore need a more general
+%   ``denesting'' function, which deletes $\ZERO$s and ``spills out'' nested
+%   $\sum$s.  This function, called \texttt{denest}, should analyse a
+%   list of regular expressions, say $rs$, as follows:
 
-\item[(3)] We next want to simplify regular expressions: essentially
-  we want to remove $\ZERO$ in regular expressions like $r + \ZERO$
-  and $\ZERO + r$.  However, our n-ary alternative takes a list of
-  regular expressions as argument, and we therefore need a more general
-  ``denesting'' function, which deletes $\ZERO$s and ``spills out'' nested
-  $\sum$s.  This function, called \texttt{denest}, should analyse a
-  list of regular expressions, say $rs$, as follows:
+%   \begin{center}
+%     \begin{tabular}{lllll}
+%       1) &$rs = []$                & $\dn$ & $[]$ & (empty list)\\
+%       2) &$rs = \ZERO :: rest$     & $\dn$ & $\texttt{denest}\;rest$ & (throw away $\ZERO$)\\
+%       3) &$rs = (\sum rs) :: rest$ & $\dn$ & $rs ::: \texttt{denest}\;rest$ & (spill out $\sum$)\\
+%       4) &$rs = r :: rest$         & $\dn$ & $r :: \texttt{denest}\;rest$ & (otherwise)\\
+%     \end{tabular}  
+%   \end{center}  
+
+%   The first clause states that empty lists cannot be further
+%   denested. The second removes the first $\ZERO$ from the list and recurses.
+%   The third is when the first regular expression is an \texttt{ALTs}, then
+%   the content of this alternative should be spilled out and appended
+%   with the denested rest of the list. The last case is for all other
+%   cases where the head of the list is not $\ZERO$ and not an \texttt{ALTs},
+%   then we just keep the head of the list and denest the rest.\\
+%   \mbox{}\hfill\mbox{[1 Mark]}
+
+\item[(3)] Implement the function \textit{simp}, which recursively
+  traverses a regular expression, and on the way up simplifies every
+  regular expression on the left (see below) to the regular expression
+  on the right, except it does not simplify inside ${}^*$ and ${}^{\{n\}}$-regular
+  expressions.
 
   \begin{center}
-    \begin{tabular}{lllll}
-      1) &$rs = []$                & $\dn$ & $[]$ & (empty list)\\
-      2) &$rs = \ZERO :: rest$     & $\dn$ & $\texttt{denest}\;rest$ & (throw away $\ZERO$)\\
-      3) &$rs = (\sum rs) :: rest$ & $\dn$ & $rs ::: \texttt{denest}\;rest$ & (spill out $\sum$)\\
-      4) &$rs = r :: rest$         & $\dn$ & $r :: \texttt{denest}\;rest$ & (otherwise)\\
-    \end{tabular}  
-  \end{center}  
-
-  The first clause states that empty lists cannot be further
-  denested. The second removes the first $\ZERO$ from the list and recurses.
-  The third is when the first regular expression is an \texttt{ALTs}, then
-  the content of this alternative should be spilled out and appended
-  with the denested rest of the list. The last case is for all other
-  cases where the head of the list is not $\ZERO$ and not an \texttt{ALTs},
-  then we just keep the head of the list and denest the rest.\\
-  \mbox{}\hfill\mbox{[1 Mark]}
-
-\item[(4)] Implement the function \texttt{flts} which flattens our
-  n-ary sequence regular expression $\prod$. Like \texttt{denest}, this
-  function is intended to delete $\ONE$s and spill out nested $\prod$s.
-  Unfortunately, there is a special case to do with $\ZERO$: If this function encounters a $\ZERO$, then
-  the whole ``product'' should be $\ZERO$. The problem is that the $\ZERO$ can be anywhere
-  inside the list. The easiest way to implement this function is therefore by using an
-  accumulator, which when called is set to \texttt{Nil}. This means \textit{flts} takes
-  two arguments (which are both lists of regular expressions)
-
-  \[
-  \texttt{flts}\;rs\;acc  
-  \]
-
-  This function analyses the list $rs$ as follows
-
-  \begin{center}
-    \begin{tabular}{@{}lllll@{}}
-      1) &$rs = []$                   & $\dn$ & $acc$ & (empty list)\\
-      2) &$rs = \ZERO :: rest$        & $\dn$ & $[\ZERO]$ & (special case for $\ZERO$)\\
-      3) &$rs = \ONE :: rest$         & $\dn$ & $\texttt{flts}\,rest\,acc$ & (throw away $\ONE$)\\
-      4) &$rs = (\prod rs) :: rest$ & $\dn$ & $\texttt{flts}\;rest\,(acc ::: rs)$ & (spill out $\prod$)\\
-      5) &$rs = r :: rest$            & $\dn$ & $\texttt{flts}\;rest\,(acc ::: [r])$& (otherwise)\\
-    \end{tabular}  
+\begin{tabular}{l@{\hspace{4mm}}c@{\hspace{4mm}}ll}
+$r \cdot \ZERO$ & $\mapsto$ & $\ZERO$\\ 
+$\ZERO \cdot r$ & $\mapsto$ & $\ZERO$\\ 
+$r \cdot \ONE$ & $\mapsto$ & $r$\\ 
+$\ONE \cdot r$ & $\mapsto$ & $r$\\ 
+$r + \ZERO$ & $\mapsto$ & $r$\\ 
+$\ZERO + r$ & $\mapsto$ & $r$\\ 
+$r + r$ & $\mapsto$ & $r$\\ 
+$r \,\&\, \ZERO$ & $\mapsto$ & $\ZERO$\\ 
+$\ZERO \,\&\, r$ & $\mapsto$ & $\ZERO$\\ 
+$r \,\&\, r$ & $\mapsto$ & $r$\\ 
+\end{tabular}
   \end{center}
 
-  In the first case we just return whatever has accumulated in
-  $acc$. In the fourth case we spill out the $rs$ by appending the
-  $rs$ to the end of the accumulator. Similarly in the last case we
-  append the single regular expression $r$ to the end of the
-  accumulator. I let you think why you have to add it to the end. \mbox{}\hfill\mbox{[1 Mark]}
+  For example the regular expression
+  \[(r_1 + \ZERO) \cdot \ONE + ((\ONE + r_2) + r_3) \,\&\, (r_4 \cdot \ZERO)\]
+
+  simplifies to just $r_1$. \textbf{Hint:} Regular expressions can be
+  seen as trees and there are several methods for traversing
+  trees. One of them corresponds to the inside-out traversal, which is also
+  sometimes called post-order tra\-versal: you traverse inside the
+  tree and on the way up you apply simplification rules.
+  \textbf{Another Hint:}
+  Remember numerical expressions from school times---there you had expressions
+  like $u + \ldots + (1 \cdot x) - \ldots (z + (y \cdot 0)) \ldots$
+  and simplification rules that looked very similar to rules
+  above. You would simplify such numerical expressions by replacing
+  for example the $y \cdot 0$ by $0$, or $1\cdot x$ by $x$, and then
+  look whether more rules are applicable. If you organise the
+  simplification in an inside-out fashion, it is always clear which
+  simplification should be applied next.\hfill[2 Marks]
+
 
-\item[(5)] Before we can simplify regular expressions, we need what is often called
-  \emph{smart constructors} for $\sum$ and $\prod$. While the ``normal'' constructors
-  \texttt{ALTs} and \texttt{SEQs} give us alternatives and sequences, respectively, \emph{smart}
-  constructors might return something different depending on what list of regular expressions
-  they are given as argument.
+% \item[(4)] Implement the function \texttt{flts} which flattens our
+%   n-ary sequence regular expression $\prod$. Like \texttt{denest}, this
+%   function is intended to delete $\ONE$s and spill out nested $\prod$s.
+%   Unfortunately, there is a special case to do with $\ZERO$: If this function encounters a $\ZERO$, then
+%   the whole ``product'' should be $\ZERO$. The problem is that the $\ZERO$ can be anywhere
+%   inside the list. The easiest way to implement this function is therefore by using an
+%   accumulator, which when called is set to \texttt{Nil}. This means \textit{flts} takes
+%   two arguments (which are both lists of regular expressions)
+
+%   \[
+%   \texttt{flts}\;rs\;acc  
+%   \]
+
+%   This function analyses the list $rs$ as follows
+
+%   \begin{center}
+%     \begin{tabular}{@{}lllll@{}}
+%       1) &$rs = []$                   & $\dn$ & $acc$ & (empty list)\\
+%       2) &$rs = \ZERO :: rest$        & $\dn$ & $[\ZERO]$ & (special case for $\ZERO$)\\
+%       3) &$rs = \ONE :: rest$         & $\dn$ & $\texttt{flts}\,rest\,acc$ & (throw away $\ONE$)\\
+%       4) &$rs = (\prod rs) :: rest$ & $\dn$ & $\texttt{flts}\;rest\,(acc ::: rs)$ & (spill out $\prod$)\\
+%       5) &$rs = r :: rest$            & $\dn$ & $\texttt{flts}\;rest\,(acc ::: [r])$& (otherwise)\\
+%     \end{tabular}  
+%   \end{center}
+
+%   In the first case we just return whatever has accumulated in
+%   $acc$. In the fourth case we spill out the $rs$ by appending the
+%   $rs$ to the end of the accumulator. Similarly in the last case we
+%   append the single regular expression $r$ to the end of the
+%   accumulator. I let you think why you have to add it to the end. \mbox{}\hfill\mbox{[1 Mark]}
 
-  \begin{center}
-  \begin{tabular}{@{}c@{\hspace{9mm}}c@{}}
-    \begin{tabular}{l@{\hspace{2mm}}l@{\hspace{1mm}}ll}
-      & $\sum^{smart}$\smallskip\\
-      1) & $rs = []$  & $\dn$ & $\ZERO$\\ 
-      2) & $rs = [r]$ & $\dn$ & $r$\\ \\
-      3) & otherwise  & $\dn$ & $\sum\,rs$
-    \end{tabular} &
-    \begin{tabular}{l@{\hspace{2mm}}l@{\hspace{1mm}}ll}
-        & $\prod^{smart}$\smallskip\\              
-        1) & $rs = []$ & $\dn$ & $\ONE$\\
-        2a) & $rs = [\ZERO]$ & $\dn$ & $\ZERO$\\
-        2b) & $rs = [r]$ & $\dn$ & $r$\\
-        3) & otherwise  & $\dn$ & $\prod\,rs$
-    \end{tabular}              
-  \end{tabular}    
-  \end{center}
-  \mbox{}\hfill\mbox{[0.5 Marks]}
+% \item[(5)] Before we can simplify regular expressions, we need what is often called
+%   \emph{smart constructors} for $\sum$ and $\prod$. While the ``normal'' constructors
+%   \texttt{ALTs} and \texttt{SEQs} give us alternatives and sequences, respectively, \emph{smart}
+%   constructors might return something different depending on what list of regular expressions
+%   they are given as argument.
+
+%   \begin{center}
+%   \begin{tabular}{@{}c@{\hspace{9mm}}c@{}}
+%     \begin{tabular}{l@{\hspace{2mm}}l@{\hspace{1mm}}ll}
+%       & $\sum^{smart}$\smallskip\\
+%       1) & $rs = []$  & $\dn$ & $\ZERO$\\ 
+%       2) & $rs = [r]$ & $\dn$ & $r$\\ \\
+%       3) & otherwise  & $\dn$ & $\sum\,rs$
+%     \end{tabular} &
+%     \begin{tabular}{l@{\hspace{2mm}}l@{\hspace{1mm}}ll}
+%         & $\prod^{smart}$\smallskip\\              
+%         1) & $rs = []$ & $\dn$ & $\ONE$\\
+%         2a) & $rs = [\ZERO]$ & $\dn$ & $\ZERO$\\
+%         2b) & $rs = [r]$ & $\dn$ & $r$\\
+%         3) & otherwise  & $\dn$ & $\prod\,rs$
+%     \end{tabular}              
+%   \end{tabular}    
+%   \end{center}
+%   \mbox{}\hfill\mbox{[0.5 Marks]}
   
-\item[(6)] Implement the function \textit{simp}, which recursively
-  traverses a regular expression, and on the way up simplifies every
-  regular expression on the left (see below) to the regular expression
-  on the right, except it does not simplify inside ${}^*$-regular
-  expressions and also does not simplify $\ZERO$, $\ONE$ and characters.
+% \item[(6)] Implement the function \textit{simp}, which recursively
+%   traverses a regular expression, and on the way up simplifies every
+%   regular expression on the left (see below) to the regular expression
+%   on the right, except it does not simplify inside ${}^*$-regular
+%   expressions and also does not simplify $\ZERO$, $\ONE$ and characters.
 
-  \begin{center}
-    \begin{tabular}{@{}l@{\hspace{3mm}}c@{\hspace{3mm}}ll@{}}
-      LHS: & & RHS:\smallskip\\
-$\sum\;[r_1,..,r_n]$ & $\mapsto$ & $\sum^{smart}\;(\texttt{(denest + distinct)}[simp(r_1),..,simp(r_n)])$\\
-      $\prod\;[r_1,..,r_n]$ & $\mapsto$ & $\prod^{smart}\;(\texttt{(flts)}[simp(r_1),..,simp(r_n)])$\\
-      $r$ & $\mapsto$ & $r$ \quad (all other cases)
-\end{tabular}
-\end{center}
+%   \begin{center}
+%     \begin{tabular}{@{}l@{\hspace{3mm}}c@{\hspace{3mm}}ll@{}}
+%       LHS: & & RHS:\smallskip\\
+% $\sum\;[r_1,..,r_n]$ & $\mapsto$ & $\sum^{smart}\;(\texttt{(denest + distinct)}[simp(r_1),..,simp(r_n)])$\\
+%       $\prod\;[r_1,..,r_n]$ & $\mapsto$ & $\prod^{smart}\;(\texttt{(flts)}[simp(r_1),..,simp(r_n)])$\\
+%       $r$ & $\mapsto$ & $r$ \quad (all other cases)
+% \end{tabular}
+% \end{center}
 
-The first case is as follows: first apply $simp$ to all regular
-expressions $r_1,.. ,r_n$; then denest the resulting list using
-\texttt{denest}; after that remove all duplicates in this list (this can be
-done in Scala using the function
-\texttt{\_.distinct}). Finally, you end up with a list of (simplified)
-regular expressions; apply the smart constructor $\sum^{smart}$ to this list.
-Similarly in the $\prod$ case: simplify first all regular
-expressions $r_1,.. ,r_n$; then flatten the resulting list using \texttt{flts} and apply the
-smart constructor $\prod^{smart}$ to the result. In all other cases, just return the
-input $r$ as is.
+% The first case is as follows: first apply $simp$ to all regular
+% expressions $r_1,.. ,r_n$; then denest the resulting list using
+% \texttt{denest}; after that remove all duplicates in this list (this can be
+% done in Scala using the function
+% \texttt{\_.distinct}). Finally, you end up with a list of (simplified)
+% regular expressions; apply the smart constructor $\sum^{smart}$ to this list.
+% Similarly in the $\prod$ case: simplify first all regular
+% expressions $r_1,.. ,r_n$; then flatten the resulting list using \texttt{flts} and apply the
+% smart constructor $\prod^{smart}$ to the result. In all other cases, just return the
+% input $r$ as is.
   
 
-  For example the regular expression
-  \[(r_1 + \ZERO) \cdot \ONE + ((\ONE + r_2) + r_3) \cdot (r_4 \cdot \ZERO)\]
+%   For example the regular expression
+%   \[(r_1 + \ZERO) \cdot \ONE + ((\ONE + r_2) + r_3) \cdot (r_4 \cdot \ZERO)\]
 
-  simplifies to just $r_1$. \mbox{}\hfill\mbox{[1 Mark]}
+%   simplifies to just $r_1$. \mbox{}\hfill\mbox{[1 Mark]}
 
-\item[(7)] Implement two functions: The first, called \textit{ders},
+\item[(4)] Implement two functions: The first, called \textit{ders},
   takes a list of characters and a regular expression as arguments, and
   builds the derivative w.r.t.~the list as follows:
 
@@ -428,19 +468,19 @@
 true for the regular expression $(a\cdot b)\cdot c$ and the string
 $abc$, but false if you give it the string $ab$. \hfill[0.5 Mark]
 
-\item[(8)] Implement a function, called \textit{size}, by recursion
+\item[(5)] Implement a function, called \textit{size}, by recursion
   over regular expressions. If a regular expression is seen as a tree,
   then \textit{size} should return the number of nodes in such a
   tree. Therefore this function is defined as follows:
 
 \begin{center}
-\begin{tabular}{lcl}
+\begin{tabular}{lcll}
 $\textit{size}(\ZERO)$ & $\dn$ & $1$\\
 $\textit{size}(\ONE)$  & $\dn$ & $1$\\
 $\textit{size}(c)$     & $\dn$ & $1$\\
-$\textit{size}(\sum\,[r_1,..,r_n]$ & $\dn$ & $1 + \textit{size}(r_1) + ... + \textit{size}(r_n)$\\
-$\textit{size}(\prod\,[r_1,..,r_n]$ & $\dn$ & $1 + \textit{size}(r_1) + ... + \textit{size}(r_n)$\\
+$\textit{size}(r_1 \,?\, r_2)$ & $\dn$ & $1 + \textit{size}(r_1) + \textit{size}(r_2)$ & where $? \in \{\cdot, +, \&\}$\\
 $\textit{size}(r^*)$ & $\dn$ & $1 + \textit{size}(r)$\\
+$\textit{size}(r^{\{n\}})$ & $\dn$ & $1 + \textit{size}(r)$\\
 \end{tabular}
 \end{center}
 
@@ -450,7 +490,7 @@
 taking the derivative, but simplify the result.  The sizes
 are given in \texttt{re.scala}. \hfill[0.5 Marks]
 
-\item[(9)] You do not have to implement anything specific under this
+\item[(6)] You do not have to implement anything specific under this
   task.  The purpose here is that you will be marked for some ``power''
   test cases. For example can your matcher decide within 30 seconds
   whether the regular expression $(a^*)^*\cdot b$ matches strings of the
@@ -469,7 +509,7 @@
 \subsection*{Background}
 
 Although easily implementable in Scala (ok maybe the \texttt{simp} functions and
-the constructors \texttt{ALTs}/\texttt{SEQs} needs a bit more thinking), the idea behind the
+the constructors \texttt{ALT}/\texttt{SEQ}/\texttt{AND} needs a bit more thinking), the idea behind the
 derivative function might not so easy to be seen. To understand its
 purpose better, assume a regular expression $r$ can match strings of
 the form $c\!::\!cs$ (that means strings which start with a character
@@ -567,7 +607,7 @@
     axis lines=left,
     width=6cm,
     height=5.5cm, 
-    legend entries={Java 9},  
+    legend entries={Java 9 and above},  
     legend pos=north west]
 \addplot[cyan,mark=*, mark options={fill=white}] table {re-java9.data};
 \end{axis}

Binary file slides/slides01.pdf has changed

--- a/slides/slides01.tex	Mon Nov 10 16:24:46 2025 +0000
+++ b/slides/slides01.tex	Thu Nov 13 17:44:58 2025 +0000
@@ -325,9 +325,9 @@
 Installation problems:
 \begin{itemize}
 \item Zoltan Meszaros (\texttt{\small{}zoltan.meszaros@kcl.ac.uk})  
-\item Zishan Rahman (\texttt{\small{}zishan.rahman@kcl.ac.uk})
-\item Bofan Zhang (\texttt{\small{}bofan.zhang@kcl.ac.uk})
-\item Aidan Dakhama (\texttt{\small{}aidan.dakhama@kcl.ac.uk})  
+\item Zishan Rahman (\texttt{\small{}zishan.rahman@kcl.ac.uk}, Linux)
+\item Bofan Zhang (\texttt{\small{}bofan.zhang@kcl.ac.uk}, MacOSX)
+\item Aidan Dakhama (\texttt{\small{}aidan.dakhama@kcl.ac.uk}, Linux)  
   \bigskip
 \end{itemize}
 Github problems:

author	Christian Urban <christian.urban@kcl.ac.uk>
	Thu, 13 Nov 2025 17:44:58 +0000
changeset 498	0f1b97538ad4
parent 497	ef37fb04a343
child 499	2f33c51cac48

cws/core_cw01.pdf		file \| annotate \| diff \| comparison \| revisions
cws/core_cw01.tex		file \| annotate \| diff \| comparison \| revisions
cws/core_cw02.pdf		file \| annotate \| diff \| comparison \| revisions
cws/core_cw02.tex		file \| annotate \| diff \| comparison \| revisions
cws/core_cw03.pdf		file \| annotate \| diff \| comparison \| revisions
cws/core_cw03.tex		file \| annotate \| diff \| comparison \| revisions
cws/disclaimer.sty		file \| annotate \| diff \| comparison \| revisions
cws/main_cw03.pdf		file \| annotate \| diff \| comparison \| revisions
cws/main_cw03.tex		file \| annotate \| diff \| comparison \| revisions
slides/slides01.pdf		file \| annotate \| diff \| comparison \| revisions
slides/slides01.tex		file \| annotate \| diff \| comparison \| revisions