51
|
1 |
// Scala Lecture 2
|
|
2 |
//=================
|
|
3 |
|
204
|
4 |
// UNFINISHED BUSINESS from Lecture 1
|
|
5 |
//====================================
|
|
6 |
|
|
7 |
|
|
8 |
// for measuring time
|
|
9 |
// Measures how long it takes to evaluate `code` exactly `n` times.
//   n    - number of repetitions (no evaluation happens when n <= 0)
//   code - by-name argument, re-evaluated on every repetition
// Returns the total elapsed wall-clock time in seconds.
def time_needed[T](n: Int, code: => T): Double = {
  val start = System.nanoTime()
  // `1 to n` gives exactly n repetitions; `0 to n` would run one extra time
  for (_ <- 1 to n) code
  val end = System.nanoTime()
  (end - start) / 1.0e9
}
|
|
15 |
|
|
16 |
|
|
17 |
val list = (1 to 1000000).toList
|
|
18 |
time_needed(10, for (n <- list) yield n + 42)
|
|
19 |
time_needed(10, for (n <- list.par) yield n + 42)
|
|
20 |
|
268
|
21 |
// (needs a library and 'magic' option -Yrepl-class-based)
|
204
|
22 |
|
212
|
23 |
|
|
24 |
// Just for Fun: Mutable vs Immutable
|
|
25 |
//====================================
|
204
|
26 |
//
|
|
27 |
// - no vars, no ++i, no +=
|
|
28 |
// - no mutable data-structures (no Arrays, no ListBuffers)
|
|
29 |
|
|
30 |
|
212
|
31 |
// Q: Count how many elements are in the intersections of
|
|
32 |
// two sets?
|
204
|
33 |
|
|
34 |
// Counts the elements of A that are also contained in B.
// This is the imperative variant: it walks over A with a for-loop
// and bumps a mutable counter for every hit.
def count_intersection(A: Set[Int], B: Set[Int]) : Int = {
  var hits = 0
  for (elem <- A) {
    if (B.contains(elem)) hits += 1
  }
  hits
}
|
|
39 |
|
|
40 |
val A = (1 to 1000).toSet
|
|
41 |
val B = (1 to 1000 by 4).toSet
|
|
42 |
|
|
43 |
count_intersection(A, B)
|
|
44 |
|
|
45 |
// but do not try to add .par to the for-loop above
|
|
46 |
|
|
47 |
|
|
48 |
// proper parallel version
|
|
49 |
// Counts the elements of A that are also contained in B, without any
// mutable state: the membership test is handed to `count` on the
// parallel view of A.
def count_intersection2(A: Set[Int], B: Set[Int]) : Int = {
  val parallelA = A.par
  parallelA.count(elem => B.contains(elem))
}
|
|
51 |
|
|
52 |
count_intersection2(A, B)
|
|
53 |
|
|
54 |
|
|
55 |
val A = (1 to 1000000).toSet
|
|
56 |
val B = (1 to 1000000 by 4).toSet
|
|
57 |
|
|
58 |
time_needed(100, count_intersection(A, B))
|
|
59 |
time_needed(100, count_intersection2(A, B))
|
|
60 |
|
|
61 |
|
|
62 |
|
|
63 |
// For-Comprehensions Again
|
|
64 |
//==========================
|
|
65 |
|
|
66 |
// the first produces a result, while the second does not
|
|
67 |
for (n <- List(1, 2, 3, 4, 5)) yield n * n
|
|
68 |
|
|
69 |
|
|
70 |
for (n <- List(1, 2, 3, 4, 5)) println(n)
|
|
71 |
|
|
72 |
|
|
73 |
|
|
74 |
// Higher-Order Functions
|
|
75 |
//========================
|
|
76 |
|
|
77 |
// functions can take functions as arguments
|
|
78 |
|
|
79 |
// True when x is divisible by two (lowest bit is clear).
def even(x: Int) : Boolean = (x & 1) == 0
|
|
80 |
// True when x is not divisible by two.
// Compares the remainder against 0 because `%` keeps the sign of x:
// -3 % 2 is -1, so a test for `== 1` would miss negative odd numbers.
def odd(x: Int) : Boolean = x % 2 != 0
|
|
81 |
|
|
82 |
val lst = (1 to 10).toList
|
|
83 |
|
|
84 |
lst.filter(x => even(x))
|
|
85 |
lst.filter(even(_))
|
|
86 |
lst.filter(even)
|
|
87 |
|
|
88 |
lst.count(even)
|
|
89 |
|
212
|
90 |
|
|
91 |
lst.find(even)
|
|
92 |
|
|
93 |
val ps = List((3, 0), (3, 2), (4, 2), (2, 2), (2, 0), (1, 1), (1, 0))
|
204
|
94 |
|
212
|
95 |
lst.sortWith(_ > _)
|
|
96 |
lst.sortWith(_ < _)
|
204
|
97 |
|
212
|
98 |
// Lexicographic "less than" on pairs: the first components decide,
// and only when they are equal are the second components compared.
def lex(x: (Int, Int), y: (Int, Int)) : Boolean = {
  val (x1, x2) = x
  val (y1, y2) = y
  if (x1 != y1) x1 < y1 else x2 < y2
}
|
|
100 |
|
|
101 |
ps.sortWith(lex)
|
204
|
102 |
|
|
103 |
ps.sortBy(_._1)
|
|
104 |
ps.sortBy(_._2)
|
|
105 |
|
|
106 |
ps.maxBy(_._1)
|
|
107 |
ps.maxBy(_._2)
|
|
108 |
|
|
109 |
|
|
110 |
|
212
|
111 |
// maps (lower-case)
|
|
112 |
//===================
|
204
|
113 |
|
212
|
114 |
// Returns twice the value of x.
def double(x: Int): Int = 2 * x
|
204
|
115 |
// Returns x multiplied by itself.
def square(x: Int): Int = x * x
|
|
116 |
|
212
|
117 |
|
|
118 |
|
204
|
119 |
val lst = (1 to 10).toList
|
|
120 |
|
212
|
121 |
lst.map(x => (double(x), square(x)))
|
|
122 |
|
204
|
123 |
lst.map(square)
|
|
124 |
|
268
|
125 |
// this is actually how for-comprehensions
|
|
126 |
// are defined in Scala
|
204
|
127 |
|
|
128 |
lst.map(n => square(n))
|
|
129 |
for (n <- lst) yield square(n)
|
|
130 |
|
|
131 |
// this can be iterated
|
|
132 |
|
|
133 |
lst.map(square).filter(_ > 4)
|
|
134 |
|
|
135 |
lst.map(square).filter(_ > 4).map(square)
|
|
136 |
|
|
137 |
|
|
138 |
// let's define our own functions
|
|
139 |
// type of functions, for example f: Int => Int
|
|
140 |
|
212
|
141 |
lst.tail
|
|
142 |
|
204
|
143 |
// Hand-written map for integer lists using if/else:
// applies f to every element of lst and keeps the results in order.
def my_map_int(lst: List[Int], f: Int => Int) : List[Int] = {
  if (lst.isEmpty) Nil
  else {
    val mappedHead = f(lst.head)
    mappedHead :: my_map_int(lst.tail, f)
  }
}
|
|
147 |
|
|
148 |
my_map_int(lst, square)
|
|
149 |
|
|
150 |
|
|
151 |
// same function using pattern matching: a kind
|
|
152 |
// of switch statement on steroids (see more later on)
|
|
153 |
|
|
154 |
// Hand-written map for integer lists using pattern matching:
// a non-empty list is split into its head and the remaining elements,
// f is applied to the head and the rest is mapped recursively.
def my_map_int(lst: List[Int], f: Int => Int) : List[Int] = lst match {
  case head :: rest => f(head) :: my_map_int(rest, f)
  case Nil          => Nil
}
|
|
158 |
|
|
159 |
|
|
160 |
// other function types
|
|
161 |
//
|
|
162 |
// f1: (Int, Int) => Int
|
|
163 |
// f2: List[String] => Option[Int]
|
|
164 |
// ...
|
212
|
165 |
val lst = (1 to 10).toList
|
204
|
166 |
|
|
167 |
// Applies f to every element of lst and adds up the results;
// the sum of an empty list is 0.
def sumOf(f: Int => Int, lst: List[Int]): Int =
  lst.foldLeft(0)((total, elem) => total + f(elem))
|
|
171 |
|
|
172 |
// Sum of the squares of all elements of lst.
def sum_squares(lst: List[Int]) = sumOf(elem => square(elem), lst)
|
|
173 |
// Sum of the cubes of all elements of lst.
def sum_cubes(lst: List[Int]) = sumOf(elem => { val sq = elem * elem; sq * elem }, lst)
|
|
174 |
|
|
175 |
sum_squares(lst)
|
|
176 |
sum_cubes(lst)
|
|
177 |
|
|
178 |
// let's try it with factorial
|
212
|
179 |
// Factorial of n, computed by plain recursion down to the base case 0.
def fact(n: Int) : Int = n match {
  case 0 => 1
  case _ => n * fact(n - 1)
}
|
204
|
181 |
|
|
182 |
// Sum of the factorials of all elements of lst.
def sum_fact(lst: List[Int]) = sumOf(elem => fact(elem), lst)
|
|
183 |
sum_fact(lst)
|
|
184 |
|
|
185 |
|
|
186 |
|
|
187 |
|
|
188 |
|
212
|
189 |
// Map type (upper-case)
|
|
190 |
//=======================
|
204
|
191 |
|
|
192 |
// Note the difference between map and Map
|
|
193 |
|
|
194 |
// All divisors of n that are smaller than n itself, in ascending order.
def factors(n: Int) : List[Int] =
  (for (candidate <- 1 until n if n % candidate == 0) yield candidate).toList
|
|
198 |
|
|
199 |
|
|
200 |
// the numbers 1 to 10; never reassigned, so an immutable val suffices
val ls = (1 to 10).toList
|
|
201 |
|
|
202 |
val facs = ls.map(n => (n, factors(n)))
|
|
203 |
|
|
204 |
facs.find(_._1 == 4)
|
|
205 |
|
|
206 |
// works for lists of pairs
|
|
207 |
facs.toMap
|
|
208 |
|
|
209 |
|
|
210 |
facs.toMap.get(4)
|
212
|
211 |
facs.toMap.getOrElse(42, Nil)
|
204
|
212 |
|
|
213 |
val facsMap = facs.toMap
|
|
214 |
|
|
215 |
val facsMap0 = facsMap + (0 -> List(1,2,3,4,5))
|
212
|
216 |
facsMap0.get(1)
|
204
|
217 |
|
|
218 |
val facsMap4 = facsMap + (1 -> List(1,2,3,4,5))
|
|
219 |
facsMap.get(1)
|
|
220 |
facsMap4.get(1)
|
|
221 |
|
|
222 |
val ls = List("one", "two", "three", "four", "five")
|
|
223 |
ls.groupBy(_.length)
|
|
224 |
|
212
|
225 |
ls.groupBy(_.length).get(2)
|
204
|
226 |
|
|
227 |
|
51
|
228 |
|
268
|
229 |
// Option type (again)
|
|
230 |
//=====================
|
53
|
231 |
|
268
|
232 |
// remember, in Java if something unusual happens,
|
|
233 |
// you return null;
|
204
|
234 |
//
|
268
|
235 |
// in Scala you use Option
|
53
|
236 |
// - if the value is present, you use Some(value)
|
|
237 |
// - if no value is present, you use None
|
|
238 |
|
|
239 |
|
192
|
240 |
List(7,2,3,4,5,6).find(_ < 4)
|
53
|
241 |
List(5,6,7,8,9).find(_ < 4)
|
|
242 |
|
204
|
243 |
// operations on options
|
58
|
244 |
|
51
|
245 |
val lst = List(None, Some(1), Some(2), None, Some(3))
|
|
246 |
|
|
247 |
lst.flatten
|
53
|
248 |
|
192
|
249 |
Some(1).get
|
212
|
250 |
None.get
|
51
|
251 |
|
53
|
252 |
Some(1).isDefined
|
|
253 |
None.isDefined
|
|
254 |
|
212
|
255 |
|
|
256 |
None.isDefined
|
|
257 |
|
51
|
258 |
val ps = List((3, 0), (3, 2), (4, 2), (2, 0), (1, 0), (1, 1))
|
|
259 |
|
|
260 |
for ((x, y) <- ps) yield {
|
|
261 |
if (y == 0) None else Some(x / y)
|
|
262 |
}
|
|
263 |
|
192
|
264 |
// getOrElse is for setting a default value
|
53
|
265 |
|
|
266 |
val lst = List(None, Some(1), Some(2), None, Some(3))
|
204
|
267 |
|
57
|
268 |
for (x <- lst) yield x.getOrElse(0)
|
|
269 |
|
|
270 |
|
53
|
271 |
|
|
272 |
|
192
|
273 |
// error handling with Option (no exceptions)
|
57
|
274 |
//
|
|
275 |
// Try(something).getOrElse(what_to_do_in_an_exception)
|
|
276 |
//
|
53
|
277 |
import scala.util._
|
|
278 |
import io.Source
|
|
279 |
|
212
|
280 |
|
|
281 |
Source.fromURL("""http://www.inf.ucl.ac.uk/staff/urbanc/""").mkString
|
53
|
282 |
|
192
|
283 |
Try(Source.fromURL("""http://www.inf.kcl.ac.uk/staff/urbanc/""").mkString).getOrElse("")
|
53
|
284 |
|
192
|
285 |
Try(Some(Source.fromURL("""http://www.inf.kcl.ac.uk/staff/urbanc/""").mkString)).getOrElse(None)
|
53
|
286 |
|
|
287 |
|
204
|
288 |
// a function that turns strings into numbers (similar to .toInt)
|
212
|
289 |
Integer.parseInt("12u34")
|
204
|
290 |
|
|
291 |
|
|
292 |
// Parses s as a decimal integer.
// Returns Some(number) on success and None when parsing throws.
def get_me_an_int(s: String) : Option[Int] =
  Try(Integer.parseInt(s)).toOption
|
|
294 |
|
204
|
295 |
val lst = List("12345", "foo", "5432", "bar", "x21", "456")
|
53
|
296 |
for (x <- lst) yield get_me_an_int(x)
|
|
297 |
|
268
|
298 |
// summing up all the numbers
|
204
|
299 |
|
212
|
300 |
lst.map(get_me_an_int).flatten.sum
|
204
|
301 |
lst.map(get_me_an_int).flatten.sum
|
|
302 |
|
|
303 |
|
212
|
304 |
lst.flatMap(get_me_an_int).map(_.toString)
|
53
|
305 |
|
|
306 |
|
|
307 |
// This may not look any better than working with null in Java, but to
|
|
308 |
// see the value, you have to put yourself in the shoes of the
|
|
309 |
// consumer of the get_me_an_int function, and imagine you didn't
|
|
310 |
// write that function.
|
|
311 |
//
|
|
312 |
// In Java, if you didn't write this function, you'd have to depend on
|
192
|
313 |
// the Javadoc of the get_me_an_int. If you didn't look at the Javadoc,
|
57
|
314 |
// you might not know that get_me_an_int could return a null, and your
|
|
315 |
// code could potentially throw a NullPointerException.
|
53
|
316 |
|
|
317 |
|
192
|
318 |
|
58
|
319 |
// even Scala is not immune to problems like this:
|
|
320 |
|
192
|
321 |
List(5,6,7,8,9).indexOf(7)
|
204
|
322 |
List(5,6,7,8,9).indexOf(10)
|
212
|
323 |
List(5,6,7,8,9)(-1)
|
192
|
324 |
|
|
325 |
|
|
326 |
|
|
327 |
// Pattern Matching
|
|
328 |
//==================
|
|
329 |
|
|
330 |
// A powerful tool which is supposed to come to Java in a few years
|
|
331 |
// time (https://www.youtube.com/watch?v=oGll155-vuQ)...Scala already
|
|
332 |
// has had it for many years ;o)
|
|
333 |
|
|
334 |
// The general schema:
|
|
335 |
//
|
|
336 |
// expression match {
|
|
337 |
// case pattern1 => expression1
|
|
338 |
// case pattern2 => expression2
|
|
339 |
// ...
|
|
340 |
// case patternN => expressionN
|
|
341 |
// }
|
|
342 |
|
|
343 |
|
|
344 |
|
|
345 |
|
204
|
346 |
// remember?
|
192
|
347 |
val lst = List(None, Some(1), Some(2), None, Some(3)).flatten
|
|
348 |
|
|
349 |
|
212
|
350 |
// Hand-written flatten for lists of options: keeps the values wrapped
// in Some (in their original order) and drops every None.
def my_flatten(xs: List[Option[Int]]): List[Int] = xs match {
  case Some(value) :: tail => value :: my_flatten(tail)
  case None :: tail        => my_flatten(tail)
  case Nil                 => Nil
}
|
58
|
357 |
|
|
358 |
|
192
|
359 |
// another example
|
|
360 |
// Classifies n: 0, 1 and 2 are "small", every other number is "big".
def get_me_a_string(n: Int): String =
  if (0 <= n && n <= 2) "small" else "big"
|
|
364 |
|
|
365 |
get_me_a_string(0)
|
|
366 |
|
212
|
367 |
|
192
|
368 |
// you can also have cases combined
|
266
|
369 |
// Maps an English month name to a sentence naming its season.
// There is no catch-all case: a string that is not one of the twelve
// month names below is not matched by any case.
def season(month: String) : String = month match {
  case "December"                           => "It's winter"
  case "January" | "February"               => "It's unfortunately winter"
  case "March" | "April" | "May"            => "It's spring"
  case "June" | "July" | "August"           => "It's summer"
  case "September" | "October" | "November" => "It's autumn"
}
|
|
376 |
|
|
377 |
println(season("November"))
|
|
378 |
|
|
379 |
// What happens if no case matches?
|
212
|
380 |
println(season("foobar"))
|
192
|
381 |
|
|
382 |
|
266
|
383 |
// Days of the months
|
|
384 |
// Number of days in the month with the given English name.
// February is reported with its non-leap-year length of 28 days.
// A string that is not a month name is not matched by any case.
def days(month: String) : Int = month match {
  case "January" | "March" | "May" | "July" |
       "August" | "October" | "December"            => 31
  case "April" | "June" | "September" | "November"  => 30
  case "February"                                   => 28
}
|
|
388 |
|
|
389 |
|
|
390 |
|
|
391 |
|
204
|
392 |
// Silly: fizz buzz
|
192
|
393 |
// Fizz buzz for a single number: multiples of both 3 and 5 give
// "fizz buzz", multiples of 3 give "fizz", multiples of 5 give "buzz",
// and every other number is rendered as its decimal string.
def fizz_buzz(n: Int) : String = {
  val byThree = n % 3 == 0
  val byFive  = n % 5 == 0
  if (byThree && byFive) "fizz buzz"
  else if (byThree) "fizz"
  else if (byFive) "buzz"
  else n.toString
}
|
|
399 |
|
|
400 |
for (n <- 0 to 20)
|
|
401 |
println(fizz_buzz(n))
|
|
402 |
|
|
403 |
|
|
404 |
// User-defined Datatypes
|
|
405 |
//========================
|
|
406 |
|
|
407 |
|
204
|
408 |
// Base type of the colour datatype; the case objects that extend it
// are its values.
abstract class Colour
|
|
409 |
case object Red extends Colour
|
|
410 |
case object Green extends Colour
|
|
411 |
case object Blue extends Colour
|
192
|
412 |
|
204
|
413 |
// Tells whether c is the favourite colour: only Green is.
def fav_colour(c: Colour) : Boolean = c match {
  case Green      => true
  case Red | Blue => false
}
|
|
418 |
|
204
|
419 |
fav_colour(Green)
|
|
420 |
|
192
|
421 |
|
268
|
422 |
// ... a tiny bit more useful: Roman Numerals
|
204
|
423 |
|
|
424 |
// Base type for a single Roman digit; the case objects that extend it
// are the individual digits.
abstract class RomanDigit
|
|
425 |
case object I extends RomanDigit
|
|
426 |
case object V extends RomanDigit
|
|
427 |
case object X extends RomanDigit
|
|
428 |
case object L extends RomanDigit
|
|
429 |
case object C extends RomanDigit
|
|
430 |
case object D extends RomanDigit
|
|
431 |
case object M extends RomanDigit
|
|
432 |
|
|
433 |
type RomanNumeral = List[RomanDigit]
|
192
|
434 |
|
212
|
435 |
List(X,I)
|
|
436 |
|
268
|
437 |
/*
|
212
|
438 |
I -> 1
|
|
439 |
II -> 2
|
|
440 |
III -> 3
|
|
441 |
IV -> 4
|
|
442 |
V -> 5
|
|
443 |
VI -> 6
|
|
444 |
VII -> 7
|
|
445 |
VIII -> 8
|
|
446 |
IX -> 9
|
|
447 |
X -> 10
|
268
|
448 |
*/
|
212
|
449 |
|
204
|
450 |
// Converts a list of Roman digits into its integer value.
// The list is consumed from the front. Two-digit subtractive prefixes
// (CM, CD, XC, XL, IX, IV) are listed before the single digits so that
// they win whenever both kinds of case could match.
def RomanNumeral2Int(rs: RomanNumeral): Int = rs match {
  case Nil => 0
  // subtractive pairs
  case C :: M :: rest => 900 + RomanNumeral2Int(rest)
  case C :: D :: rest => 400 + RomanNumeral2Int(rest)
  case X :: C :: rest => 90 + RomanNumeral2Int(rest)
  case X :: L :: rest => 40 + RomanNumeral2Int(rest)
  case I :: X :: rest => 9 + RomanNumeral2Int(rest)
  case I :: V :: rest => 4 + RomanNumeral2Int(rest)
  // single digits
  case M :: rest => 1000 + RomanNumeral2Int(rest)
  case D :: rest => 500 + RomanNumeral2Int(rest)
  case C :: rest => 100 + RomanNumeral2Int(rest)
  case L :: rest => 50 + RomanNumeral2Int(rest)
  case X :: rest => 10 + RomanNumeral2Int(rest)
  case V :: rest => 5 + RomanNumeral2Int(rest)
  case I :: rest => 1 + RomanNumeral2Int(rest)
}
|
|
466 |
|
204
|
467 |
RomanNumeral2Int(List(I,V)) // 4
|
|
468 |
RomanNumeral2Int(List(I,I,I,I)) // 4 (invalid Roman number)
|
|
469 |
RomanNumeral2Int(List(V,I)) // 6
|
|
470 |
RomanNumeral2Int(List(I,X)) // 9
|
|
471 |
RomanNumeral2Int(List(M,C,M,L,X,X,I,X)) // 1979
|
|
472 |
RomanNumeral2Int(List(M,M,X,V,I,I)) // 2017
|
|
473 |
|
192
|
474 |
|
204
|
475 |
// another example
|
|
476 |
//=================
|
192
|
477 |
|
212
|
478 |
// Once upon a time, in a completely fictional
|
|
479 |
// country there were Persons...
|
192
|
480 |
|
|
481 |
|
|
482 |
// The kinds of persons in the fictional country.
//   King    - the single monarch
//   Peer    - has a degree (deg), a territory (terr) and a number (succ)
//   Knight  - has a name
//   Peasant - has a name
//   Clown   - carries no data; it is matched on and listed alongside
//             the other persons, so it has to be part of this datatype
abstract class Person
case object King extends Person
case class Peer(deg: String, terr: String, succ: Int) extends Person
case class Knight(name: String) extends Person
case class Peasant(name: String) extends Person
case object Clown extends Person
|
212
|
487 |
|
173
|
488 |
|
192
|
489 |
// Builds the form of address for a person: a fixed phrase for the King,
// degree and territory for a Peer, "Sir" plus name for a Knight, and
// just the name for a Peasant.
def title(p: Person): String = p match {
  case Peasant(who)           => who
  case Knight(who)            => s"Sir ${who}"
  case Peer(rank, domain, _)  => s"The ${rank} of ${domain}"
  case King                   => "His Majesty the King"
}
|
173
|
495 |
|
192
|
496 |
// Decides whether p1 ranks above p2.
// The King is above everybody, a Peer is above Knights, Peasants and
// the Clown, a Knight is above Peasants and the Clown, and the Clown is
// above Peasants. Every other combination yields false.
def superior(p1: Person, p2: Person): Boolean = (p1, p2) match {
  case (King, _)                                        => true
  case (Peer(_,_,_), Knight(_) | Peasant(_) | Clown)    => true
  case (Knight(_), Peasant(_) | Clown)                  => true
  case (Clown, Peasant(_))                              => true
  case _                                                => false
}
|
|
506 |
|
|
507 |
val people = List(Knight("David"),
|
|
508 |
Peer("Duke", "Norfolk", 84),
|
|
509 |
Peasant("Christian"),
|
204
|
510 |
King,
|
|
511 |
Clown)
|
192
|
512 |
|
212
|
513 |
println(people.sortWith(superior).mkString("\n"))
|
|
514 |
|
192
|
515 |
|
268
|
516 |
// Tail Recursion
|
204
|
517 |
//================
|
147
|
518 |
|
|
519 |
|
204
|
520 |
// Factorial on Long values by plain recursion.
// Not tail-recursive: the multiplication happens after the recursive
// call returns, so every level of recursion needs its own stack frame.
def fact(n: Long): Long = n match {
  case 0L => 1L
  case _  => n * fact(n - 1)
}
|
147
|
522 |
|
204
|
523 |
fact(10) //ok
|
|
524 |
fact(10000) // produces a stackoverflow
|
147
|
525 |
|
204
|
526 |
// Factorial with an accumulator: acc carries the product computed so
// far, so the recursive call is the last thing the function does.
// Call with acc = 1 to obtain n!.
def factT(n: BigInt, acc: BigInt): BigInt = {
  if (n != 0) factT(n - 1, n * acc)
  else acc
}
|
147
|
528 |
|
204
|
529 |
factT(10, 1)
|
|
530 |
factT(100000, 1)
|
192
|
531 |
|
204
|
532 |
// there is a flag for ensuring a function is tail recursive
|
|
533 |
import scala.annotation.tailrec
|
167
|
534 |
|
204
|
535 |
// Accumulator-style factorial, annotated so that the compiler rejects
// the definition if the recursive call is not in tail position.
// Call with acc = 1 to obtain n!.
@tailrec
def factT(n: BigInt, acc: BigInt): BigInt = {
  val finished = n == 0
  if (finished) acc else factT(n - 1, n * acc)
}
|
167
|
538 |
|
|
539 |
|
|
540 |
|
204
|
541 |
// for tail-recursive functions the Scala compiler
|
|
542 |
// generates loop-like code, which does not need
|
|
543 |
// to allocate stack-space in each recursive
|
|
544 |
// call; Scala can do this only for tail-recursive
|
|
545 |
// functions
|
|
546 |
|
147
|
547 |
|
212
|
548 |
// A Web Crawler / Email Harvester
|
|
549 |
//=================================
|
204
|
550 |
//
|
212
|
551 |
// the idea is to look for links using the
|
|
552 |
// regular expression "https?://[^"]*" and for
|
|
553 |
// email addresses using another regex.
|
204
|
554 |
|
|
555 |
import io.Source
|
|
556 |
import scala.util._
|
|
557 |
|
|
558 |
// gets the first 10K of a web-page
|
|
559 |
// Fetches at most the first 10000 characters of the page at `url`,
// decoding it as ISO-8859-1.
// Any non-fatal failure (malformed URL, network error, ...) is reported
// on stdout and yields the empty string instead of an exception.
def get_page(url: String) : String = {
  Try {
    val source = Source.fromURL(url)("ISO-8859-1")
    // close the underlying stream even when reading fails half-way
    try source.take(10000).mkString finally source.close()
  }.getOrElse { println(s" Problem with: $url"); "" }
}
|
|
563 |
|
204
|
564 |
// regex for URLs and emails
|
|
565 |
val http_pattern = """"https?://[^"]*"""".r
|
|
566 |
val email_pattern = """([a-z0-9_\.-]+)@([\da-z\.-]+)\.([a-z\.]{2,6})""".r
|
|
567 |
|
268
|
568 |
//test case:
|
212
|
569 |
//email_pattern.findAllIn
|
|
570 |
// ("foo bla christian@kcl.ac.uk 1234567").toList
|
|
571 |
|
204
|
572 |
|
|
573 |
// drops the first and last character from a string
|
|
574 |
// Strips the first and the last character from s;
// strings shorter than two characters become empty.
def unquote(s: String) = s.slice(1, s.length - 1)
|
|
575 |
|
|
576 |
// Collects every match of http_pattern in the page, removes the first
// and last character of each match via unquote, and returns the
// distinct results.
def get_all_URLs(page: String): Set[String] = {
  val quotedLinks = http_pattern.findAllIn(page)
  quotedLinks.map(link => unquote(link)).toSet
}
|
|
578 |
|
|
579 |
// naive version of crawl - searches until a given depth,
|
|
580 |
// visits pages potentially more than once
|
|
581 |
// Naive crawler: collects the email addresses found on the page at
// `url` and, recursively, on every page it links to.
//   url - page to start from
//   n   - remaining depth; the page itself is only visited when n > 0
// Pages may be visited more than once. A depth of zero or below stops
// the search, so a negative n cannot recurse without bound.
def crawl(url: String, n: Int) : Set[String] = {
  if (n <= 0) Set()
  else {
    println(s" Visiting: $n $url")
    val page = get_page(url)
    val new_emails = email_pattern.findAllIn(page).toSet
    new_emails ++ (for (u <- get_all_URLs(page)) yield crawl(u, n - 1)).flatten
  }
}
|
|
590 |
|
204
|
591 |
// some starting URLs for the crawler
|
|
592 |
val startURL = """https://nms.kcl.ac.uk/christian.urban/"""
|
147
|
593 |
|
204
|
594 |
crawl(startURL, 2)
|
|
595 |
|
|
596 |
|
|
597 |
|
|
598 |
|
150
|
599 |
|
|
600 |
|
|
601 |
|
192
|
602 |
// Sudoku
|
|
603 |
//========
|
53
|
604 |
|
57
|
605 |
// THE POINT OF THIS CODE IS NOT TO BE SUPER
|
|
606 |
// EFFICIENT AND FAST, just explaining exhaustive
|
|
607 |
// depth-first search
|
|
608 |
|
|
609 |
|
55
|
610 |
val game0 = """.14.6.3..
|
|
611 |
|62...4..9
|
|
612 |
|.8..5.6..
|
|
613 |
|.6.2....3
|
|
614 |
|.7..1..5.
|
|
615 |
|5....9.6.
|
|
616 |
|..6.2..3.
|
|
617 |
|1..5...92
|
|
618 |
|..7.9.41.""".stripMargin.replaceAll("\\n", "")
|
|
619 |
|
|
620 |
type Pos = (Int, Int)
|
268
|
621 |
val emptyValue = '.'
|
|
622 |
val maxValue = 9
|
55
|
623 |
|
|
624 |
val allValues = "123456789".toList
|
|
625 |
val indexes = (0 to 8).toList
|
|
626 |
|
57
|
627 |
|
268
|
628 |
// Index of the first empty field in the game string, or -1 if none is left.
def empty(game: String) = game.indexWhere(_ == emptyValue)
|
|
629 |
// A game is done when no empty field can be found any more.
def isDone(game: String) = empty(game) < 0
|
|
630 |
// Position of the first empty field as (column, row), derived from its
// index in the flat game string.
def emptyPosition(game: String) : Pos = {
  val idx = empty(game)
  (idx % maxValue, idx / maxValue)
}
|
57
|
632 |
|
55
|
633 |
|
268
|
634 |
// The fields of row y, from left to right.
def get_row(game: String, y: Int) = for (col <- indexes) yield game(y * maxValue + col)
|
|
635 |
// The fields of column x, from top to bottom.
def get_col(game: String, x: Int) = for (row <- indexes) yield game(x + row * maxValue)
|
147
|
636 |
|
57
|
637 |
// The nine fields of the 3x3 box that contains pos.
// The box origin is found by rounding each coordinate down to a
// multiple of three; fields are listed column by column.
def get_box(game: String, pos: Pos): List[Char] = {
  val (col, row) = pos
  val left = col - col % 3
  val top  = row - row % 3
  val xs = List.range(left, left + 3)
  val ys = List.range(top, top + 3)
  xs.flatMap(x => ys.map(y => game(x + y * maxValue)))
}
|
55
|
644 |
|
|
645 |
|
192
|
646 |
//get_row(game0, 0)
|
|
647 |
//get_row(game0, 1)
|
|
648 |
//get_box(game0, (3,1))
|
|
649 |
|
268
|
650 |
// Returns a copy of the game string in which the character at index
// pos is replaced by value.
def update(game: String, pos: Int, value: Char): String = {
  val changed = game.updated(pos, value)
  changed
}
|
55
|
652 |
|
|
653 |
// All characters that share a column, a row or a box with pos
// (duplicates included), in that order.
def toAvoid(game: String, pos: Pos): List[Char] = {
  val column = get_col(game, pos._1)
  val row    = get_row(game, pos._2)
  val box    = get_box(game, pos)
  column ::: row ::: box
}
|
55
|
655 |
|
268
|
656 |
// The values that may still be placed at pos: every value from
// allValues that does not already occur in the same column, row or box.
def candidates(game: String, pos: Pos): List[Char] = {
  val taken = toAvoid(game, pos)
  allValues.filterNot(value => taken.contains(value))
}
|
55
|
658 |
|
268
|
659 |
//candidates(game0, (0, 0))
|
55
|
660 |
|
268
|
661 |
// Renders the flat game string as text: a leading newline followed by
// the game cut into chunks of maxValue characters, one chunk per line.
def pretty(game: String): String = {
  val rows = game.grouped(maxValue)
  "\n" + rows.mkString("\n")
}
|
55
|
663 |
|
|
664 |
// Exhaustive depth-first search for all solutions of a game.
// A finished game is its own single solution; otherwise every candidate
// value is tried in the first empty field and the solutions of all the
// resulting games are collected.
def search(game: String): List[String] = {
  if (isDone(game)) List(game)
  else {
    val slot = empty(game)
    candidates(game, emptyPosition(game))
      .flatMap(value => search(update(game, slot, value)))
  }
}
|
|
670 |
|
268
|
671 |
// an easy game
|
55
|
672 |
val game1 = """23.915...
|
|
673 |
|...2..54.
|
|
674 |
|6.7......
|
|
675 |
|..1.....9
|
|
676 |
|89.5.3.17
|
|
677 |
|5.....6..
|
|
678 |
|......9.5
|
|
679 |
|.16..7...
|
|
680 |
|...329..1""".stripMargin.replaceAll("\\n", "")
|
|
681 |
|
57
|
682 |
|
268
|
683 |
// a game that is in the slightly harder category
|
55
|
684 |
val game2 = """8........
|
|
685 |
|..36.....
|
|
686 |
|.7..9.2..
|
|
687 |
|.5...7...
|
|
688 |
|....457..
|
|
689 |
|...1...3.
|
|
690 |
|..1....68
|
|
691 |
|..85...1.
|
|
692 |
|.9....4..""".stripMargin.replaceAll("\\n", "")
|
|
693 |
|
268
|
694 |
// a game with multiple solutions
|
55
|
695 |
val game3 = """.8...9743
|
|
696 |
|.5...8.1.
|
|
697 |
|.1.......
|
|
698 |
|8....5...
|
|
699 |
|...8.4...
|
|
700 |
|...3....6
|
|
701 |
|.......7.
|
|
702 |
|.3.5...8.
|
|
703 |
|9724...5.""".stripMargin.replaceAll("\\n", "")
|
|
704 |
|
57
|
705 |
|
192
|
706 |
search(game0).map(pretty)
|
|
707 |
search(game1).map(pretty)
|
55
|
708 |
|
|
709 |
// for measuring time
|
|
710 |
// Evaluates `code` i times and reports the average time per evaluation.
//   i    - number of repetitions, also the divisor of the average
//   code - by-name argument, re-evaluated on every repetition
// Returns the average in seconds, formatted as "<seconds> secs".
def time_needed[T](i: Int, code: => T) = {
  val start = System.nanoTime()
  (1 to i).foreach(_ => code)
  val end = System.nanoTime()
  val nanosPerRun = (end - start) / i
  s"${nanosPerRun / 1.0e9} secs"
}
|
|
716 |
|
|
717 |
search(game2).map(pretty)
|
57
|
718 |
search(game3).distinct.length
|
192
|
719 |
time_needed(3, search(game2))
|
|
720 |
time_needed(3, search(game3))
|
55
|
721 |
|
53
|
722 |
|
|
723 |
|
|
724 |
|
192
|
725 |
|