progs/lecture2.scala
author Christian Urban <urbanc@in.tum.de>
Tue, 12 Nov 2019 10:47:27 +0000
changeset 319 ed7543c5d317
parent 318 f1215a72cd88
child 320 90aed247c8cf
permissions -rw-r--r--
updated
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
51
0e60e6c24b99 updated
Christian Urban <urbanc@in.tum.de>
parents: 39
diff changeset
     1
// Scala Lecture 2
0e60e6c24b99 updated
Christian Urban <urbanc@in.tum.de>
parents: 39
diff changeset
     2
//=================
0e60e6c24b99 updated
Christian Urban <urbanc@in.tum.de>
parents: 39
diff changeset
     3
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
     4
// For-Comprehensions Again
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
     5
//==========================
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
     6
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
     7
// the first produces a result, while the second does not
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
     8
for (n <- List(1, 2, 3, 4, 5)) yield n * n
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
     9
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    10
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    11
for (n <- List(1, 2, 3, 4, 5)) println(n)
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    12
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    13
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    14
// String Interpolations
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    15
//=======================
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    16
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
    17
// Returns n raised to the third power.
def cube(n: Int) : Int = {
  val squared = n * n
  squared * n
}
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
    18
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    19
val n = 3
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
    20
println("The cube of " + n + " is " + cube(n) + ".")
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    21
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
    22
println(s"The cube of ${n} is ${cube(n)}.")
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    23
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
    24
// or even
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
    25
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
    26
println(s"The cube of ${n} is ${n * n * n}.")
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    27
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    28
// helpful for debugging purposes
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    29
//
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    30
//         "The most effective debugging tool is still careful thought, 
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    31
//          coupled with judiciously placed print statements."
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    32
//                   — Brian W. Kernighan, in Unix for Beginners (1979)
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    33
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    34
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    35
// Euclid's algorithm with a trace: every call first prints its two
// arguments, then either returns a (when b is 0) or recurses on
// (b, a % b).
def gcd_db(a: Int, b: Int) : Int = {
  println(s"Function called with ${a} and ${b}.")
  b match {
    case 0 => a
    case _ => gcd_db(b, a % b)
  }
}
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    39
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
    40
gcd_db(48, 18)
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
    41
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
    42
316
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    43
// The Option Type
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    44
//=================
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    45
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    46
// in Java, if something unusual happens, you return null or
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    47
// raise an exception
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    48
//
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    49
// in Scala you use Options instead
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    50
//   - if the value is present, you use Some(value)
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    51
//   - if no value is present, you use None
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
    52
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
    53
316
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    54
List(7,2,3,4,5,6).find(_ < 4)
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    55
List(5,6,7,8,9).find(_ < 4)
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
    56
310
996279af8952 updated
Christian Urban <urbanc@in.tum.de>
parents: 309
diff changeset
    57
316
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    58
// better error handling with Options (no exceptions)
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    59
//
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    60
//  Try(something).getOrElse(what_to_do_in_case_of_an_exception)
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
    61
//
316
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    62
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    63
import scala.util._
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    64
import io.Source
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    65
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    66
val my_url = "https://nms.kcl.ac.uk/christian.urban/"
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    67
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    68
Source.fromURL(my_url).mkString
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    69
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    70
Try(Source.fromURL(my_url).mkString).getOrElse("")
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    71
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    72
Try(Some(Source.fromURL(my_url).mkString)).getOrElse(None)
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
    73
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
    74
316
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    75
// the same for files
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    76
Try(Some(Source.fromFile("text.txt").mkString)).getOrElse(None)
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    77
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
    78
319
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
    79
// how to implement a function for reading 
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
    80
// the lines of a file...
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
    81
//
316
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    82
// Reads the file called name and returns its lines as a list.
// Any exception raised while opening or reading the file is passed on
// to the caller. The source is closed in all cases so that no file
// handle is leaked.
def get_contents(name: String) : List[String] = {
  val src = Source.fromFile(name)
  // toList forces the lazy line iterator before the source is closed
  try src.getLines().toList finally src.close()
}
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
    84
319
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
    85
get_contents("text.txt")
316
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    86
get_contents("test.txt")
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
    87
316
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    88
// slightly better - return Nil
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    89
// Reads the file called name and returns its lines as a list.
// If opening or reading fails with a non-fatal exception, the empty
// list is returned instead. The source is closed in all cases so that
// no file handle is leaked.
def get_contents(name: String) : List[String] =
  Try {
    val src = Source.fromFile(name)
    // toList forces the lazy line iterator before the source is closed
    try src.getLines().toList finally src.close()
  }.getOrElse(Nil)
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
    91
316
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    92
get_contents("text.txt")
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
    93
316
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    94
// much better - you record in the type that things can go wrong 
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    95
// Reads the file called name and returns Some(list of its lines).
// If opening or reading fails with a non-fatal exception, None is
// returned, so the possibility of failure is visible in the result
// type. The source is closed in all cases so that no file handle is
// leaked.
def get_contents(name: String) : Option[List[String]] =
  Try {
    val src = Source.fromFile(name)
    // toList forces the lazy line iterator before the source is closed
    try src.getLines().toList finally src.close()
  }.toOption
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
    97
316
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    98
get_contents("text.txt")
03d55eb6a0b7 updated
Christian Urban <urbanc@in.tum.de>
parents: 310
diff changeset
    99
get_contents("test.txt")
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   100
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   101
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   102
// operations on options
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   103
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   104
val lst = List(None, Some(1), Some(2), None, Some(3))
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   105
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   106
lst.flatten
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   107
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   108
Some(1).get
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   109
None.get
310
996279af8952 updated
Christian Urban <urbanc@in.tum.de>
parents: 309
diff changeset
   110
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   111
Some(1).isDefined
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   112
None.isDefined
310
996279af8952 updated
Christian Urban <urbanc@in.tum.de>
parents: 309
diff changeset
   113
996279af8952 updated
Christian Urban <urbanc@in.tum.de>
parents: 309
diff changeset
   114
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   115
val ps = List((3, 0), (4, 2), (6, 2), (2, 0), (1, 0), (1, 1))
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   116
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   117
// division where possible
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   118
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   119
for ((x, y) <- ps) yield {
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   120
  if (y == 0) None else Some(x / y)
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   121
}
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   122
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   123
// getOrElse is for setting a default value
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   124
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   125
val lst = List(None, Some(1), Some(2), None, Some(3))
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   126
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   127
for (x <- lst) yield x.getOrElse(0)
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   128
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   129
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   130
// a function that turns strings into numbers (similar to .toInt)
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   131
Integer.parseInt("1234")
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   132
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   133
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   134
// Parses s as a decimal integer using Integer.parseInt.
// Returns Some(number) on success and None if parsing throws
// (for example for "foo" or the empty string).
def get_me_an_int(s: String) : Option[Int] =
  Try(Integer.parseInt(s)).toOption
310
996279af8952 updated
Christian Urban <urbanc@in.tum.de>
parents: 309
diff changeset
   136
996279af8952 updated
Christian Urban <urbanc@in.tum.de>
parents: 309
diff changeset
   137
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   138
// This may not look any better than working with null in Java, but to
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   139
// see the value, you have to put yourself in the shoes of the
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   140
// consumer of the get_me_an_int function, and imagine you didn't
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   141
// write that function.
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   142
//
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   143
// In Java, if you didn't write this function, you'd have to depend on
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   144
// the Javadoc of the get_me_an_int. If you didn't look at the Javadoc, 
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   145
// you might not know that get_me_an_int could return null, and your 
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   146
// code could potentially throw a NullPointerException.
310
996279af8952 updated
Christian Urban <urbanc@in.tum.de>
parents: 309
diff changeset
   147
996279af8952 updated
Christian Urban <urbanc@in.tum.de>
parents: 309
diff changeset
   148
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   149
// even Scala is not immune to problems like this:
310
996279af8952 updated
Christian Urban <urbanc@in.tum.de>
parents: 309
diff changeset
   150
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   151
List(5,6,7,8,9).indexOf(7)
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   152
List(5,6,7,8,9).indexOf(10)
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   153
List(5,6,7,8,9)(-1)
310
996279af8952 updated
Christian Urban <urbanc@in.tum.de>
parents: 309
diff changeset
   154
996279af8952 updated
Christian Urban <urbanc@in.tum.de>
parents: 309
diff changeset
   155
996279af8952 updated
Christian Urban <urbanc@in.tum.de>
parents: 309
diff changeset
   156
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   157
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   158
// Higher-Order Functions
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   159
//========================
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   160
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   161
// functions can take functions as arguments
319
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   162
// and produce functions as result
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   163
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   164
// True when x is divisible by two (checked via the lowest bit).
def even(x: Int) : Boolean = (x & 1) == 0
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   165
// True when x is not divisible by two.
// The remainder is compared against 0 rather than 1 because
// x % 2 is -1 for negative odd numbers.
def odd(x: Int) : Boolean = x % 2 != 0
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   166
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   167
val lst = (1 to 10).toList
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   168
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   169
lst.filter(even)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   170
lst.count(even)
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   171
lst.find(even)
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   172
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   173
lst.filter(x => x % 2 == 0)
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   174
lst.filter(_ % 2 == 0)
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   175
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   176
lst.sortWith(_ > _)
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   177
lst.sortWith(_ < _)
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   178
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   179
// this shorthand only works when the arguments are clear, but
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   180
// not with multiple occurrences
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   181
lst.find(n => odd(n) && n > 2)
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   182
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   183
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   184
val ps = List((3, 0), (3, 2), (4, 2), (2, 2), (2, 0), (1, 1), (1, 0))
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   185
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   186
// Strict lexicographic "less than" on pairs: the first components
// decide unless they are equal, in which case the second components
// are compared.
def lex(x: (Int, Int), y: (Int, Int)) : Boolean = {
  val (x1, x2) = x
  val (y1, y2) = y
  if (x1 != y1) x1 < y1 else x2 < y2
}
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   188
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   189
ps.sortWith(lex)
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   190
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   191
ps.sortBy(_._1)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   192
ps.sortBy(_._2)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   193
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   194
ps.maxBy(_._1)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   195
ps.maxBy(_._2)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   196
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   197
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   198
// maps (lower-case)
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   199
//===================
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   200
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   201
// Returns twice the value of x.
def double(x: Int): Int = 2 * x
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   202
// Returns x multiplied by itself.
def square(x: Int): Int = {
  val factor = x
  factor * factor
}
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   203
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   204
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   205
val lst = (1 to 10).toList
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   206
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   207
lst.map(x => (double(x), square(x)))
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   208
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   209
lst.map(square)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   210
319
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   211
// this is actually how for-comprehensions are
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   212
// defined in Scala
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   213
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   214
lst.map(n => square(n))
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   215
for (n <- lst) yield square(n)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   216
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   217
// this can be iterated
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   218
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   219
lst.map(square).filter(_ > 4)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   220
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   221
lst.map(square).filter(_ > 4).map(square)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   222
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   223
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   224
// let's define our own higher-order functions
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   225
// type of functions is for example Int => Int
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   226
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   227
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   228
// Applies f to every element of lst, front to back, and returns the
// results in the same order.
// The work is done by a tail-recursive helper with an accumulator, so
// long lists do not overflow the call stack.
def my_map_int(lst: List[Int], f: Int => Int) : List[Int] = {
  @scala.annotation.tailrec
  def go(rest: List[Int], acc: List[Int]) : List[Int] =
    if (rest.isEmpty) acc.reverse  // acc was built back to front
    else go(rest.tail, f(rest.head) :: acc)
  go(lst, Nil)
}
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   232
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   233
my_map_int(lst, square)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   234
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   235
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   236
// same function using pattern matching: a kind
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   237
// of switch statement on steroids (see more later on)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   238
319
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   239
// Pattern-matching version: applies f to every element of lst, front
// to back, and returns the results in the same order.
// The match sits inside a tail-recursive helper with an accumulator,
// so long lists do not overflow the call stack.
def my_map_int(lst: List[Int], f: Int => Int) : List[Int] = {
  @scala.annotation.tailrec
  def go(rest: List[Int], acc: List[Int]) : List[Int] = rest match {
    case Nil => acc.reverse  // acc was built back to front
    case x::xs => go(xs, f(x)::acc)
  }
  go(lst, Nil)
}
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   244
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   245
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   246
// other function types
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   247
//
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   248
// f1: (Int, Int) => Int
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   249
// f2: List[String] => Option[Int]
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   250
// ... 
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   251
val lst = (1 to 10).toList
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   252
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   253
// Applies f to every element of lst and adds up the results;
// the sum of the empty list is 0.
// foldLeft walks the list iteratively, so long lists do not overflow
// the call stack.
def sumOf(f: Int => Int, lst: List[Int]): Int =
  lst.foldLeft(0)((acc, x) => acc + f(x))
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   257
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   258
// Adds up the squares of all numbers in lst by passing square to sumOf.
def sum_squares(lst: List[Int]): Int =
  sumOf(n => square(n), lst)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   259
// Adds up the cubes of all numbers in lst by passing an anonymous
// cubing function to sumOf.
def sum_cubes(lst: List[Int]): Int =
  sumOf(n => n * n * n, lst)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   260
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   261
sum_squares(lst)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   262
sum_cubes(lst)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   263
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   264
// let's try a factorial
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   265
// Computes n! = 1 * 2 * ... * n, with fact(0) == 1.
// Negative arguments are rejected with an IllegalArgumentException;
// without the guard the recursion n, n - 1, ... would never reach 0.
// The result is a plain Int, so it wraps around for larger n.
def fact(n: Int) : Int = {
  require(n >= 0, s"fact is undefined for negative input: $n")
  (1 to n).product  // the empty range (n == 0) has product 1
}
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   267
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   268
// Adds up the factorials of all numbers in lst by passing fact to sumOf.
def sum_fact(lst: List[Int]): Int =
  sumOf(n => fact(n), lst)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   269
sum_fact(lst)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   270
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   271
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   272
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   273
// sometimes you need to specify the parameter type explicitly
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   274
(1 to 100).filter((x: Int) => x % 2 == 0).sum 
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   275
319
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   276
// in this case it is clear that x must be an Int
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   277
(1 to 100).filter(x => x % 2 == 0).sum
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   278
319
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   279
// When each parameter (only x in this case) is used only once
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   280
// you can use the wizardly placeholder syntax
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   281
(1 to 100).filter(_ % 2 == 0).sum
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   282
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   283
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   284
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   285
// Option Type and maps
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   286
//======================
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   287
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   288
// a function that turns strings into numbers (similar to .toInt)
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   289
Integer.parseInt("12u34")
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   290
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   291
import scala.util._
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   292
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   293
// Parses s as a decimal Int: Some(number) when Integer.parseInt accepts
// the string, None when it throws.
def get_me_an_int(s: String) : Option[Int] =
  Try(Integer.parseInt(s)).toOption
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   295
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   296
val lst = List("12345", "foo", "5432", "bar", "x21", "456")
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   297
for (x <- lst) yield get_me_an_int(x)
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   298
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   299
// summing up all the numbers
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   300
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   301
lst.map(get_me_an_int).flatten.sum
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   302
lst.map(get_me_an_int).flatten.sum
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   303
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   304
lst.flatMap(get_me_an_int).sum
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   305
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   306
// maps on Options
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   307
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   308
get_me_an_int("1234").map(even)
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   309
get_me_an_int("12u34").map(even)
317
07583fbe4f95 updated
Christian Urban <urbanc@in.tum.de>
parents: 316
diff changeset
   310
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   311
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   312
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   313
// Map type (upper-case)
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   314
//=======================
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   315
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   316
// Note the difference between map and Map
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   317
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   318
// All divisors d of n with 2 <= d < n, in ascending order
// (so 1 and n itself are never included; primes and n <= 2 give Nil).
def factors(n: Int) : List[Int] =
  for (d <- (2 until n).toList if n % d == 0) yield d
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   320
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   321
// the numbers 1 to 10 as a list; never reassigned, so a val suffices
val ls = (1 to 10).toList
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   322
val facs = ls.map(n => (n, factors(n)))
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   323
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   324
facs.find(_._1 == 4)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   325
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   326
// works for lists of pairs
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   327
facs.toMap
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   328
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   329
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   330
facs.toMap.get(4)
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   331
facs.toMap.getOrElse(42, Nil)
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   332
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   333
val facsMap = facs.toMap
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   334
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   335
val facsMap0 = facsMap + (0 -> List(1,2,3,4,5))
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   336
facsMap0.get(0)
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   337
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   338
val facsMap2 = facsMap + (1 -> List(1,2,3,4,5))
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   339
facsMap.get(1)
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   340
facsMap2.get(1)
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   341
319
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   342
// groupBy function on lists (the result is a Map)
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   343
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   344
val ls = List("one", "two", "three", "four", "five")
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   345
ls.groupBy(_.length)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   346
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   347
ls.groupBy(_.length).get(3)
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   348
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   349
51
0e60e6c24b99 updated
Christian Urban <urbanc@in.tum.de>
parents: 39
diff changeset
   350
192
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   351
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   352
// Pattern Matching
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   353
//==================
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   354
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   355
// A powerful tool which is supposed to come to Java in a few years
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   356
// time (https://www.youtube.com/watch?v=oGll155-vuQ)...Scala already
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   357
// has had it for many years ;o)
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   358
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   359
// The general schema:
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   360
//
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   361
//    expression match {
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   362
//       case pattern1 => expression1
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   363
//       case pattern2 => expression2
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   364
//       ...
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   365
//       case patternN => expressionN
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   366
//    }
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   367
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   368
319
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   369
// recall
192
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   370
val lst = List(None, Some(1), Some(2), None, Some(3)).flatten
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   371
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   372
// Hand-written version of .flatten for lists of optional Ints:
// keeps the contents of every Some, drops every None, preserves order.
def my_flatten(xs: List[Option[Int]]): List[Int] = xs match {
  case first :: others =>
    // flatten the tail first, then decide whether the head contributes
    val flatTail = my_flatten(others)
    first match {
      case Some(v) => v :: flatTail
      case None => flatTail
    }
  case Nil => Nil
}
58
93a2b6e4b84c updated
Christian Urban <urbanc@in.tum.de>
parents: 57
diff changeset
   377
319
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   378
my_flatten(List(None, Some(1), Some(2), None, Some(3)))
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   379
58
93a2b6e4b84c updated
Christian Urban <urbanc@in.tum.de>
parents: 57
diff changeset
   380
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   381
// another example with a default case
192
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   382
// Classifies n: 0, 1 and 2 are "small", every other Int (including
// negative numbers) falls through to the default case and is "big".
def get_me_a_string(n: Int): String = n match {
  case k if 0 <= k && k <= 2 => "small"
  case _ => "big"
}
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   386
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   387
get_me_a_string(0)
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   388
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   389
192
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   390
// you can also have cases combined
266
31e5218f43de updated to 2.13
Christian Urban <urbanc@in.tum.de>
parents: 212
diff changeset
   391
// Maps an English month name to a sentence about its season.
// Several month names share one case via the | alternative pattern.
// There is no default case: any other string raises a scala.MatchError.
def season(month: String) : String = month match {
  case "January" | "February" => "It's unfortunately winter"
  case "March" | "April" | "May" => "It's spring"
  case "June" | "July" | "August" => "It's summer"
  case "September" | "October" | "November" => "It's autumn"
  case "December" => "It's winter"
}
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   398
 
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   399
println(season("November"))
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   400
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   401
// What happens if no case matches?
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   402
println(season("foobar"))
192
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   403
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   404
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   405
// days of some months
266
31e5218f43de updated to 2.13
Christian Urban <urbanc@in.tum.de>
parents: 212
diff changeset
   406
// Number of days of some months: only March to August are covered,
// any other string raises a scala.MatchError.
// The months are grouped by their actual length (April and June have
// 30 days; March, May, July and August have 31).
def days(month: String) : Int = month match {
  case "March" | "May" | "July" | "August" => 31
  case "April" | "June" => 30
}
31e5218f43de updated to 2.13
Christian Urban <urbanc@in.tum.de>
parents: 212
diff changeset
   410
31e5218f43de updated to 2.13
Christian Urban <urbanc@in.tum.de>
parents: 212
diff changeset
   411
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   412
// Silly: fizz buzz
192
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   413
// Fizz buzz for a single number: "fizz buzz" if n is divisible by both
// 3 and 5, "fizz" if only by 3, "buzz" if only by 5, otherwise n itself
// rendered as a string. Note that 0 counts as divisible by both.
def fizz_buzz(n: Int) : String = {
  val byThree = n % 3 == 0
  val byFive = n % 5 == 0
  if (byThree && byFive) "fizz buzz"
  else if (byThree) "fizz"
  else if (byFive) "buzz"
  else n.toString
}
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   419
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   420
for (n <- 0 to 20) 
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   421
 println(fizz_buzz(n))
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   422
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   423
278
57b5bba67467 updated
Christian Urban <urbanc@in.tum.de>
parents: 268
diff changeset
   424
57b5bba67467 updated
Christian Urban <urbanc@in.tum.de>
parents: 268
diff changeset
   425
309
c5f16a86ae92 updated
Christian Urban <urbanc@in.tum.de>
parents: 278
diff changeset
   426
// Recursion
c5f16a86ae92 updated
Christian Urban <urbanc@in.tum.de>
parents: 278
diff changeset
   427
//===========
c5f16a86ae92 updated
Christian Urban <urbanc@in.tum.de>
parents: 278
diff changeset
   428
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   429
// well-known example
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   430
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   431
// Fibonacci numbers with fib(0) = fib(1) = 1, computed by the naive
// doubly-recursive definition. Only terminates for n >= 0.
def fib(n: Int) : Int = n match {
  case 0 | 1 => 1
  case _ => fib(n - 1) + fib(n - 2)
}
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   435
309
c5f16a86ae92 updated
Christian Urban <urbanc@in.tum.de>
parents: 278
diff changeset
   436
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   437
/* Say you have characters a, b, c.
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   438
   What are all the combinations of a certain length?
309
c5f16a86ae92 updated
Christian Urban <urbanc@in.tum.de>
parents: 278
diff changeset
   439
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   440
   All combinations of length 2:
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   441
  
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   442
     aa, ab, ac, ba, bb, bc, ca, cb, cc
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   443
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   444
   Combinations of length 3:
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   445
   
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   446
     aaa, baa, caa, and so on......
309
c5f16a86ae92 updated
Christian Urban <urbanc@in.tum.de>
parents: 278
diff changeset
   447
*/
c5f16a86ae92 updated
Christian Urban <urbanc@in.tum.de>
parents: 278
diff changeset
   448
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   449
// All strings of length l over the characters in cs.
// Length 0 has exactly one combination, the empty string; otherwise
// every character c is put in front of every combination of length l - 1.
def combs(cs: List[Char], l: Int) : List[String] = l match {
  case 0 => List("")
  case _ => cs.flatMap(c => combs(cs, l - 1).map(s => s"$c$s"))
}
c5f16a86ae92 updated
Christian Urban <urbanc@in.tum.de>
parents: 278
diff changeset
   453
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   454
combs("abc".toList, 2)
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   455
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   456
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   457
// another well-known example
309
c5f16a86ae92 updated
Christian Urban <urbanc@in.tum.de>
parents: 278
diff changeset
   458
c5f16a86ae92 updated
Christian Urban <urbanc@in.tum.de>
parents: 278
diff changeset
   459
// prints a single Towers-of-Hanoi instruction: move the top disc
// from the peg named from to the peg named to
def move(from: Char, to: Char) = {
  println(s"Move disc from $from to $to!")
}
c5f16a86ae92 updated
Christian Urban <urbanc@in.tum.de>
parents: 278
diff changeset
   461
c5f16a86ae92 updated
Christian Urban <urbanc@in.tum.de>
parents: 278
diff changeset
   462
// Towers of Hanoi: prints the moves that transfer n discs from peg from
// to peg to, using via as the spare peg. Nothing is printed for n == 0.
def hanoi(n: Int, from: Char, via: Char, to: Char) : Unit =
  if (n != 0) {
    // park the n - 1 smaller discs on the spare peg ...
    hanoi(n - 1, from, to, via)
    // ... move the largest disc to its destination ...
    move(from, to)
    // ... and bring the smaller discs over on top of it
    hanoi(n - 1, via, from, to)
  }
c5f16a86ae92 updated
Christian Urban <urbanc@in.tum.de>
parents: 278
diff changeset
   470
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   471
hanoi(4, 'A', 'B', 'C')
147
3e5d8657302f updated
Christian Urban <urbanc@in.tum.de>
parents: 95
diff changeset
   472
3e5d8657302f updated
Christian Urban <urbanc@in.tum.de>
parents: 95
diff changeset
   473
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   474
// A Recursive Web Crawler / Email Harvester
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   475
//===========================================
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   476
//
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   477
// the idea is to look for links using the
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   478
// regular expression "https?://[^"]*" and for
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   479
// email addresses using another regex.
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   480
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   481
import io.Source
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   482
import scala.util._
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   483
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   484
// gets the first 10K of a web-page
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   485
// Downloads a web page, decoded as ISO-8859-1, and returns at most its
// first 10000 characters. If anything goes wrong (malformed URL, network
// error, ...) the problem is reported on stdout and "" is returned.
// Using makes sure the underlying Source is closed again, both after a
// successful read and after a failure.
def get_page(url: String) : String = {
  Using(Source.fromURL(url)("ISO-8859-1"))(_.take(10000).mkString).
    getOrElse { println(s"  Problem with: $url"); "" }
}
3e5d8657302f updated
Christian Urban <urbanc@in.tum.de>
parents: 95
diff changeset
   489
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   490
// regex for URLs and emails
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   491
val http_pattern = """"https?://[^"]*"""".r
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   492
val email_pattern = """([a-z0-9_\.-]+)@([\da-z\.-]+)\.([a-z\.]{2,6})""".r
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   493
268
d20583497c5b updated
Christian Urban <urbanc@in.tum.de>
parents: 266
diff changeset
   494
//test case:
212
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   495
//email_pattern.findAllIn
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   496
//  ("foo bla christian@kcl.ac.uk 1234567").toList
c86e40fb3b21 updated
Christian Urban <urbanc@in.tum.de>
parents: 204
diff changeset
   497
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   498
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   499
// drops the first and last character from a string
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   500
// cuts one character off each end of s (used to strip the quotes around
// a matched link); strings with fewer than two characters become ""
def unquote(s: String) = s.slice(1, s.length - 1)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   501
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   502
// Collects every match of http_pattern in page, strips the first and
// last character of each match with unquote, and returns the results
// as a set (so duplicates collapse).
def get_all_URLs(page: String): Set[String] = {
  val links = for (m <- http_pattern.findAllIn(page)) yield unquote(m)
  links.toSet
}
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   504
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   505
// naive version of crawl - searches until a given depth,
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   506
// visits pages potentially more than once
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   507
// Naive crawler: announces the visit to url, fetches the page and
// recursively crawls every link found on it with the depth budget n
// reduced by one. Stops when the budget reaches 0. Pages reachable via
// several paths are visited (and fetched) more than once.
def crawl(url: String, n: Int) : Unit =
  if (n != 0) {
    println(s"  Visiting: $n $url")
    get_all_URLs(get_page(url)).foreach(link => crawl(link, n - 1))
  }
3e5d8657302f updated
Christian Urban <urbanc@in.tum.de>
parents: 95
diff changeset
   514
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   515
// some starting URLs for the crawler
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   516
val startURL = """https://nms.kcl.ac.uk/christian.urban/"""
147
3e5d8657302f updated
Christian Urban <urbanc@in.tum.de>
parents: 95
diff changeset
   517
204
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   518
crawl(startURL, 2)
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   519
1b04ea68dca6 updated
Christian Urban <urbanc@in.tum.de>
parents: 192
diff changeset
   520
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   521
// a primitive email harvester
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   522
// Primitive email harvester: returns all matches of email_pattern on the
// page at url, together with those harvested recursively from every link
// on that page with the depth budget n reduced by one.
// A budget of 0 yields the empty set without fetching anything.
def emails(url: String, n: Int) : Set[String] = n match {
  case 0 => Set()
  case _ =>
    println(s"  Visiting: $n $url")
    val page = get_page(url)
    val found = email_pattern.findAllIn(page).toSet
    val deeper = get_all_URLs(page).flatMap(link => emails(link, n - 1))
    found ++ deeper
}
55
6610c1dfa8a9 updated
Christian Urban <urbanc@in.tum.de>
parents: 53
diff changeset
   531
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   532
emails(startURL, 3)
55
6610c1dfa8a9 updated
Christian Urban <urbanc@in.tum.de>
parents: 53
diff changeset
   533
6610c1dfa8a9 updated
Christian Urban <urbanc@in.tum.de>
parents: 53
diff changeset
   534
318
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   535
// if we want to explore the internet "deeper", then we
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   536
// first have to parallelise the request of webpages:
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   537
//
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   538
// scala -cp scala-parallel-collections_2.13-0.2.0.jar 
f1215a72cd88 updated
Christian Urban <urbanc@in.tum.de>
parents: 317
diff changeset
   539
// import scala.collection.parallel.CollectionConverters._
55
6610c1dfa8a9 updated
Christian Urban <urbanc@in.tum.de>
parents: 53
diff changeset
   540
53
9f8751912560 updated
Christian Urban <urbanc@in.tum.de>
parents: 51
diff changeset
   541
9f8751912560 updated
Christian Urban <urbanc@in.tum.de>
parents: 51
diff changeset
   542
9f8751912560 updated
Christian Urban <urbanc@in.tum.de>
parents: 51
diff changeset
   543
192
cd2a9c969ef2 updated
Christian Urban <urbanc@in.tum.de>
parents: 174
diff changeset
   544
319
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   545
// Jumping Towers
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   546
//================
278
57b5bba67467 updated
Christian Urban <urbanc@in.tum.de>
parents: 268
diff changeset
   547
319
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   548
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   549
// Returns xs itself followed by its successive tails, at most n lists in
// total and never the empty list. Gives Nil when xs is empty or n is 0.
def moves(xs: List[Int], n: Int) : List[List[Int]] =
  if (xs.isEmpty || n == 0) Nil
  else xs :: moves(xs.tail, n - 1)
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   554
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   555
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   556
moves(List(5,1,0), 1)
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   557
moves(List(5,1,0), 2)
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   558
moves(List(5,1,0), 5)
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   559
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   560
// checks whether a jump tour exists at all
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   561
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   562
// Decides whether a jump tour exists for xs. Standing on a tower of height
// x allows a jump of 1 up to x positions forward; the tour is complete as
// soon as a jump leads beyond the last tower. The empty list counts as
// solved.
def search(xs: List[Int]) : Boolean = xs match {
  case Nil => true
  case height :: rest =>
    // lengthCompare inspects at most `height` cells, whereas rest.length
    // would walk the whole remaining list at every step of the search
    if (rest.lengthCompare(height) < 0) true
    else moves(rest, height).exists(search)
}
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   567
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   568
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   569
// example calls; the expected result is given after each call
search(List(5,3,2,5,1,1))   // true
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   570
search(List(3,5,1,0,0,0,1))   // true
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   571
search(List(3,5,1,0,0,0,0,1))   // false: the 5 only reaches up to a 0
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   572
search(List(3,5,1,0,0,0,1,1))   // true
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   573
search(List(3,5,1))   // true
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   574
search(List(5,1,1))   // true
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   575
search(Nil)   // true
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   576
search(List(1))   // true
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   577
search(List(5,1,1))   // true (same input as above)
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   578
search(List(3,5,1,0,0,0,0,0,0,0,0,1))   // false
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   579
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   580
// generate *all* jump tours
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   581
//    if we are only interested in the shortest one, we could
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   582
//    short-circuit the calculation and only return List(x) in
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   583
//    the case where xs.length < x, because no tour can be shorter
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   584
//    than 1
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   585
// 
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   586
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   587
// Generates all jump tours of xs. A tour is the list of tower heights that
// are visited, beginning with the first tower and ending with the tower
// from which the jump beyond the end of the list is made. The result is
// Nil if no tour exists, which includes the empty list.
def jumps(xs: List[Int]) : List[List[Int]] = xs match {
  case Nil => Nil
  case height :: rest => {
    // tours that continue via one of the towers reachable from this one
    val viaNext = moves(rest, height).flatMap(next => jumps(next).map(height :: _))
    // if this tower alone reaches beyond the end, List(height) is a tour too;
    // lengthCompare avoids walking all of rest just to compare its length
    if (rest.lengthCompare(height) < 0) List(height) :: viaNext else viaNext
  }
}
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   595
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   596
// example calls; the expected result (or its size) is given after each call
jumps(List(3,5,1,2,1,2,1))   // 21 tours
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   597
jumps(List(3,5,1,2,3,4,1))   // 31 tours
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   598
jumps(List(3,5,1,0,0,0,1))   // List(List(3, 5, 1))
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   599
jumps(List(3,5,1))   // List(List(3), List(3, 5), List(3, 5, 1), List(3, 1))
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   600
jumps(List(5,1,1))   // List(List(5), List(5, 1, 1), List(5, 1))
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   601
jumps(Nil)   // List()
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   602
jumps(List(1))   // List(List(1))
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   603
jumps(List(5,1,2))   // List(List(5), List(5, 1, 2), List(5, 2))
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   604
moves(List(1,2), 5)   // List(List(1, 2), List(2))
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   605
jumps(List(1,5,1,2))   // List(List(1, 5), List(1, 5, 1, 2), List(1, 5, 2))
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   606
jumps(List(3,5,1,0,0,0,0,0,0,0,0,1))   // List(): no tour exists
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   607
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   608
// shortest tours; minBy throws on an empty list, so these calls rely on
// every input below having at least one tour
jumps(List(5,3,2,5,1,1)).minBy(_.length)   // List(5, 5)
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   609
jumps(List(1,3,5,8,9,2,6,7,6,8,9)).minBy(_.length)   // List(1, 3, 8)
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   610
jumps(List(1,3,6,1,0,9)).minBy(_.length)   // List(1, 3, 6)
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   611
jumps(List(2,3,1,1,2,4,2,0,1,1)).minBy(_.length)   // List(2, 3, 2, 4, 1)
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   612
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   613
ed7543c5d317 updated
Christian Urban <urbanc@in.tum.de>
parents: 318
diff changeset
   614