// Part 2 about Alcohol-Consumption Worldwide
//============================================

object CW6b {

  import scala.io.Source
  import scala.util._

  val url_alcohol =
    "https://raw.githubusercontent.com/fivethirtyeight/data/master/alcohol-consumption/drinks.csv"

  val file_population =
    "population.csv"


  // Reads the whole source, splits it into lines on "\n" and always closes
  // the underlying stream/file handle, even if reading fails.
  private def read_lines(source: Source) : List[String] =
    try source.mkString.split("\n").toList
    finally source.close()

  // Turns csv-lines into rows of fields: the first line (the header) is
  // dropped, surrounding whitespace (including a trailing "\r" left over from
  // CRLF line endings) is removed, blank rows are skipped, and the rest is
  // split on ",". Quoted fields containing commas are not supported.
  private def data_rows(lines: List[String]) : List[List[String]] =
    lines.drop(1).map(_.trim).filter(_.nonEmpty).map(_.split(",").toList)

  // Returns the field at the given column, or "" if the row is too short
  // (so that a later toDouble/toLong fails with a NumberFormatException).
  private def field(fields: List[String], index: Int) : String =
    fields.lift(index).getOrElse("")


  //(1) The get_csv_page function takes a URL-string as argument and
  //    generates a list of strings corresponding to each line in the
  //    downloaded csv-list. The URL url_alcohol above is one possible
  //    argument.

  def get_csv_page(url: String) : List[String] =
    read_lines(Source.fromURL(url))

  //    The get_csv_file function takes a file name as argument and reads
  //    the content of the given file. Like above, it generates a list of
  //    strings corresponding to each line in the csv-list. The filename
  //    file_population is one possible argument.

  def get_csv_file(file: String) : List[String] =
    read_lines(Source.fromFile(file))


  //(2) The functions that process the csv-lists. process_alcs extracts
  //    the country name (as String, first column) and the pure alcohol
  //    consumption (as Double, fifth column). process_pops generates a Map
  //    of Strings (country names, first column) to Long numbers
  //    (population sizes, second column).
  //
  //    In both functions the header line is dropped and blank lines are
  //    ignored; a non-blank line whose numeric column is missing or not a
  //    number raises a NumberFormatException.

  def process_alcs(lines: List[String]) : List[(String, Double)] =
    for (fields <- data_rows(lines))
      yield (field(fields, 0), field(fields, 4).toDouble)

  def process_pops(lines: List[String]) : Map[String, Long] =
    data_rows(lines)
      .map(fields => (field(fields, 0), field(fields, 1).toLong))
      .toMap


  //(3) Calculates for each country the overall alcohol consumption using
  //    the data from the alcohol list and the population sizes list. Only
  //    countries on the alcohol list that are also on the population sizes
  //    list with the exact same name are included; entries where the
  //    spelling of the names differs are ignored. The resulting list is
  //    sorted from the country with the highest alcohol consumption to the
  //    country with the lowest alcohol consumption.

  def sorted_country_consumption() : List[(String, Long)] = {
    val populations = process_pops(get_csv_file(file_population))
    val alcohol = process_alcs(get_csv_page(url_alcohol))
    val consumption = alcohol.flatMap { case (country, litres) =>
      // countries without a population entry yield None and are dropped
      populations.get(country).map(people => (country, (litres * people).toLong))
    }
    // stable descending sort: ties keep their order from the alcohol list
    consumption.sortWith(_._2 > _._2)
  }

  //    Calculates the world consumption of pure alcohol of all countries,
  //    which is the first element in the tuple below. The second element is
  //    the overall consumption of the first n countries in the sorted list
  //    from above; and finally the double is the percentage of the first n
  //    countries drinking from the world consumption of alcohol (0.0 if the
  //    world consumption is 0, to avoid a NaN result).

  def percentage(n: Int) : (Long, Long, Double) = {
    val amounts = sorted_country_consumption().map(_._2)
    val total = amounts.sum
    val first_n = amounts.take(n).sum
    val share = if (total == 0L) 0.0 else (first_n * 1.0 / total) * 100
    (total, first_n, share)
  }
}