handouts/ho06.tex
author cu
Sun, 15 Oct 2017 21:23:16 +0100
changeset 550 58c3536c5a08
parent 534 62985f147c85
child 557 192d01998ebd
permissions -rw-r--r--
updated
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
     1
\documentclass{article}
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
     2
\usepackage{../style}
314
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
     3
\usepackage{../graphics}
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
     4
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
     5
\begin{document}
495
f5172bb6cf45 updated
Christian Urban <urbanc@in.tum.de>
parents: 480
diff changeset
     6
\fnote{\copyright{} Christian Urban, King's College London, 2014, 2015}
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
     7
467
da4896f201b5 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 462
diff changeset
     8
%https://www.theguardian.com/technology/2016/oct/04/yahoo-secret-email-program-nsa-fbi
429
ff053e2766e8 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 423
diff changeset
     9
%https://nakedsecurity.sophos.com/2015/11/12/california-collects-owns-and-sells-infants-dna-samples/
431
4b53f83c070c updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 429
diff changeset
    10
%http://randomwalker.info/teaching/fall-2012-privacy-technologies/?
4b53f83c070c updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 429
diff changeset
    11
%https://josephhall.org/papers/NYU-MCC-1303-S2012_privacy_syllabus.pdf
4b53f83c070c updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 429
diff changeset
    12
%http://www.jetlaw.org/wp-content/uploads/2014/06/Bambauer_Final.pdf
4b53f83c070c updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 429
diff changeset
    13
%http://www.cs.cmu.edu/~yuxiangw/docs/Differential%20Privacy.pdf
4b53f83c070c updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 429
diff changeset
    14
%https://www.youtube.com/watch?v=Gx13lgEudtU
4b53f83c070c updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 429
diff changeset
    15
%https://fpf.org/wp-content/uploads/Differential-Privacy-as-a-Response-to-the-Reidentification-Threat-Klinefelter-and-Chin.pdf
442
cceb3d2dcba0 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 431
diff changeset
    16
%http://research.neustar.biz/2014/09/08/differential-privacy-the-basics/
429
ff053e2766e8 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 423
diff changeset
    17
443
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    18
%=====
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    19
%Tim Greene, Network World, 17 Dec 2015   (via ACM TechNews, 18 Dec 2015)
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    20
%
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    21
%Massachusetts Institute of Technology (MIT) researchers' experimental
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    22
%Vuvuzela messaging system offers more privacy than The Onion Router (Tor) by
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    23
%rendering text messages sent through it untraceable.  MIT Ph.D. student
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    24
%David Lazar says Vuvuzela resists traffic analysis attacks, while Tor
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    25
%cannot.  The researchers say the system functions no matter how many parties
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    26
%are using it to communicate, and it employs encryption and a set of servers
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    27
%to conceal whether or not parties are participating in text-based dialogues.
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    28
%"Vuvuzela prevents an adversary from learning which pairs of users are
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    29
%communicating, as long as just one out of [the] servers is not compromised,
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    30
%even for users who continue to use Vuvuzela for years," they note.  Vuvuzela
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    31
%can support millions of users hosted on commodity servers deployed by a
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    32
%single group of users.  Instead of anonymizing users, Vuvuzela prevents
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    33
%outside observers from differentiating between people sending messages,
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    34
%receiving messages, or neither, according to Lazar.  The system imposes
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    35
%noise on the client-server traffic which cannot be distinguished from actual
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    36
%messages, and all communications are triple-wrapped in encryption by three
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    37
%servers.  "Vuvuzela guarantees privacy as long as one of the servers is
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    38
%uncompromised, so using more servers increases security at the cost of
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    39
%increased message latency," Lazar notes.
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    40
%http://orange.hosting.lsoft.com/trk/click?ref=znwrbbrs9_5-e70bx2d991x066779&
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    41
456
f65e4fa6e902 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 450
diff changeset
    42
%%%%
f65e4fa6e902 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 450
diff changeset
    43
%% canvas tracking
f65e4fa6e902 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 450
diff changeset
    44
%%https://freedom-to-tinker.com/blog/englehardt/the-princeton-web-census-a-1-million-site-measurement-and-analysis-of-web-privacy/
443
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    45
456
f65e4fa6e902 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 450
diff changeset
    46
%%%
f65e4fa6e902 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 450
diff changeset
    47
%% cupit re-identification attack
f65e4fa6e902 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 450
diff changeset
    48
%% https://nakedsecurity.sophos.com/2016/05/20/published-personal-data-on-70000-okcupid-users-taken-down-after-dmca-order/?utm_source=feedburner&utm_medium=feed&utm_campaign=Feed%3A+nakedsecurity+%28Naked+Security+-+Sophos%29
443
67d7d239c617 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 442
diff changeset
    49
457
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    50
%Differential privacy
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    51
%=====================
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    52
%https://www.wired.com/2016/06/apples-differential-privacy-collecting-data/
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    53
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    54
%Differential privacy, translated from Apple-speak, is the
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    55
%statistical science of trying to learn as much as possible
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    56
%about a group while learning as little as possible about any
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    57
%individual in it.
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    58
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    59
%As Roth notes when he refers to a “mathematical proof,”
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    60
%differential privacy doesn’t merely try to obfuscate or
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    61
%“anonymize” users’ data. That anonymization approach, he
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    62
%argues, tends to fail. In 2007, for instance, Netflix released
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    63
%a large collection of its viewers’ film ratings as part of a
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    64
%competition to optimize its recommendations, removing people’s
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    65
%names and other identifying details and publishing only their
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    66
%Netflix ratings. But researchers soon cross-referenced the
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    67
%Netflix data with public review data on IMDB to match up
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    68
%similar patterns of recommendations between the sites and add
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    69
%names back into Netflix’s supposedly anonymous database.
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    70
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    71
%As an example of that last method, Microsoft’s Dwork points to
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    72
%the technique in which a survey asks if the respondent has
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    73
%ever, say, broken a law. But first, the survey asks them to
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    74
%flip a coin. If the result is tails, they should answer
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    75
%honestly. If the result is heads, they’re instructed to flip
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    76
%the coin again and then answer “yes” for heads or “no” for
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    77
%tails. The resulting random noise can be subtracted from the
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    78
%results with a bit of algebra, and every respondent is
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    79
%protected from punishment if they admitted to lawbreaking.
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    80
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    81
%https://www.cis.upenn.edu/~aaroth/Papers/privacybook.pdf
38ef1ef6082d updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 456
diff changeset
    82
462
33dcbafb27ce updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 457
diff changeset
    83
% Windows 10 data send back to Microsoft (Cortana)
33dcbafb27ce updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 457
diff changeset
    84
%Here’s a non-exhaustive list of data sent back: location data, text
33dcbafb27ce updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 457
diff changeset
    85
%input, voice input, touch input, webpages you visit, and telemetry
33dcbafb27ce updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 457
diff changeset
    86
%data regarding your general usage of your computer, including which
33dcbafb27ce updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 457
diff changeset
    87
%programs you run and for how long.
33dcbafb27ce updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 457
diff changeset
    88
500
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
    89
% Businesses are already using customised pricing online based on
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
    90
% information they can glean about you. It is hard to know how
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
    91
% widespread the practice is; companies keep their pricing strategies
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
    92
% closely guarded and are wary of the bad PR price discrimination
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
    93
% could pose. However, it is clear that a number of large retailers
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
    94
% are experimenting with it. Staples, for example, has offered
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
    95
% discounted prices based on whether rival stores are within 20 miles
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
    96
% of its customers’ location. Office Depot has admitted to using its
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
    97
% customers’ browsing history and location to vary its range of offers
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
    98
% and products. A 2014 study from Northeastern University found
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
    99
% evidence of “steering” or differential pricing at four out of 10
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
   100
% general merchandise websites and five out of five travel
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
   101
% websites. (Steering is when a company doesn’t give you a customised
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
   102
% price, but points you towards more expensive options if it thinks
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
   103
% you will pay more.) The online travel company Orbitz raised
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
   104
% headlines in 2012 when it emerged that the firm was pointing Mac
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
   105
% users towards higher-priced hotel rooms than PC users.
b03becc049e6 updated
Christian Urban <urbanc@in.tum.de>
parents: 495
diff changeset
   106
501
0d40d1f973e0 updated
Christian Urban <urbanc@in.tum.de>
parents: 500
diff changeset
   107
0d40d1f973e0 updated
Christian Urban <urbanc@in.tum.de>
parents: 500
diff changeset
   108
%%% government will overwrite your wishes if it is annoymous
0d40d1f973e0 updated
Christian Urban <urbanc@in.tum.de>
parents: 500
diff changeset
   109
%% https://www.lightbluetouchpaper.org/2016/12/05/government-u-turn-on-health-privacy/
0d40d1f973e0 updated
Christian Urban <urbanc@in.tum.de>
parents: 500
diff changeset
   110
510
51267a687b85 updated test
Christian Urban <urbanc@in.tum.de>
parents: 501
diff changeset
   111
%% corporate surveilance / privacy - report and CC3C talk
51267a687b85 updated test
Christian Urban <urbanc@in.tum.de>
parents: 501
diff changeset
   112
%%      http://crackedlabs.org/en/networksofcontrol
51267a687b85 updated test
Christian Urban <urbanc@in.tum.de>
parents: 501
diff changeset
   113
%%      https://media.ccc.de/v/33c3-8414-corporate_surveillance_digital_tracking_big_data_privacy#video&t=2933
51267a687b85 updated test
Christian Urban <urbanc@in.tum.de>
parents: 501
diff changeset
   114
480
ab31912a3b65 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 467
diff changeset
   115
\section*{Handout 6 (Privacy)}
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   116
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   117
The first motor car was invented around 1886. For ten years,
314
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   118
until 1896, the law in the UK (and elsewhere) required a
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   119
person to walk in front of any moving car waving a red flag.
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   120
Cars were such a novelty that most people did not know what to
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   121
make of them. The person with the red flag was intended to
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   122
warn the public, for example horse owners, about the impending
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   123
novelty---a car. In my humble opinion, we are at the same
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   124
stage of development with privacy. Nobody really knows what it
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   125
is about or what it is good for. All seems very hazy. There
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   126
are a few laws (e.g.~cookie law, right-to-be-forgotten law)
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   127
which address problems with privacy, but even if they are well
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   128
intentioned, they either back-fire or are already obsolete
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   129
because of newer technologies. The result is that the world of
314
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   130
``privacy'' looks a little bit like the old Wild
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   131
West---lawless and mythical.
309
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   132
449
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   133
We would have hoped that after Snowden, Western governments
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   134
would be a bit more sensitive and enlightned about the topic
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   135
of privacy, but this is far from the truth. Ross Anderson
450
f3d5e57ca00a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 449
diff changeset
   136
wrote the following in his blog\footnote{\url{https://www.lightbluetouchpaper.org/2016/02/11/report-on-the-ip-bill/}} about the approach taken in
449
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   137
the US to lessons learned from the Snowden leaks and contrasts
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   138
this with the new snooping bill that is considered in the UK
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   139
parliament: 
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   140
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   141
\begin{quote}\it 
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   142
``The comparison with the USA is stark. There, all three
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   143
branches of government realised they'd gone too far after
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   144
Snowden. President Obama set up the NSA review group, and
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   145
implemented most of its recommendations by executive order;
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   146
the judiciary made changes to the procedures of the FISA
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   147
Court; and Congress failed to renew the data retention
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   148
provisions in the Patriot Act (aided by the judiciary). Yet
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   149
here in Britain the response is just to take Henry VIII powers
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   150
to legalise all the illegal things that GCHQ had been up to,
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   151
and hope that the European courts won't strike the law down
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   152
yet again.''
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   153
\end{quote}
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   154
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   155
\noindent Unfortunately, also big organisations besides
7ecbf5339d0f updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 448
diff changeset
   156
governments seem to take an unenlightened approach to privacy.
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   157
For example, UCAS, a charity set up to help students with
448
48d0a9890adc updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 444
diff changeset
   158
applying to universities in the UK, has a commercial unit that
48d0a9890adc updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 444
diff changeset
   159
happily sells your email addresses to anybody who forks out
48d0a9890adc updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 444
diff changeset
   160
enough money for bombarding you with spam. Yes, you can opt
48d0a9890adc updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 444
diff changeset
   161
out very often from such ``schemes'', but in case of UCAS any
48d0a9890adc updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 444
diff changeset
   162
opt-out will limit also legit emails you might actually be
48d0a9890adc updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 444
diff changeset
   163
interested in.\footnote{The main objectionable point, in my
48d0a9890adc updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 444
diff changeset
   164
opinion, is that the \emph{charity} everybody has to use for
48d0a9890adc updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 444
diff changeset
   165
HE applications has actually very honourable goals
48d0a9890adc updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 444
diff changeset
   166
(e.g.~assist applicants in gaining access to universities),
48d0a9890adc updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 444
diff changeset
   167
but the small print (or better the link ``About us'') reveals
48d0a9890adc updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 444
diff changeset
   168
they set up their organisation so that they can also
48d0a9890adc updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 444
diff changeset
   169
shamelessly sell the email addresses they ``harvest''.
48d0a9890adc updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 444
diff changeset
   170
Everything is of course very legal\ldots{}ethical?\ldots{}well
48d0a9890adc updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 444
diff changeset
   171
that is in the eye of the beholder. See:
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   172
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   173
\url{http://www.ucas.com/about-us/inside-ucas/advertising-opportunities} 
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   174
or
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   175
\url{http://www.theguardian.com/uk-news/2014/mar/12/ucas-sells-marketing-access-student-data-advertisers}}
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   176
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   177
Another example: Verizon, an ISP who is supposed to provide
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   178
you just with connectivity, has found a ``nice'' side-business
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   179
too: When you have enabled all privacy guards in your browser
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   180
(the few you have at your disposal), Verizon happily adds a
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   181
kind of cookie to your
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   182
HTTP-requests.\footnote{\url{http://webpolicy.org/2014/10/24/how-verizons-advertising-header-works/}}
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   183
As shown in the picture below, this cookie will be sent to
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   184
every web-site you visit. The web-sites then can forward the
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   185
cookie to advertisers who in turn pay Verizon to tell them
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   186
everything they want to know about the person who just made
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   187
this request, that is you.
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   188
 
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   189
\begin{center}
366
34a8f73b2c94 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 325
diff changeset
   190
\includegraphics[scale=0.16]{../pics/verizon.png}
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   191
\end{center}
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   192
314
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   193
\noindent How disgusting! Even worse, Verizon is not known for
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   194
being the cheapest ISP on the planet (completely the
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   195
contrary), and also not known for providing the fastest
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   196
possible speeds, but rather for being among the few ISPs in
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   197
the US with a quasi-monopolistic ``market distribution''.
310
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   198
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   199
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   200
Well, we could go on and on\ldots{}and that has not even
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   201
started us yet with all the naughty things NSA \& Friends are
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   202
up to. Why does privacy actually matter? Nobody, I think, has
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   203
a conclusive answer to this question yet. Maybe the following
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   204
four notions help with clarifying the overall picture
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   205
somewhat: 
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   206
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   207
\begin{itemize}
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   208
\item \textbf{Secrecy} is the mechanism used to limit the
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   209
      number of principals with access to information (e.g.,
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   210
      cryptography or access controls). For example I better
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   211
      keep my password secret, otherwise people from the wrong
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   212
      side of the law might impersonate me.
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   213
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   214
\item \textbf{Confidentiality} is the obligation to protect
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   215
      the secrets of other people or organisations (secrecy
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   216
      for the benefit of an organisation). For example as a
308
2a814c06ae03 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 307
diff changeset
   217
      staff member at King's I have access to data, even
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   218
      private data, I am allowed to use in my work but not
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   219
      allowed to disclose to anyone else.
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   220
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   221
\item \textbf{Anonymity} is the ability to leave no evidence of
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   222
      an activity (e.g., sharing a secret). This is not equal
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   223
        with privacy---anonymity is required in many 
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   224
        circumstances, for example for whistle-blowers, 
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   225
        voting, exam marking and so on.
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   226
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   227
\item \textbf{Privacy} is the ability or right to protect your
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   228
      personal secrets (secrecy for the benefit of an
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   229
      individual). For example, in a job interview, I might
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   230
      not like to disclose that I am pregnant, if I were a
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   231
      woman, or that I am a father. Lest they might not hire
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   232
      me. Similarly, I might not like to disclose my location
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   233
      data, because thieves might break into my house if they
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   234
      know I am away at work. Privacy is essentially
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   235
      everything which ``shouldn't be anybody's business''.
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   236
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   237
\end{itemize}
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   238
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   239
\noindent While this might provide us with some rough
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   240
definitions, the problem with privacy is that it is an
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   241
extremely fine line what should stay private and what should
310
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   242
not. For example, since I am working in academia, I am every
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   243
so often very happy to be a digital exhibitionist: I am very
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   244
happy to disclose all `trivia' related to my work on my
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   245
personal web-page. This is a kind of bragging that is normal
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   246
in academia (at least in the field of CS), even expected if
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   247
you look for a job. I am even happy that Google maintains a
309
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   248
profile about all my academic papers and their citations. 
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   249
309
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   250
On the other hand I would be very irritated if anybody I do
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   251
not know had a too close look on my private live---it
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   252
shouldn't be anybody's business. The reason is that knowledge
423
11b46fa92a85 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 366
diff changeset
   253
about my private life can often be used against me. As mentioned
309
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   254
above, public location data might mean I get robbed. If
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   255
supermarkets build a profile of my shopping habits, they will
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   256
use it to \emph{their} advantage---surely not to \emph{my}
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   257
advantage. Also whatever might be collected about my life will
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   258
always be an incomplete, or even misleading, picture. For
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   259
example I am pretty sure my creditworthiness score was
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   260
temporarily(?) destroyed by not having a regular income in
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   261
this country (before coming to King's I worked in Munich for
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   262
five years). To correct such incomplete or flawed credit
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   263
history data there is, since recently, a law that allows you
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   264
to check what information is held about you for determining
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   265
your creditworthiness. But this concerns only a very small
423
11b46fa92a85 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 366
diff changeset
   266
part of the data that is held about me/you. Also
11b46fa92a85 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 366
diff changeset
   267
what about cases where data is wrong or outdated (but do we
11b46fa92a85 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 366
diff changeset
   268
need a right-to be forgotten).
11b46fa92a85 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 366
diff changeset
   269
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   270
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   271
To see how private matter can lead really to the wrong
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   272
conclusions, take the example of Stephen Hawking: When he was
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   273
diagnosed with his disease, he was given a life expectancy of
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   274
two years. If employers would know about such problems, would
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   275
they have employed Hawking? Now, he is enjoying his 70+
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   276
birthday. Clearly personal medical data needs to stay private.
310
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   277
309
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   278
To cut a long story short, I let you ponder about the two
314
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   279
statements which are often voiced in discussions about privacy:
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   280
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   281
\begin{itemize}
314
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   282
\item \textit{``You have zero privacy anyway. Get over 
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   283
it.''}\\
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   284
\mbox{}\hfill{}{\small{}(by Scott Mcnealy, former CEO of Sun)}
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   285
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   286
\item \textit{``If you have nothing to hide, you have nothing 
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   287
to fear.''}
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   288
\end{itemize}
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   289
 
314
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   290
\noindent If you like to watch a movie which has this topic as
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   291
its main focus I recommend \emph{Gattaca} from
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   292
1997.\footnote{\url{http://www.imdb.com/title/tt0119177/}} If
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   293
you want to read up on this topic, I can recommend the
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   294
following article that appeared in 2011 in the Chronicle of
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   295
Higher Education:
309
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   296
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   297
\begin{center} 
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   298
\url{http://chronicle.com/article/Why-Privacy-Matters-Even-if/127461/} 
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   299
\end{center} 
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   300
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   301
\noindent Funnily, or maybe not so funnily, the author of this
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   302
article carefully tries to construct an argument that does not
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   303
only attack the nothing-to-hide statement in cases where
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   304
governments \& co collect people's deepest secrets, or
309
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   305
pictures of people's naked bodies, but an argument that
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   306
applies also in cases where governments ``only'' collect data
310
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   307
relevant to, say, preventing terrorism. The fun is of course
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   308
that in 2011 we could just not imagine that respected
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   309
governments would do such infantile things as intercepting
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   310
people's nude photos. Well, since Snowden we know some people
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   311
at the NSA did exactly that and then shared such photos among
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   312
colleagues as ``fringe benefit''.  
309
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   313
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   314
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   315
\subsubsection*{Re-Identification Attacks} 
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   316
310
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   317
Apart from philosophical musings, there are fortunately also
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   318
some real technical problems with privacy. The problem I want
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   319
to focus on in this handout is how to safely disclose datasets
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   320
containing potentially very private data, say health records.
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   321
What can go wrong with such disclosures can be illustrated
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   322
with four well-known examples:
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   323
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   324
\begin{itemize}
309
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   325
\item In 2006, a then young company called Netflix offered a 1
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   326
      Mio \$ prize to anybody who could improve their movie
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   327
      rating algorithm. For this they disclosed a dataset
309
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   328
      containing 10\% of all Netflix users at the time
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   329
      (appr.~500K). They removed names, but included numerical
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   330
      ratings of movies as well as times when ratings were
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   331
      uploaded. Though some information was perturbed (i.e.,
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   332
      slightly modified).
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   333
      
309
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   334
      Two researchers had a closer look at this anonymised
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   335
      data and compared it with public data available from the
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   336
      International Movie Database (IMDb). They found that
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   337
      98\% of the entries could be re-identified in the
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   338
      Netflix dataset: either by their ratings or by the dates
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   339
      the ratings were uploaded. The result was a class-action
309
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   340
      suit against Netflix, which was only recently resolved
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   341
      involving a lot of money.
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   342
310
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   343
\item In the 1990ies, medical datasets were often made public
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   344
      for research purposes. This was done in anonymised form
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   345
      with names removed, but birth dates, gender and ZIP-code
310
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   346
      were retained. In one case where such data about
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   347
      hospital visits of state employees in Massachusetts was
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   348
      made public, the then governor assured the public that
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   349
      the released dataset protected patient privacy by
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   350
      deleting identifiers. 
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   351
      
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   352
      A graduate student could not resist cross-referencing
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   353
      public voter data with the released data that still
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   354
      included birth dates, gender and ZIP-code. The result
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   355
      was that she could send the governor his own hospital
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   356
      record. It turns out that birth dates, gender and
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   357
      ZIP-code uniquely identify 87\% of people in the US.
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   358
      This work resulted in a number of laws prescribing which
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   359
      private data cannot be released in such datasets.
309
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   360
 
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   361
\item In 2006, AOL published 20 million Web search queries
310
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   362
      collected from 650,000 users (names had been deleted).
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   363
      This was again done for research purposes. However,
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   364
      within days an old lady, Thelma Arnold, from Lilburn,
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   365
      Georgia, (11,596 inhabitants) was identified as user
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   366
      No.~4417749 in this dataset. It turned out that search
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   367
      engine queries are deep windows into people's private
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   368
      lives. 
309
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   369
  
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   370
\item Genome-Wide Association Studies (GWAS) was a public
309
b1ba3d88696e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 308
diff changeset
   371
      database of gene-frequency studies linked to diseases.
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   372
      It would essentially record that people who have a
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   373
      disease, say diabetes, have also certain genes. In order
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   374
      to maintain privacy, the dataset would only include
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   375
      aggregate information. In case of DNA data this
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   376
      aggregation was achieved by mixing the DNA of many
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   377
      individuals (having a disease) into a single solution.
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   378
      Then this mixture was sequenced and included in the
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   379
      dataset. The idea was that the aggregate information
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   380
      would still be helpful to researchers, but would protect
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   381
      the DNA data of individuals. 
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   382
       
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   383
      In 2007 a forensic computer scientist showed that
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   384
      individuals can still be identified. For this he used
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   385
      the DNA data from a comparison group (people from the
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   386
      general public) and ``subtracted'' this data from the
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   387
      published data. He was left with data that included all
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   388
      ``special'' DNA-markers of the individuals present in
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   389
      the original mixture. He essentially deleted the
423
11b46fa92a85 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 366
diff changeset
   390
      ``background noise'' in the published data. The problem
11b46fa92a85 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 366
diff changeset
   391
      with DNA data is that it is of such a high resolution
11b46fa92a85 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 366
diff changeset
   392
      that even if the mixture contained maybe 100
11b46fa92a85 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 366
diff changeset
   393
      individuals, you can with current technology detect
11b46fa92a85 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 366
diff changeset
   394
      whether an individual was included in the mixture or
11b46fa92a85 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 366
diff changeset
   395
      not.
310
591b62e1f86a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 309
diff changeset
   396
      
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   397
      This result changed completely how DNA data is nowadays
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   398
      published for research purposes. After the success of 
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   399
      the human-genome project with a very open culture of
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   400
      exchanging data, it became much more difficult to 
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   401
      anonymise data so that patient's privacy is preserved.
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   402
      The public GWAS database was taken offline in 2008.
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   403
      
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   404
\end{itemize}
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   405
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   406
\noindent There are many lessons that can be learned from
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   407
these examples. One is that when making datasets public in
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   408
anonymised form, you want to achieve \emph{forward privacy}.
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   409
This means, no matter what other data that is also available
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   410
or will be released later, the data in the original dataset
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   411
does not compromise an individual's privacy. This principle
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   412
was violated by the availability of ``outside data'' in the
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   413
Netflix and governor of Massachusetts cases. The additional
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   414
data permitted a re-identification of individuals in the
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   415
dataset. In case of GWAS a new technique of re-identification
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   416
compromised the privacy of people in the dataset. The case of
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   417
the AOL dataset shows clearly how incomplete such data can be:
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   418
Although the queries uniquely identified the older lady, she
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   419
also looked up diseases that her friends had, which had
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   420
nothing to do with her. Any rational analysis of her query
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   421
data must therefore have concluded, the lady is on her
314
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   422
death bed, while she was actually very much alive and kicking.
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   423
444
aea1d40cf1ba updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 443
diff changeset
   424
In 2016, Yahoo released the so far largest machine learning
aea1d40cf1ba updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 443
diff changeset
   425
dataset to the research community. It includes approximately
aea1d40cf1ba updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 443
diff changeset
   426
13.5 TByte of data representing around 100 Billion events from
aea1d40cf1ba updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 443
diff changeset
   427
anonymized user-news items, collected by recording
aea1d40cf1ba updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 443
diff changeset
   428
interactions of about 20M users from February 2015 to May
aea1d40cf1ba updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 443
diff changeset
   429
2015. Yahoo's gracious goal is to promote independent research
aea1d40cf1ba updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 443
diff changeset
   430
in the fields of large-scale machine learning and recommender
aea1d40cf1ba updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 443
diff changeset
   431
systems. It remains to be seen whether this data will really
aea1d40cf1ba updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 443
diff changeset
   432
only be used for that purpose.
aea1d40cf1ba updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 443
diff changeset
   433
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   434
\subsubsection*{Differential Privacy}
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   435
314
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   436
Differential privacy is one of the few methods that tries to
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   437
achieve forward privacy. The basic idea is to add appropriate
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   438
noise, or errors, to any query of the dataset. The intention
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   439
is to make the result of a query insensitive to individual
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   440
entries in the database. That means the results are
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   441
approximately the same no matter if a particular individual is
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   442
in the dataset or not. The hope is that the added error does
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   443
not eliminate the ``signal'' one is looking for in the
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   444
dataset.
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   445
314
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   446
%\begin{center}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   447
%User\;\;\;\;    
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   448
%\begin{tabular}{c}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   449
%tell me $f(x)$ $\Rightarrow$\\
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   450
%$\Leftarrow$ $f(x) + \text{noise}$
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   451
%\end{tabular}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   452
%\;\;\;\;\begin{tabular}{@{}c}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   453
%Database\\
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   454
%$x_1, \ldots, x_n$
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   455
%\end{tabular}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   456
%\end{center}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   457
%
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   458
%\begin{center}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   459
%\begin{tabular}{l|l}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   460
%Staff & Salary\\\hline
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   461
%$PM$ & \pounds{107}\\
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   462
%$PF$ & \pounds{102}\\
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   463
%$LM_1$ & \pounds{101}\\
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   464
%$LF_2$ & \pounds{97}\\
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   465
%$LM_3$ & \pounds{100}\\
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   466
%$LM_4$ & \pounds{99}\\
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   467
%$LF_5$ & \pounds{98}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   468
%\end{tabular}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   469
%\end{center}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   470
%
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   471
%
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   472
%\begin{center}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   473
%\begin{tikzpicture} 
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   474
%\begin{axis}[symbolic y coords={salary},
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   475
%             ytick=data,
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   476
%             height=3cm]
%\addplot+[jump mark mid] coordinates
%{(0,salary)   (0.1,salary) 
% (0.4,salary) (0.5,salary)  
% (0.8,salary) (0.9,salary)};
%\end{axis}
%\end{tikzpicture}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   477
%\end{center}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   478
%
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   479
%\begin{tikzpicture}[outline/.style={draw=#1,fill=#1!20}]
%  \node [outline=red]            {red box};
%  \node [outline=blue] at (0,-1) {blue box};
%\end{tikzpicture}
311
8befc029ca1e updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 310
diff changeset
   480
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   481
\ldots
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   482
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   483
312
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   484
\subsubsection*{Further Reading}
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   485
314
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   486
Two cool articles about how somebody obtained via the Freedom
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   487
of Information Law the taxicab dataset of New York and someone
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   488
else showed how easy it is to mine for private information: 
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   489
423
11b46fa92a85 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 366
diff changeset
   490
\begin{center}\small
11b46fa92a85 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 366
diff changeset
   491
\begin{tabular}{p{0.78\textwidth}}
11b46fa92a85 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 366
diff changeset
   492
\url{http://chriswhong.com/open-data/foil_nyc_taxi/}\smallskip\\
314
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   493
\url{http://research.neustar.biz/2014/09/15/riding-with-the-stars-passenger-privacy-in-the-nyc-taxicab-dataset}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   494
\end{tabular}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   495
\end{center}
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   496
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   497
\noindent 
312
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   498
A readable article about how supermarkets mine your shopping
314
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   499
habits (especially how they prey on new exhausted parents
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   500
;o) appeared in 2012 in the New York Times:
312
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   501
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   502
\begin{center}
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   503
\url{http://www.nytimes.com/2012/02/19/magazine/shopping-habits.html}
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   504
\end{center}
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   505
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   506
\noindent An article that analyses privacy and shopping habits 
423
11b46fa92a85 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 366
diff changeset
   507
from a more economic point of view is available from:
312
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   508
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   509
\begin{center}
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   510
\url{http://www.dtc.umn.edu/~odlyzko/doc/privacy.economics.pdf}
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   511
\end{center}
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   512
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   513
\noindent An attempt to untangle the web of current technology
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   514
for spying on consumers is published in:
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   515
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   516
\begin{center}
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   517
\url{http://cyberlaw.stanford.edu/files/publication/files/trackingsurvey12.pdf}
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   518
\end{center}
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   519
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   520
\noindent An article that sheds light on the paradox that
312
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   521
people usually worry about privacy invasions of little
313
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   522
significance, and overlook the privacy invasion that might
1d243ac51078 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 312
diff changeset
   523
cause significant damage:
312
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   524
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   525
\begin{center}
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   526
\url{http://www.heinz.cmu.edu/~acquisti/papers/Acquisti-Grossklags-Chapter-Etrics.pdf}
c913fe9bfd59 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 311
diff changeset
   527
\end{center}
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   528
512
174cc952ad36 updated
Christian Urban <urbanc@in.tum.de>
parents: 510
diff changeset
   529
174cc952ad36 updated
Christian Urban <urbanc@in.tum.de>
parents: 510
diff changeset
   530
Interesting ideas
174cc952ad36 updated
Christian Urban <urbanc@in.tum.de>
parents: 510
diff changeset
   531
174cc952ad36 updated
Christian Urban <urbanc@in.tum.de>
parents: 510
diff changeset
   532
\begin{center}
174cc952ad36 updated
Christian Urban <urbanc@in.tum.de>
parents: 510
diff changeset
   533
\url{https://adnauseam.io}
174cc952ad36 updated
Christian Urban <urbanc@in.tum.de>
parents: 510
diff changeset
   534
\end{center}
174cc952ad36 updated
Christian Urban <urbanc@in.tum.de>
parents: 510
diff changeset
   535
513
84ed8d6143ea updated
Christian Urban <urbanc@in.tum.de>
parents: 512
diff changeset
   536
\noindent
84ed8d6143ea updated
Christian Urban <urbanc@in.tum.de>
parents: 512
diff changeset
   537
And a paper that predicts ad-blockers will in the end win over anti-ad-blocking:
84ed8d6143ea updated
Christian Urban <urbanc@in.tum.de>
parents: 512
diff changeset
   538
84ed8d6143ea updated
Christian Urban <urbanc@in.tum.de>
parents: 512
diff changeset
   539
\begin{center}
84ed8d6143ea updated
Christian Urban <urbanc@in.tum.de>
parents: 512
diff changeset
   540
\url{http://randomwalker.info/publications/ad-blocking-framework-techniques.pdf}
84ed8d6143ea updated
Christian Urban <urbanc@in.tum.de>
parents: 512
diff changeset
   541
\end{center}
84ed8d6143ea updated
Christian Urban <urbanc@in.tum.de>
parents: 512
diff changeset
   542
84ed8d6143ea updated
Christian Urban <urbanc@in.tum.de>
parents: 512
diff changeset
   543
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   544
\end{document}
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   545
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   546
http://randomwalker.info/teaching/fall-2012-privacy-technologies/?
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   547
http://chronicle.com/article/Why-Privacy-Matters-Even-if/127461/
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   548
http://repository.cmu.edu/cgi/viewcontent.cgi?article=1077&context=hcii
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   549
https://josephhall.org/papers/NYU-MCC-1303-S2012_privacy_syllabus.pdf
314
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   550
http://www.jetlaw.org/wp-content/uploads/2014/06/Bambauer_Final.pdf
315
7bd723cb9b32 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 314
diff changeset
   551
http://www.cs.cmu.edu/~yuxiangw/docs/Differential%20Privacy.pdf
7bd723cb9b32 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 314
diff changeset
   552
https://www.youtube.com/watch?v=Gx13lgEudtU
7bd723cb9b32 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 314
diff changeset
   553
https://www.cs.purdue.edu/homes/ctask/pdfs/CERIAS_Presentation.pdf
7bd723cb9b32 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 314
diff changeset
   554
http://www.futureofprivacy.org/wp-content/uploads/Differential-Privacy-as-a-Response-to-the-Reidentification-Threat-Klinefelter-and-Chin.pdf
7bd723cb9b32 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 314
diff changeset
   555
http://www.cis.upenn.edu/~aaroth/courses/slides/Overview.pdf
325
48c6751f2173 updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 315
diff changeset
   556
http://www.cl.cam.ac.uk/~sjm217/papers/tor14design.pdf
314
e01f55e7485a updated
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents: 313
diff changeset
   557
307
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   558
%%% Local Variables: 
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   559
%%% mode: latex
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   560
%%% TeX-master: t
98ee5f760a8c added hw 7
Christian Urban <christian dot urban at kcl dot ac dot uk>
parents:
diff changeset
   561
%%% End: