-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathdrawFigure2b.py
103 lines (90 loc) · 3.22 KB
/
drawFigure2b.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
from protocols.LocalHashing import LocalHashing
from Components.Distribution import zipf
from Components.Draw import draw
import math
NUMBEROFAXIS = 7 #### 9
N = 10000 #### 10000
#### begin/BLH ####
# protocol is class, fixing epsilon
def analytical_eps_BLH(protocol, epsilon, n):
vars = [] # return a list of variances
for step in range(NUMBEROFAXIS):
d = 2**(2 + step*2)
x = protocol(d, epsilon, g=2)
x.set_n(n)
var = x.var_analytical()
vars.append(math.log10(var))
return vars
# zipf distribution, similar to experiments in 14-RAPPOR
# run very slow, when d is 2^10
def empirical_eps_BLH(protocol, epsilon, n):
vars = []
for step in range(NUMBEROFAXIS):
d = 2**(2 + step*2)
x = protocol(d, epsilon, g=2) # init
users = zipf.zipf(1.1, d, n)
for i in range(len(users)):
if i % 1000 == 0:
print(step, i, 'BLH')
x.PE(users[i])
x.aggregation() # estimate couterEsti
f = zipf.probList(1.1, d, n)
var = x.var_empirical(f, n)
vars.append(math.log10(var))
return vars
#### end/BLH ####
#### begin/OLH ####
# protocol is class, fixing epsilon
def analytical_eps_OLH(protocol, epsilon, n):
vars = [] # return a list of variances
g = 53 # round(math.exp(epsilon)+1)效果不好,要取最近的素数(因为universal hashing!!)
for step in range(NUMBEROFAXIS): # 9 values
d = 2**(2 + step*2)
x = protocol(d, epsilon, g)
x.set_n(n)
var = x.var_analytical()
vars.append(math.log10(var))
return vars
# protocol is class, fixing epsilon
# run very slow, when d is 2^10
def empirical_eps_OLH(protocol, epsilon, n):
vars = []
g = 53 # round(math.exp(epsilon)+1)效果不好,要取最近的素数(因为universal hashing!!)
for step in range(NUMBEROFAXIS): #### 9 values
d = 2**(2 + step*2)
x = protocol(d, epsilon, g) # init
users = zipf.zipf(1.1, d, n)
for i in range(len(users)):
if i % 1000 == 0:
print(step, i, 'OLH')
x.PE(users[i])
x.aggregation() # estimate couterEsti
f = zipf.probList(1.1, d, n)
var = x.var_empirical(f, n)
vars.append(math.log10(var))
return vars
#### end/OLH ####
'''
Need run 10 times.
Temporarily run once.
'''
# Figure 2(b)
def Comparing_empirical_and_analytical_variance_b():
varslist = [] # return a list of (a list of variances)
# Analytical BLH
vars = analytical_eps_BLH(LocalHashing, 4, N)
varslist.append(vars)
# Empirical BLH
vars = empirical_eps_BLH(LocalHashing, 4, N)
varslist.append(vars)
# Analytical OLH
vars = analytical_eps_OLH(LocalHashing, 4, N)
varslist.append(vars)
# Empirical OLH
vars = empirical_eps_OLH(LocalHashing, 4, N)
varslist.append(vars)
# Draw
d = [item for item in range(2, (NUMBEROFAXIS+1)*2, 2)] # 2^2, 2^4, ..., 2^18
draw.lines(d, varslist, ['Analytical BLH', 'Empirical BLH', 'Analytical OLH', 'Empirical OLH'], title='Comparing empirical and analytical variance', xlabel='Vary d(log2(x))', ylabel='Var(log10(y))')
if __name__ == "__main__":
Comparing_empirical_and_analytical_variance_b()