-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathcompose.py
48 lines (42 loc) · 2.16 KB
/
compose.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
# The Whole Idea is explained as follows
# For instance, Our aim is converting the query Q 0.1<=a<0.2 and 0.4<=b<0.6 to
# the combinations of the following 4 simple queries
# 0) -inf < a < 0.2 and -inf < b < 0.6 00 a use max, b use max, sign is +
# 1) -inf < a < 0.2 and -inf < b < 0.4 01 a use max, b use min, sign is -
# 2) -inf < a < 0.1 and -inf < b < 0.6 10 a use min, b use max, sign is -
# 3) -inf < a < 0.1 and -inf < b < 0.4 11 a use min, b use min, sign is +
# and the result of Q is 0) - 1) - 2) + 3)
# We find the number of simple queries is 2**attr_num
# And their formulas are related to the 0 or 1 in the position of binary number
# while the signs are related to the number of 1s the binary number
# Therefore we have the following algorithms for decompose and compose
import numpy as np
def decompose(input_query, attr_num=10):
# query is a 2-d array 10 x 2
# each row represents the attr while column represents the min and max
# the query is already normalized to [0,1]
# while the attribute is missing, we can give the related range [0,1]
# input_query = np.array([[0.2, 0.3], [0.4, 0.5], [0.3, 0.9], [0.1, 0.7], [0.7, 1.0],
# [0.0, 1.0], [0.1, 0.8], [0.7, 0.8], [0.2, 0.6], [0.4, 0.6]])
output_query_list = []
for i in range(0, 2**attr_num):
output_query = []
for j in range(0, attr_num):
# Since i = 0 represents all max
# while i = 2**n -1 represents all min
if (i & (0b1 << j)) == 0:
output_query.append(input_query[j][1])
else:
output_query.append(input_query[j][0])
output_query_list.append(output_query)
return np.array(output_query_list)
def compose(input_res, attr_num=10):
# the input result are 2**attr_num and each is related to the above generated queries
# input_res = np.random.random(2**attr_num)
res = np.array([0.0])
for i in range(0, 2**attr_num):
count_one = bin(i).count("1")
sign = (-1)**count_one
res = res + sign * input_res[i]
# Due to precision error, sometimes res while be small negative, we fix it by max
return np.maximum(res, np.array([0.0]))