-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathdescriptions.py
31 lines (24 loc) · 951 Bytes
/
descriptions.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
import json
DATAFILE = 'qs.jsonl'


def summarize_entity(record):
    """Reduce one parsed JSONL record to its first entity's labels and descriptions.

    ``record`` is expected to look like::

        {'entities': {qid: {'labels': {key: {'value': text}},
                            'descriptions': {key: {'value': text}}}}}

    A missing ``labels`` or ``descriptions`` mapping is treated as empty.
    Only the first entity under ``entities`` is used.
    NOTE(review): the keys of ``labels``/``descriptions`` are presumably
    language codes -- confirm against the data file.

    Returns ``{qid: {'labels': {key: text}, 'descriptions': {key: text}}}``,
    or ``None`` when the record carries no entities.

    Raises ``KeyError`` if a label/description entry has no ``'value'``.
    """
    entities = record.get('entities') or {}
    if not entities:
        # Nothing to summarize; let the caller decide to skip the record
        # instead of failing on an empty mapping.
        return None

    qid, entity = next(iter(entities.items()))
    # Both sections are nested under the QID so that each output object has
    # exactly one top-level key (the entity id).
    return {
        qid: {
            'labels': {
                key: entry['value']
                for key, entry in entity.get('labels', {}).items()
            },
            'descriptions': {
                key: entry['value']
                for key, entry in entity.get('descriptions', {}).items()
            },
        }
    }


def main(datafile=DATAFILE):
    """Print one JSON object per usable line of ``datafile`` to stdout.

    Blank lines and records without entities are skipped.
    """
    # Read as UTF-8 explicitly: the output keeps non-ASCII characters
    # (ensure_ascii=False), so the input must not depend on the locale's
    # default encoding.
    with open(datafile, encoding='utf-8') as file:
        for line in file:
            if not line.strip():
                continue
            summary = summarize_entity(json.loads(line))
            if summary is not None:
                print(json.dumps(summary, ensure_ascii=False))


if __name__ == '__main__':
    main()
# Reference SPARQL query (Wikidata): universities with their labels and descriptions, paired by language
# https://w.wiki/BxW6
"""
select ?university ?label ?description (lang(?description) as ?language) {
?university wdt:P31/wdt:P279* wd:Q3918 .
# ?university wdt:P17 wd:Q30 .
?university rdfs:label ?label .
?university schema:description ?description .
filter (lang(?label) = lang(?description))
} limit 100000
types: https://w.wiki/BxWd
"""