-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathentity_linking_plain.py
More file actions
91 lines (76 loc) · 2.05 KB
/
Copy pathentity_linking_plain.py
File metadata and controls
91 lines (76 loc) · 2.05 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
import requests
import json
import requests # 2.18.4
import pymysql
# Wikidata MediaWiki API endpoint used for the entity searches in this script.
base_url = "https://www.wikidata.org/w/api.php"

# Database credentials (placeholders in this copy of the script).
user = "..."
pwd = "..."

# Read every value of the `license` column from `acordar_datasets`.
# The nested try/finally blocks release the cursor and the connection even
# when the query raises, so a failed run does not leak a DB connection.
conn = pymysql.connect(
    host="...", user=user, password=pwd, database="..."
)
try:
    cursor = conn.cursor()
    try:
        sql = "SELECT license FROM acordar_datasets"
        print(sql)
        cursor.execute(sql)
        res = cursor.fetchall()
    finally:
        cursor.close()
finally:
    conn.close()

# Distinct, non-NULL names to link. Each row holds the single selected column,
# so row[0] is the name; the dict (value always True) is used as a set.
res_dict = {row[0]: True for row in res if row[0] is not None}
# Local proxy endpoint; the same address is used for both URL schemes.
http_proxy = "http://127.0.0.1:7899"
https_proxy = "http://127.0.0.1:7899"
# Scheme -> proxy URL mapping, in the shape passed as `proxies=` to requests.
proxies = dict(http=http_proxy, https=https_proxy)
# Query parameters for one fixed sample search: ask wbsearchentities for at
# most one English-language item matching the given name.
params = {
    "action": "wbsearchentities",
    "format": "json",
    "search": "Fish and Wildlife Service",
    "language": "en",
    "type": "item",
    "limit": 1,
}
# Make the GET request to the API through the local proxy.
# requests applies no timeout by default, so one is set explicitly to keep a
# stalled proxy or connection from blocking the script forever.
# NOTE(review): this response is never read before `response` is reassigned
# further down; it looks like a leftover connectivity check - confirm whether
# the request is still wanted.
response = requests.get(base_url, params=params, proxies=proxies, timeout=30)
# Link every distinct name to a Wikidata entity URI and collect one record
# per name, shaped as {"<entity_type>_name": name, "<entity_type>": uri}.
new_json = []
entity_type = "publisher"  # or "licence"
for name in res_dict:
    hits = []
    if name != "":
        # An empty name always maps to "" below, so only non-empty names
        # are worth a request.
        params = {
            "action": "wbsearchentities",
            "format": "json",
            "search": name,
            "language": "en",
            "type": "item",
            "limit": 1,
        }
        # Explicit timeout: requests would otherwise wait indefinitely.
        # NOTE(review): unlike the sample request earlier in the file, this
        # call does not pass `proxies=` - confirm which one is intended.
        response = requests.get(base_url, params=params, timeout=30)
        data = response.json()
        # A reply without a "search" list (e.g. an API error payload) is
        # treated as "no match" instead of raising KeyError.
        hits = data.get("search", [])

    if not hits:
        # Empty name or nothing found: keep the name, leave the link blank.
        uri = ""
    elif "NASA" in name or "nasa" in name:  # cases for NASA/../.. (NASA's agencies)
        # NOTE(review): this branch is only reached when the search returned
        # a hit; a NASA name with no hit is mapped to "" above - confirm
        # that this priority is intended.
        uri = "https://www.wikidata.org/wiki/Q23548"
    else:
        uri = hits[0]["concepturi"]

    # The URI is keyed by entity_type in every branch so that all records
    # share one schema regardless of how the name was resolved.
    new_json.append(
        {
            entity_type + "_name": name,
            entity_type: uri,
        }
    )
# Persist the collected records as indented JSON in the working directory.
with open("entity_mapping_acordar.json", "w") as out_file:
    serialized = json.dumps(new_json, indent=2)
    out_file.write(serialized)