Spaces:
Sleeping
Sleeping
Shunfeng Zheng
committed on
Update disambiguation/disambiguate.py
Browse files
disambiguation/disambiguate.py
CHANGED
|
@@ -19,14 +19,7 @@ import streamlit as st
|
|
| 19 |
urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning)
|
| 20 |
|
| 21 |
|
| 22 |
-
|
| 23 |
-
headers = {
|
| 24 |
-
"User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/18.3 Safari/605.1.15"
|
| 25 |
-
}
|
| 26 |
-
page1 = requests.get(request_url, headers=headers, verify=False)
|
| 27 |
-
cont = page1.content
|
| 28 |
-
st.markdown('111')
|
| 29 |
-
st.markdown(cont)
|
| 30 |
|
| 31 |
|
| 32 |
def dismabiguate_entities(doc, ent, ase, level_1, level_2, level_3, midmid):
|
|
@@ -38,15 +31,6 @@ def get_coordinates(ent, ase, level_1, level_2, level_3, midmid):
|
|
| 38 |
}
|
| 39 |
time.sleep(2)
|
| 40 |
page = requests.get(request_url, headers=headers, verify=False)
|
| 41 |
-
# page = requests.get(request_url, verify=False)
|
| 42 |
-
# print(request_url, '++++++')
|
| 43 |
-
# print(ent, '++++++')
|
| 44 |
-
# print(ase, '++++++')
|
| 45 |
-
# print(level_1, '++++++')
|
| 46 |
-
# print(level_2, '++++++')
|
| 47 |
-
# print(level_3, '++++++')
|
| 48 |
-
# print(midmid, '++++++')
|
| 49 |
-
|
| 50 |
|
| 51 |
json_content = json.loads(page.content)
|
| 52 |
# json_content = json.loads(aa)
|
|
@@ -60,16 +44,6 @@ def get_coordinates(ent, ase, level_1, level_2, level_3, midmid):
|
|
| 60 |
mid1 = None
|
| 61 |
mid2 = None
|
| 62 |
coordinates = all_coordinates
|
| 63 |
-
# if level_1 is not None:
|
| 64 |
-
#
|
| 65 |
-
# all_coordinates, centroid, mid1, mid2 = geo_level1.get_level1_coordinates(all_coordinates, centroid, level_1, midmid)
|
| 66 |
-
|
| 67 |
-
# if level_2 is not None:
|
| 68 |
-
# if level_1 is not None and level_1.lower() not in geo_level1.center:
|
| 69 |
-
# all_coordinates, centroid = geo_level2.get_level2_coordinates(coordinates, centroid, level_2, level_1)
|
| 70 |
-
# else:
|
| 71 |
-
# print ("Else executed")
|
| 72 |
-
# all_coordinates, centroid = geo_level2.get_level2_coordinates(all_coordinates, centroid, level_2, level_1)
|
| 73 |
|
| 74 |
if level_3 is not None:
|
| 75 |
all_coordinates, centroid = geo_level3.get_level3_coordinates(coordinates, centroid, level_3, level_1)
|
|
@@ -82,7 +56,6 @@ def get_coordinates(ent, ase, level_1, level_2, level_3, midmid):
|
|
| 82 |
def dismabiguate_entities_between(doc, ent, ase, level_1, level_2, level_3, midmid):
|
| 83 |
return get_coordinates_between(doc, ent, ase, level_1, level_2, level_3, midmid)
|
| 84 |
|
| 85 |
-
|
| 86 |
def get_coordinates_between(doc, ent, ase, level_1, level_2, level_3, midmid):
|
| 87 |
|
| 88 |
# first ase
|
|
@@ -105,16 +78,9 @@ def get_coordinates_between(doc, ent, ase, level_1, level_2, level_3, midmid):
|
|
| 105 |
"User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/18.3 Safari/605.1.15"
|
| 106 |
}
|
| 107 |
page = requests.get(request_url, headers=headers, verify=False)
|
| 108 |
-
|
| 109 |
-
|
| 110 |
-
print(doc.ents)
|
| 111 |
-
|
| 112 |
-
st.markdown(ase)
|
| 113 |
-
st.markdown(request_url)
|
| 114 |
-
st.markdown(page.content)
|
| 115 |
json_content = json.loads(page.content)
|
| 116 |
-
# json_content = json.loads(aa)
|
| 117 |
-
# print(json_content, 'jjj')
|
| 118 |
all_coordinates = json_content[0]['geojson']['coordinates'][0]
|
| 119 |
centroid = (float(json_content[0]['lon']), float(json_content[0]['lat']))
|
| 120 |
for p in all_coordinates:
|
|
|
|
| 19 |
urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning)
|
| 20 |
|
| 21 |
|
| 22 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 23 |
|
| 24 |
|
| 25 |
def dismabiguate_entities(doc, ent, ase, level_1, level_2, level_3, midmid):
|
|
|
|
| 31 |
}
|
| 32 |
time.sleep(2)
|
| 33 |
page = requests.get(request_url, headers=headers, verify=False)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 34 |
|
| 35 |
json_content = json.loads(page.content)
|
| 36 |
# json_content = json.loads(aa)
|
|
|
|
| 44 |
mid1 = None
|
| 45 |
mid2 = None
|
| 46 |
coordinates = all_coordinates
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 47 |
|
| 48 |
if level_3 is not None:
|
| 49 |
all_coordinates, centroid = geo_level3.get_level3_coordinates(coordinates, centroid, level_3, level_1)
|
|
|
|
| 56 |
def dismabiguate_entities_between(doc, ent, ase, level_1, level_2, level_3, midmid):
|
| 57 |
return get_coordinates_between(doc, ent, ase, level_1, level_2, level_3, midmid)
|
| 58 |
|
|
|
|
| 59 |
def get_coordinates_between(doc, ent, ase, level_1, level_2, level_3, midmid):
|
| 60 |
|
| 61 |
# first ase
|
|
|
|
| 78 |
"User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/18.3 Safari/605.1.15"
|
| 79 |
}
|
| 80 |
page = requests.get(request_url, headers=headers, verify=False)
|
| 81 |
+
|
| 82 |
+
st.markdown('The IP of this Space is blocked by OpenStreetMap, we are fixing this issue. You can still interact with the second table at the first page.')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 83 |
json_content = json.loads(page.content)
|
|
|
|
|
|
|
| 84 |
all_coordinates = json_content[0]['geojson']['coordinates'][0]
|
| 85 |
centroid = (float(json_content[0]['lon']), float(json_content[0]['lat']))
|
| 86 |
for p in all_coordinates:
|