NikosKprl commited on
Commit
b700d6b
·
verified ·
1 Parent(s): 07745e7

Update ✨Entity Linking Application✨.py

Browse files
Files changed (1) hide show
  1. ✨Entity Linking Application✨.py +12 -13
✨Entity Linking Application✨.py CHANGED
@@ -62,8 +62,8 @@ async def combination_method(name, session):
62
  x = itertools_combinations(new_name, 2)
63
  for i in x:
64
  new_word = (i[0] + " " + i[1])
65
- url = f"{new_word} site:en.wikipedia.org inurl:/wiki/ -inurl:?"
66
- s = search(url, num_results = 12, lang="en")
67
  for i in s:
68
  data.add(i.split("/")[-1])
69
  return data
@@ -73,7 +73,7 @@ async def single_method(name, session):
73
  data = set()
74
  new_name = name.replace("-", " ").replace("/", " ").split()
75
  for i in new_name:
76
- url = f"{i} site:en.wikipedia.org inurl:/wiki/ -inurl:?"
77
  s = search(url, num_results = 12, lang="en")
78
  for i in s:
79
  data.add(i.split("/")[-1])
@@ -85,7 +85,7 @@ async def mains(name, single, combi):
85
  qids = set()
86
 
87
  async with aiohttp.ClientSession() as session:
88
- url = f"{name} site:en.wikipedia.org inurl:/wiki/ -inurl:?"
89
  s = search(url, num_results = 30, lang="en")
90
  for i in s:
91
  data.add(i.split("/")[-1])
@@ -267,17 +267,17 @@ async def main(name):
267
  with open(f"/home/user/app/info_extraction/{name}.json", "w", encoding="utf-8") as flast:
268
  json.dump(final_list, flast)
269
 
270
- def check_sentence(sentence):
271
- two_consecutive_uppercase = r"[A-Z]{2}"
272
- uppercase_followed_by_fullstop = r"[A-Z]\."
273
 
274
- if re.search(two_consecutive_uppercase, sentence):
275
- return True
276
 
277
- if re.search(uppercase_followed_by_fullstop, sentence):
278
- return True
279
 
280
- return False
281
 
282
  chrome_driver_path = "chromedriver.exe"
283
  chrome_path = r'"C:\Program Files\Google\Chrome\Application\chrome.exe"'
@@ -428,7 +428,6 @@ def main_cli():
428
  st.write(f"Applying Candidate Selection module... (4/5) [{number}/{len(list_with_full_names)}]")
429
  with open(f"/home/user/app/info_extraction/{i}.json", "r") as f:
430
  json_file = json.load(f)
431
- print(json_file)
432
  lista = []
433
  lista_1 = []
434
  for element in json_file:
 
62
  x = itertools_combinations(new_name, 2)
63
  for i in x:
64
  new_word = (i[0] + " " + i[1])
65
+ url = f"{new_word} site:en.wikipedia.org inurl:/wiki/ -inurl:? -inurl:Category: -inurl:Help: -inurl:Special: -inurl:File:"
66
+ s = search(url, num_results = 12, lang="en")l
67
  for i in s:
68
  data.add(i.split("/")[-1])
69
  return data
 
73
  data = set()
74
  new_name = name.replace("-", " ").replace("/", " ").split()
75
  for i in new_name:
76
+ url = f"{i} site:en.wikipedia.org inurl:/wiki/ -inurl:? -inurl:Category: -inurl:Help: -inurl:Special: -inurl:File:"
77
  s = search(url, num_results = 12, lang="en")
78
  for i in s:
79
  data.add(i.split("/")[-1])
 
85
  qids = set()
86
 
87
  async with aiohttp.ClientSession() as session:
88
+ url = f"{name} site:en.wikipedia.org inurl:/wiki/ -inurl:? -inurl:Category: -inurl:Help: -inurl:Special: -inurl:File:"
89
  s = search(url, num_results = 30, lang="en")
90
  for i in s:
91
  data.add(i.split("/")[-1])
 
267
  with open(f"/home/user/app/info_extraction/{name}.json", "w", encoding="utf-8") as flast:
268
  json.dump(final_list, flast)
269
 
270
+ #def check_sentence(sentence):
271
+ # two_consecutive_uppercase = r"[A-Z]{2}"
272
+ # uppercase_followed_by_fullstop = r"[A-Z]\."
273
 
274
+ # if re.search(two_consecutive_uppercase, sentence):
275
+ # return True
276
 
277
+ # if re.search(uppercase_followed_by_fullstop, sentence):
278
+ # return True
279
 
280
+ # return False
281
 
282
  chrome_driver_path = "chromedriver.exe"
283
  chrome_path = r'"C:\Program Files\Google\Chrome\Application\chrome.exe"'
 
428
  st.write(f"Applying Candidate Selection module... (4/5) [{number}/{len(list_with_full_names)}]")
429
  with open(f"/home/user/app/info_extraction/{i}.json", "r") as f:
430
  json_file = json.load(f)
 
431
  lista = []
432
  lista_1 = []
433
  for element in json_file: