p-baleine committed on
Commit
e5112e5
1 Parent(s): 972452d

filter result

Browse files
Files changed (1) hide show
  1. metaanalyser/paper/paper.py +4 -2
metaanalyser/paper/paper.py CHANGED
@@ -177,7 +177,9 @@ def search_on_google_scholar(
177
 
178
  return True
179
 
180
- search_result = fetch_google_scholar(query, start)
 
 
181
 
182
  return [i for i in search_result if valid_item(i)]
183
 
@@ -186,7 +188,6 @@ def search_on_google_scholar(
186
 
187
  while len(result) < n:
188
  # FIXME: 今のままだとそもそも検索結果が全体で n 件以下の場合に無限ループになってしまう
189
- logger.info(f"Looking for `{query}` on Google Scholar, offset: {start}...")
190
  result += fetch(start)
191
  start += 10
192
 
@@ -257,6 +258,7 @@ Summry: {summary}
257
 
258
  @memory.cache
259
  def fetch_google_scholar(query: str, start: int) -> dict:
 
260
  serpapi = SerpAPIWrapper(params={
261
  "engine": "google_scholar",
262
  "gl": "us",
 
177
 
178
  return True
179
 
180
+ # FIXME: 検索結果に arxiv の文献をなるべく多く含めたいため検索クエリを弄っている
181
+ actual_query = " ".join([query, "arxiv"]) if "arxiv" not in query.lower() else query
182
+ search_result = fetch_google_scholar(actual_query, start)
183
 
184
  return [i for i in search_result if valid_item(i)]
185
 
 
188
 
189
  while len(result) < n:
190
  # FIXME: 今のままだとそもそも検索結果が全体で n 件以下の場合に無限ループになってしまう
 
191
  result += fetch(start)
192
  start += 10
193
 
 
258
 
259
  @memory.cache
260
  def fetch_google_scholar(query: str, start: int) -> dict:
261
+ logger.info(f"Looking for `{query}` on Google Scholar, offset: {start}...")
262
  serpapi = SerpAPIWrapper(params={
263
  "engine": "google_scholar",
264
  "gl": "us",