Yijun-Yang committed on
Commit
73855f3
1 Parent(s): ba8da6c
huixiangdou/service/findarticles.py CHANGED
@@ -5,7 +5,7 @@ import os
5
  from tqdm import tqdm
6
  import json
7
  import shutil
8
-
9
  class ArticleRetrieval:
10
  def __init__(self,
11
  keywords: list,
@@ -43,6 +43,7 @@ class ArticleRetrieval:
43
 
44
  ## 清洗XML文件
45
  def _clean_xml(self,txt):
 
46
  root = ET.fromstring(txt)
47
  txt = self._get_all_text(root)
48
  txt = txt.split('REFERENCES')[0] # 截取参考文献之前的文本
 
5
  from tqdm import tqdm
6
  import json
7
  import shutil
8
+ from loguru import logger
9
  class ArticleRetrieval:
10
  def __init__(self,
11
  keywords: list,
 
43
 
44
  ## 清洗XML文件
45
  def _clean_xml(self,txt):
46
+ logger.error(text[:100])
47
  root = ET.fromstring(txt)
48
  txt = self._get_all_text(root)
49
  txt = txt.split('REFERENCES')[0] # 截取参考文献之前的文本