Spaces:
Runtime error
Runtime error
Commit
·
73855f3
1
Parent(s):
ba8da6c
test
Browse files
huixiangdou/service/findarticles.py
CHANGED
|
@@ -5,7 +5,7 @@ import os
|
|
| 5 |
from tqdm import tqdm
|
| 6 |
import json
|
| 7 |
import shutil
|
| 8 |
-
|
| 9 |
class ArticleRetrieval:
|
| 10 |
def __init__(self,
|
| 11 |
keywords: list,
|
|
@@ -43,6 +43,7 @@ class ArticleRetrieval:
|
|
| 43 |
|
| 44 |
## 清洗XML文件
|
| 45 |
def _clean_xml(self,txt):
|
|
|
|
| 46 |
root = ET.fromstring(txt)
|
| 47 |
txt = self._get_all_text(root)
|
| 48 |
txt = txt.split('REFERENCES')[0] # 截取参考文献之前的文本
|
|
|
|
| 5 |
from tqdm import tqdm
|
| 6 |
import json
|
| 7 |
import shutil
|
| 8 |
+
from loguru import logger
|
| 9 |
class ArticleRetrieval:
|
| 10 |
def __init__(self,
|
| 11 |
keywords: list,
|
|
|
|
| 43 |
|
| 44 |
## 清洗XML文件
|
| 45 |
def _clean_xml(self,txt):
|
| 46 |
+
logger.error(text[:100])
|
| 47 |
root = ET.fromstring(txt)
|
| 48 |
txt = self._get_all_text(root)
|
| 49 |
txt = txt.split('REFERENCES')[0] # 截取参考文献之前的文本
|