Spaces:
Running
Running
Update pipeline.py
Browse files
- pipeline.py +2 -0
pipeline.py
CHANGED
@@ -325,9 +325,11 @@ def pipeline_with_gemini(accessions):
|
|
325 |
# get supplementary of that article
|
326 |
print("tem links length ", len(tem_links))
|
327 |
for link in tem_links:
|
|
|
328 |
html = extractHTML.HTML("",link)
|
329 |
jsonSM = html.getSupMaterial()
|
330 |
article_text_tem = html.getListSection()
|
|
|
331 |
if article_text_tem:
|
332 |
if "Just a moment...Enable JavaScript and cookies to continue".lower() not in article_text_tem.lower() or "403 Forbidden Request".lower() not in article_text_tem.lower():
|
333 |
links.append(link)
|
|
|
325 |
# get supplementary of that article
|
326 |
print("tem links length ", len(tem_links))
|
327 |
for link in tem_links:
|
328 |
+
print("link in tem: ", link)
|
329 |
html = extractHTML.HTML("",link)
|
330 |
jsonSM = html.getSupMaterial()
|
331 |
article_text_tem = html.getListSection()
|
332 |
+
print(article_text_tem, jsonSM)
|
333 |
if article_text_tem:
|
334 |
if "Just a moment...Enable JavaScript and cookies to continue".lower() not in article_text_tem.lower() or "403 Forbidden Request".lower() not in article_text_tem.lower():
|
335 |
links.append(link)
|