Spaces:
Running
Running
Update pipeline.py
Browse files
- pipeline.py +3 -0
pipeline.py
CHANGED
@@ -327,12 +327,15 @@ def pipeline_with_gemini(accessions):
|
|
327 |
for link in tem_links:
|
328 |
print("link in tem: ", link)
|
329 |
html = extractHTML.HTML("",link)
|
|
|
330 |
jsonSM = html.getSupMaterial()
|
|
|
331 |
article_text_tem = html.getListSection()
|
332 |
print(article_text_tem, jsonSM)
|
333 |
if article_text_tem:
|
334 |
if "Just a moment...Enable JavaScript and cookies to continue".lower() not in article_text_tem.lower() or "403 Forbidden Request".lower() not in article_text_tem.lower():
|
335 |
links.append(link)
|
|
|
336 |
if jsonSM:
|
337 |
links += sum((jsonSM[key] for key in jsonSM),[])
|
338 |
print("this is links: ",links)
|
|
|
327 |
for link in tem_links:
|
328 |
print("link in tem: ", link)
|
329 |
html = extractHTML.HTML("",link)
|
330 |
+
print("html yeh")
|
331 |
jsonSM = html.getSupMaterial()
|
332 |
+
print("jsonsm yeah")
|
333 |
article_text_tem = html.getListSection()
|
334 |
print(article_text_tem, jsonSM)
|
335 |
if article_text_tem:
|
336 |
if "Just a moment...Enable JavaScript and cookies to continue".lower() not in article_text_tem.lower() or "403 Forbidden Request".lower() not in article_text_tem.lower():
|
337 |
links.append(link)
|
338 |
+
print("tem link appended ", link)
|
339 |
if jsonSM:
|
340 |
links += sum((jsonSM[key] for key in jsonSM),[])
|
341 |
print("this is links: ",links)
|