diff --git a/bibliovid_scrapper.py b/bibliovid_scrapper.py index 982d283cbb1ecef85aa49fc6443923f39e1c140f..dff4ac86b1827aab29377f75b222a49af9152db8 100644 --- a/bibliovid_scrapper.py +++ b/bibliovid_scrapper.py @@ -24,19 +24,34 @@ for article in articles['results']: return node.get_text().strip() return '' + #title = safe_text(main.find('h1')) + #link = divs[8].find('a').attrs['href'] + #findings = safe_text(divs[12].find('div')) + #take_away = safe_text(divs[14].contents[0].find('div')) + #relevance_level = safe_text(divs[16].contents[0].find('div')) + #objectives = safe_text(divs[18].contents[0].find('div')) + #methods = safe_text(divs[20].contents[0].find('div')) + + #article['link'] = link + #article['findings'] = findings + #article['take_away'] = take_away + #article['relevance_level'] = relevance_level + #article['objectives'] = objectives + #article['methods'] = methods + title = safe_text(main.find('h1')) link = divs[8].find('a').attrs['href'] - findings = safe_text(divs[12].find('div')) - take_away = safe_text(divs[14].contents[0].find('div')) - relevance_level = safe_text(divs[16].contents[0].find('div')) - objectives = safe_text(divs[18].contents[0].find('div')) - methods = safe_text(divs[20].contents[0].find('div')) + findings = safe_text(divs[14].find('div')) + take_away = safe_text(divs[16].contents[0].find('div')) + relevance_level = safe_text(divs[18].contents[0].find('div')) + objectives = safe_text(divs[20].contents[0].find('div')) + methods = safe_text(divs[22].contents[0].find('div')) article['link'] = link - article['findings'] = findings - article['take_away'] = take_away - article['relevance_level'] = relevance_level - article['objectives'] = objectives + article['results'] = findings + article['synthesis'] = take_away + article['strength_of_evidence_details'] = relevance_level + article['goals'] = objectives article['methods'] = methods print(json.dumps(articles, indent=2))