Код: Выделить всё
import requests
import time
import pandas as pd
def get_pubmed_results_count(search_terms, delay=1, timeout=30):
    """Look up how many PubMed records match each search term.

    One ESearch request is sent per term to the NCBI E-utilities endpoint,
    and the ``count`` field of the JSON reply is recorded.

    Args:
        search_terms: A single query string or an iterable of query strings.
            A bare string is treated as ONE term; without that guard it
            would be iterated character by character, producing one request
            per letter.
        delay: Seconds to sleep after each request.
        timeout: Seconds to wait on the HTTP request before giving up on
            that term.

    Returns:
        dict: Maps each term to the ``count`` value exactly as found in the
        response, or to ``None`` when the request failed or the reply did
        not contain a usable count.
    """
    base_url = "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/esearch.fcgi"

    # A lone string is itself iterable; wrap it so the loop sees one term.
    if isinstance(search_terms, str):
        search_terms = [search_terms]

    results = {}
    for term in search_terms:
        # Define parameters for the API request
        params = {
            "db": "pubmed",
            "term": term,
            "retmode": "json",
        }
        try:
            # Make the request to the PubMed API; the timeout keeps a
            # stalled connection from hanging the whole batch.
            response = requests.get(base_url, params=params, timeout=timeout)
            response.raise_for_status()
            # Parse the response
            count = response.json()['esearchresult']['count']
        except (requests.exceptions.RequestException, KeyError, ValueError) as e:
            # KeyError / ValueError cover replies that are not the expected
            # JSON shape, so one bad term does not abort the remaining ones.
            print(f"Error retrieving data for term '{term}': {e}")
            count = None
        results[term] = count
        # Respectful delay between requests. Kept after every request
        # (including the last) so repeated calls with one term each are
        # still spaced out.
        time.sleep(delay)
    return results
# Example usage
if __name__ == "__main__":
    # Read the input inside the guard so importing this module has no
    # file-system side effects.
    df_searchterms = pd.read_csv('search1.csv')
    print(df_searchterms)

    # Hand the whole 'Term' column over in one call. Passing a single
    # row's string would be iterated letter by letter by the lookup
    # function, and rebuilding the frame per row kept only the last row.
    search_terms = df_searchterms['Term'].dropna().tolist()
    result_counts = get_pubmed_results_count(search_terms)

    # Build the result table once, after every term has been queried.
    df_results = pd.DataFrame(
        list(result_counts.items()), columns=['term', 'count']
    )
    print(df_results)
    df_results.to_csv('TestRestults1.csv', index=False)
Код: Выделить всё
Term
0 APOE AND Alzheimer's
1 PSEN1 AND Alzheimer's
2 PSEN2 AND Alzheimer's
3 APP AND Alzheimer's
4 CLU AND Alzheimer's
Подробнее здесь: https://stackoverflow.com/questions/787 ... n-for-loop
Мобильная версия