1. 代码如下:
import time
import requests
import pandas as pd
import os
def getArticle(PMCID,NIHMSID,DOI,title,path):
print(PMCID,NIHMSID,DOI,title,path)
os.chdir(path)
headers = {
"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/80.0.3987.163 Safari/537.36"}
if (PMCID!="NA" and NIHMSID != "NA"):
print("PMCID & NIHMSID")
NIHMSID = str(NIHMSID).replace("NIHMS", "nihms")
urls=f'https://www.ncbi.nlm.nih.gov/pmc/articles/{PMCID}/pdf/{NIHMSID}.pdf'
r = requests.get(urls, headers=headers)
with open(title + ".pdf", 'wb') as f:
f.write(r.content)
if (PMCID!="NA" and NIHMSID =="NA"):
print("PMCID")
DOI_after=DOI.split("/")
urls = f'https://www.ncbi.nlm.nih.g