import requests from bs4 import BeautifulSoup import os import pandas as pd import io
[2]
# Directory the script switches into; DOI.txt is later opened relative to it.
_work_dir = "/Users/zhangyanan/Desktop"

# Folder that downloaded articles are saved to (note the trailing slash).
path = "/Users/zhangyanan/Desktop/DOI/"

os.chdir(_work_dir)
os.getcwd()  # notebook-style echo of the new working directory; value is unused
'/Users/zhangyanan/Desktop'
[3]
# Updated 2021-06-07: create the folder that downloaded articles are saved to.
# makedirs(exist_ok=True) replaces the `exists(...) == False` + `mkdir` pair,
# which could fail if the folder appeared between the check and the create.
os.makedirs(path, exist_ok=True)

# DOI.txt stores one DOI per line. Every line -- including the last one --
# must end with a newline, because the reader drops the final character of
# each line.
# NOTE(review): this handle is not closed anywhere in the visible code; confirm
# it is closed once the DOIs have been read.
f = open("DOI.txt", "r", encoding="utf-8")

# Desktop-Chrome User-Agent string; presumably sent as the HTTP request
# headers -- verify against the download code.
head = {
    'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/79.0.3945.117 Safari/537.36',
}
for line in f.readlines(): line = line[:-1] #去换行符 url = "https://www.nature.com/articles/" + line + '.pdf' #20210515更新:现在换成这个sci hub检索地址 try: download_url = ""