代码1:
#!/usr/bin/env python
# coding=utf-8
#import importlib,sys
#import sys
#sys.setdefaultencoding('gbk')
'''import sys
import imp
import sys
reload(sys)
sys.setdefaultencoding('utf8')
'''
'''
import sys
sys.setdefaultencoding('utf-8')
import jieba
import json'''
from bs4 import BeautifulSoup
import urllib.request
import urllib.parse as parse
import ssl
import re
import os,os.path
import codecs
import requests
def getHtml(url):
    """Fetch *url* and return the raw response body as bytes.

    As a side effect the body is also stored in the module-level ``html``
    variable, which other code in this script may read.

    Args:
        url: Any URL accepted by ``urllib.request.urlopen``.

    Returns:
        The undecoded response body (``bytes``).

    Raises:
        urllib.error.URLError: If the URL cannot be opened.
    """
    global html
    # The context manager closes the connection even when read() raises,
    # which the previous open-and-forget version did not guarantee.
    with urllib.request.urlopen(url) as page:
        html = page.read()
    return html
def file(url1, file_name, name):
    """Download *url1* with browser-like headers and save the body to *name*.

    Args:
        url1: URL of the resource to download.
        file_name: Label printed after the download; it is not used as a path.
        name: Path of the output file, opened for binary writing (truncated
            if it already exists).

    Side effects:
        Increments the module-level counter ``i`` and prints progress
        information to standard output.
    """
    print(url1)
    # Request headers imitating a desktop browser. 'User-Agent' used to be
    # listed twice with the same value; one entry yields the identical dict.
    headers = {
        'Host': 'download.lfd.uci.edu',
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/57.0.2987.98 Safari/537.36 LBBROWSER',
        'Referer': 'https://www.lfd.uci.edu/~gohlke/pythonlibs/',
        'Connection': 'keep-alive',
        'Upgrade-Insecure-Requests': '1',
        'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8',
        'Accept-Encoding': 'gzip, deflate, sdch, br',
        'Accept-Language': 'zh-CN,zh;q=0.8',
    }
    response = requests.get(url=url1, headers=headers)
    # Download counter shared with the rest of the script.
    global i
    i += 1
    # 'with' guarantees the handle is closed even if the write fails; the
    # local is no longer called ``file`` so it does not shadow this function.
    with open(name, 'wb') as out_file:
        out_file.write(response.content)
    print(file_name)
    # NOTE(review): ``x`` is not defined in this function nor in the visible
    # part of the file; it may have been meant to be the counter ``i`` -
    # confirm against the rest of the script before changing.
    print("Completed : .... %d ..." % x)
# Current working directory at start-up; presumably where downloads are
# saved - confirm against the code that uses it.
save_path = os.getcwd()
# Site root that is fetched by getHtml below.
url = 'https://www.lfd.uci.edu/'
# Fetch the page body over the network at import time.
# NOTE(review): the very next statement rebinds ``html`` to a hard-coded
# string literal, so this download looks redundant - confirm before removing.
html = getHtml(url)
html='''
ad3‑2.2.1‑cp38‑cp38‑win_amd64.whl ad3‑2.2.1‑cp38‑cp38‑win32.whl ad3‑2.2.1‑cp37‑cp37m‑win_amd64.whl ad3‑2.2.1‑cp37‑cp37m‑win32.whl ad3‑2.2.1‑cp36‑cp36m‑win_amd64.whl ad3‑2.2.1‑cp36‑cp36m‑win32.whl ad3‑2.2.1‑cp35‑cp35m‑win_amd64.whl ad3‑2.2.1‑cp35‑cp35m‑win32.whl