import os
from urllib.parse import urljoin
from urllib.request import urlopen,Request
from urllib.request import urlretrieve

from bs4 import BeautifulSoup
# Request headers passed to updateurl(); carries a desktop-browser
# User-Agent string instead of urllib's default one.
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/69.0.3947.100 Safari/537.36',
}
def updateurl(url, headers):
    """Fetch *url* and return its content parsed with BeautifulSoup.

    Args:
        url: Address of the page to download.
        headers: Mapping of HTTP request headers sent with the request.

    Returns:
        A ``BeautifulSoup`` object built with the ``"html.parser"`` backend.

    Any error raised by ``urlopen`` (e.g. network or HTTP failures)
    propagates to the caller unchanged.
    """
    ret = Request(url, headers=headers)
    # Use the response as a context manager so the underlying connection is
    # always closed; BeautifulSoup reads the whole body while constructing
    # the tree, so nothing is needed from the response afterwards.
    with urlopen(ret) as html:
        bs = BeautifulSoup(html, "html.parser")
    return bs
# Download every image found inside the article's <p> elements into the
# "lwt" directory under `path`, naming them image0.jpg, image1.jpg, ...
link = []  # resolved image URLs, in download order
url = 'https://www.sohu.com/a/286956359_301394'
bs = updateurl(url, headers)
img1 = bs.find('article', {'class': "article"})
i = 0  # index of the next image to save; also the count saved so far
path = 'C:\\Users\\user\\PycharmProjects\\pythonProject\\'

# Create the target directory (no error if it already exists) and save into
# that same directory, rather than into a cwd-relative "lwt" folder that may
# not be the one that was just created.
save_dir = os.path.join(path, 'lwt')
os.makedirs(save_dir, exist_ok=True)

# find() returns None when the page has no matching <article>; treat that as
# "no paragraphs" instead of failing with AttributeError.
paragraphs = img1.find_all('p') if img1 is not None else []
for kk in paragraphs:
    img = kk.find('img')
    # Skip paragraphs without an <img>, or whose <img> has no usable src.
    if img is None or not img.get('src'):
        continue
    # Resolve protocol-relative ("//host/x.jpg") and relative sources
    # against the page URL; absolute URLs are returned unchanged.
    link.append(urljoin(url, img['src']))
    urlretrieve(link[i], os.path.join(save_dir, 'image{}.jpg'.format(i)))
    i += 1