import requests
from fack user-agent import UserAgent
from lxml import etree
from random import randint
from time import sleep
from bs4 import BeautifulSoup
def parse_index(html):
    """Collect the detail-page URLs linked from a listing page.

    Args:
        html: Markup of the listing page, in a form accepted by
            ``etree.HTML``.

    Returns:
        A list of URL strings, one per ``href`` matched by the XPath query,
        each prefixed with the site root.
    """
    e = etree.HTML(html)
    # NOTE(review): the class value and the host name below were
    # reconstructed from a garbled source line -- confirm both against the
    # live page markup before relying on them.
    all_url = e.xpath(
        '//div[@class="channel_detail movie-item-title"]/a/@href'
    )
    # The matched hrefs are presumably site-relative paths, hence the prefix.
    return ['http://moven.com{}'.format(url) for url in all_url]
def parse_info(html):
    """Extract the name, types and actors from a detail page.

    Args:
        html: Markup of the detail page, in a form accepted by
            ``etree.HTML``.

    Returns:
        A dict with the keys ``"name"``, ``"types"`` and ``"actors"``.
        ``name`` and ``types`` are the first text node matched by their
        XPath queries; ``actors`` is whatever ``format_actors`` returns for
        the list of matched actor text nodes.

    Raises:
        IndexError: If the name or types query matches nothing.
    """
    e = etree.HTML(html)
    name = e.xpath('//h3[@class="name"]/text()')[0]
    # XPath positions are 1-based: ``[1]`` picks the first matching <li>
    # under each parent, and ``[0]`` then takes the first text node returned.
    types = e.xpath('//li[@class="ellipsis"][1]/text()')[0]
    actors = e.xpath(
        '//li[@class="celebrity actor"]/div[@class="info"]/a/text()'
    )
    actors = format_actors(actors)
    return {
        "name": name,
        "types": types,
        "actors": actors,
    }