1 static void Main(string[] args)2 {3 int errorCount = 0;//计算爬取失败的次数
4 int count = 450;//结束范围
5 for (int i = 401; i <= count; i++)6 {7 Thread.Sleep(2000);//每隔两秒爬取一次,不要给服务器压力
8 try
9 {10 HtmlWeb web = newHtmlWeb();11 //https://maoyan.com/films/1
12 web.OverrideEncoding =Encoding.UTF8;13 HtmlDocument doc = web.Load($"https://maoyan.com/films/{i}");//把url中的1替换为i
14
15 HtmlDocument htmlDoc = newHtmlDocument();16 string url = $"https://maoyan.com/films/{i}";17
18 //获取电影名
19 HtmlNode MovieTitle = doc.DocumentNode.SelectSingleNode("//div[@class=‘movie-brief-container‘]/h1[@class=‘name‘]");//分析页面结构后得到的div20 if (MovieTitle == null)//如果是null,那么表明进入验证页面了,执行第二种方法
21 {22 string urlResponse =URLRequest(url);23 htmlDoc.LoadHtml(urlResponse);24 MovieTitle &