使用HtmlAgilityPack抓取html标签属性内容

第一步:通过 NuGet 安装 HtmlAgilityPack(在程序包管理器控制台执行 Install-Package HtmlAgilityPack)


第二步:简单抓取一些想要的信息:

        /// <summary>
        /// Loads a sample page with HtmlAgilityPack and prints, in order: the
        /// meta tags keyed by <c>property</c>, the meta tags keyed by <c>name</c>,
        /// the page title, and the <c>src</c> of the first <c>img</c> element.
        /// Waits for a key press before exiting.
        /// </summary>
        /// <param name="args">Command-line arguments (unused).</param>
        static void Main(string[] args)
        {
            HtmlWeb webClient = new HtmlWeb();
            HtmlDocument doc = webClient.Load("http://www.iqiyi.com/v_19rrdze0xk.html#vfrm=24-9-0-1");

            #region [head meta: property (key) / content (value)]
            PrintMetaPairs(doc, "property", "[获取 head meta property(键) content(值)]");
            #endregion

            #region [head meta: name (key) / content (value)]
            PrintMetaPairs(doc, "name", "[获取 head meta name(键) content(值)]");
            #endregion

            #region [title]
            Console.WriteLine();
            Console.WriteLine("[获取 title]");
            HtmlNode titleNode = doc.DocumentNode.SelectSingleNode("//title");
            if (titleNode != null)
            {
                Console.WriteLine("title:" + titleNode.InnerText);
            }
            #endregion

            #region [first img src]
            Console.WriteLine();
            Console.WriteLine("[获取 首个 img src]");
            HtmlNode imgNode = doc.DocumentNode.SelectSingleNode("//img");
            if (imgNode != null)
            {
                // The first <img> may have no src attribute (e.g. lazy-loaded images);
                // GetAttributeValue returns the fallback instead of dereferencing null.
                string src = imgNode.GetAttributeValue("src", string.Empty);
                Console.WriteLine("img src:" + src);
            }
            #endregion

            Console.ReadKey();
        }

        /// <summary>
        /// Prints one "key : content" line for every <c>meta</c> element that
        /// carries the attribute <paramref name="keyAttribute"/>. Prints nothing,
        /// not even the heading, when no such element exists.
        /// </summary>
        /// <param name="doc">The parsed HTML document to search.</param>
        /// <param name="keyAttribute">Name of the meta attribute used as the key ("property" or "name").</param>
        /// <param name="heading">Section heading written before the pairs.</param>
        private static void PrintMetaPairs(HtmlDocument doc, string keyAttribute, string heading)
        {
            HtmlNodeCollection metaNodes = doc.DocumentNode.SelectNodes(".//meta[@" + keyAttribute + "]");
            if (metaNodes == null)
            {
                // SelectNodes yields null rather than an empty collection when nothing matches.
                return;
            }

            Console.WriteLine();
            Console.WriteLine(heading);
            foreach (HtmlNode metaNode in metaNodes)
            {
                // The XPath only guarantees the key attribute; "content" may be absent,
                // so read both through GetAttributeValue with an empty-string fallback.
                string key = metaNode.GetAttributeValue(keyAttribute, string.Empty);
                string content = metaNode.GetAttributeValue("content", string.Empty);
                Console.WriteLine(string.Format("{0}\t:\t{1}", key, content));
            }
        }



评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值