JumonyParser帮助类

此类可以根据地址加载 HTML 文档，并能根据 CSS 选择器获取标签，用于网页数据抓取。

 

using System;
using System.Collections.Generic;
using System.Linq;
using System.Text;
using System.Threading.Tasks;

using Ivony.Html;
using Ivony.Html.Parser;

namespace zhcwCapPackage
{
    /// <summary>
    /// Helper around <c>JumonyParser</c>: loads an HTML document from an address
    /// and queries its elements with a CSS selector.
    /// </summary>
    public class ReptileHelper
    {
        /// <summary>
        /// HTML document loaded by the constructor; every instance query runs against it.
        /// </summary>
        private readonly IHtmlDocument doc;

        /// <summary>
        /// Encoding handed to the parser whenever a document is loaded.
        /// </summary>
        private static readonly Encoding encoding = Encoding.UTF8;

        /// <summary>
        /// Loads the HTML document at <paramref name="url"/> so it can be queried repeatedly.
        /// </summary>
        /// <param name="url">Address of the document to load.</param>
        /// <exception cref="ArgumentNullException"><paramref name="url"/> is null.</exception>
        public ReptileHelper(string url)
        {
            if (url == null)
            {
                throw new ArgumentNullException("url");
            }

            doc = new JumonyParser().LoadDocument(url, encoding);
        }

        /// <summary>
        /// Queries the document loaded by this instance for the elements matching a CSS selector.
        /// </summary>
        /// <param name="selector">CSS selector.</param>
        /// <returns>The elements returned by the document's <c>Find</c> for the selector.</returns>
        /// <exception cref="ArgumentNullException"><paramref name="selector"/> is null.</exception>
        public IEnumerable<IHtmlElement> QueryHtmlElements(string selector)
        {
            if (selector == null)
            {
                throw new ArgumentNullException("selector");
            }

            return doc.Find(selector);
        }

        /// <summary>
        /// Loads the document at <paramref name="url"/> and queries it for the elements
        /// matching a CSS selector, without keeping the document around.
        /// </summary>
        /// <param name="url">Address of the document to load.</param>
        /// <param name="selector">CSS selector.</param>
        /// <returns>The elements returned by the document's <c>Find</c> for the selector.</returns>
        /// <exception cref="ArgumentNullException">
        /// <paramref name="url"/> or <paramref name="selector"/> is null.
        /// </exception>
        public static IEnumerable<IHtmlElement> QueryHtmlElements(string url, string selector)
        {
            // Validate both arguments before loading, so a bad selector does not
            // cost a document fetch first.
            if (url == null)
            {
                throw new ArgumentNullException("url");
            }

            if (selector == null)
            {
                throw new ArgumentNullException("selector");
            }

            // Reuse the instance path so loading and querying live in one place.
            return new ReptileHelper(url).QueryHtmlElements(selector);
        }
    }
}

 

posted @ 2017-07-14 10:13  花生打代码会头痛  阅读(640)  评论(0)    收藏  举报