(14) 爬虫 XPath 使用

from lxml import etree
import requests
# Scrape the listing page at `url` and print the strings matched by two
# XPath queries, first as raw lists and then paired line by line.
url = 'https://www.qidian.com/all'
# Send a browser-style User-Agent header instead of the library default.
headers = {
    'User-Agent': 'Mozilla/5.0(Windows;U;WindowsNT6.1;en-us)AppleWebKit/534.50(KHTML,likeGecko)Version/5.1Safari/534.50',
}
# requests applies no timeout by default; bound the wait so a stalled
# connection cannot hang the script forever.
response = requests.get(url, headers=headers, timeout=10)
# Fail loudly on a 4xx/5xx response rather than parsing an error page and
# silently printing empty lists.
response.raise_for_status()
e = etree.HTML(response.text)
# Text nodes of every <a> that is a direct child of an <h4>
# (presumably the book titles -- verify against the live page markup).
name = e.xpath('//h4/a/text()')
# Text nodes of the first <a> inside each <p class="author">
# (presumably the author names -- verify against the live page markup).
aut = e.xpath('''//p[@class='author']/a[1]/text()''')
print(name)
print(aut)
# zip() stops at the shorter list, so unmatched trailing entries are dropped.
for n, a in zip(name, aut):
    print(n, ':', a)
posted @ 2020-07-14 21:53  kuanleung  阅读(7)  评论(0)    收藏  举报  来源