# 导入库
import requests
from bs4 import BeautifulSoup


def getUrlText(url, timeout=10):
    """Fetch ``url`` and return summary information about the response.

    Args:
        url: Address of the page to download.
        timeout: Seconds to wait for the server before giving up, so a
            stalled connection cannot block the caller forever.

    Returns:
        A 5-tuple ``(text, status_code, text_length, encoding,
        soup_text_length)`` where ``text`` is the response body decoded as
        UTF-8 and ``soup_text_length`` is the length of the text content
        BeautifulSoup extracts from that body. ``None`` is returned when
        the request fails or the server answers with an HTTP error status.
    """
    try:
        web = requests.get(url, timeout=timeout)
        # Reject 4xx/5xx answers before spending time parsing the body.
        web.raise_for_status()
    except requests.RequestException:
        # Covers connection errors, timeouts, invalid URLs and HTTP errors;
        # unrelated exceptions (e.g. KeyboardInterrupt) still propagate.
        return None

    # Set the encoding BEFORE reading ``web.text`` so the returned text and
    # the parsed document are both decoded the same way.
    web.encoding = 'utf-8'
    html = web.text

    # Name the parser explicitly: the result no longer depends on which
    # optional parsers happen to be installed, and bs4 emits no warning.
    soup = BeautifulSoup(html, 'html.parser')
    return html, web.status_code, len(html), web.encoding, len(soup.text)


# Target page fetched repeatedly by the loop below.
url = "https://www.sogou.com"

# Request the page 20 times in a row; for each attempt print its index,
# then whatever getUrlText returned (a tuple on success, None on failure).
for i in range(0, 20):
    print(i)
    fetched = getUrlText(url)
    print(fetched)

 

# cnblogs.com (博客园) © 2004-2025
# Zhejiang Public Network Security Filing No. 33010602011771; Zhejiang ICP Filing No. 2021040463-3