# -*- coding: utf-8 -*-
"""Problem 0008: given an HTML document, find its main text.

Fetches ``url`` and prints the page body twice: first the raw markup matched
by a regular expression, then, after a separator line, the text BeautifulSoup
extracts from the parsed document.
"""
import re

import requests
from bs4 import BeautifulSoup

url = 'http://linyii.com'

# NOTE(review): the markup inside the original pattern was lost (only
# ``[\s\S]*`` survived), so the <body> delimiters below are a reconstruction
# based on the ``soup.body`` lookup further down -- confirm against the
# intended pattern. ``[\s\S]*`` is greedy, so the match runs to the LAST
# closing tag in the document.
body_pattern = r'<body[^>]*>[\s\S]*</body>'

# Without a timeout requests waits forever on an unresponsive server.
data = requests.get(url, timeout=10)
# Fail loudly on 4xx/5xx rather than printing an error page as "main text".
data.raise_for_status()

# Approach 1: regular expression over the raw HTML.
r = re.findall(body_pattern, data.text)
if r:
    print(r[0])
else:
    # Previously an empty result crashed with IndexError on r[0].
    print('no markup matched the body pattern')

print('---------------------------------------------------------------')

# Approach 2: let an HTML parser find the body and strip the tags.
soup = BeautifulSoup(data.text, 'html.parser')
# html.parser does not synthesize a <body>; fall back to the whole document's
# text when the page has none instead of failing on None.text.
print(soup.body.text if soup.body is not None else soup.text)