# Source: https://m.ituring.com.cn/book/tupubarticle/25962?bookID=1980&type=tubook&subject=%E7%AC%AC%204%20%E7%AB%A0%E3%80%80%E7%BD%91%E7%BB%9C%E7%88%AC%E8%99%AB%E6%A8%A1%E5%9E%8B
# 第 4 章 网络爬虫模型 —— 一个 Content 类的示例
import requests
from bs4 import BeautifulSoup
class Content:
    """Plain container for one scraped page: its URL, title and body text."""

    def __init__(self, url: str, title: str, body: str) -> None:
        """Store the three fields unchanged on the instance.

        Args:
            url: Address the content was fetched from.
            title: Title text of the page.
            body: Body text of the page.
        """
        self.url = url
        self.title = title
        self.body = body

    def __repr__(self) -> str:
        """Return a constructor-style representation to ease debugging."""
        return (
            f"{type(self).__name__}(url={self.url!r}, "
            f"title={self.title!r}, body={self.body!r})"
        )
def getPage(url, timeout=10):
    """Download ``url`` and return its HTML parsed with BeautifulSoup.

    Args:
        url: Address of the page to fetch.
        timeout: Seconds to wait for the server before giving up; passed
            straight to ``requests.get``. Pass ``None`` to wait indefinitely
            (the behaviour before this parameter existed).

    Returns:
        A ``BeautifulSoup`` object built from the response text using the
        built-in ``'html.parser'`` backend.
    """
    # Without a timeout a stalled server would block the scraper forever.
    response = requests.get(url, timeout=timeout)
    # NOTE(review): the HTTP status is not checked, so an error page is parsed
    # like any other page — confirm whether callers rely on that.
    return BeautifulSoup(response.text, 'html.parser')
def scrapeBrooking(url):
    """Fetch ``url`` and wrap its headline and post body in a ``Content``.

    The title is the text of the first ``<h1>`` element and the body is the
    text of the first ``<div class="post-body">`` element.

    Args:
        url: Address of the article page to scrape.

    Returns:
        A ``Content`` holding ``url``, the title text and the body text. A
        field is the empty string when its element is not present on the page.
    """
    soup = getPage(url)
    heading = soup.find('h1')
    post = soup.find('div', {'class': 'post-body'})
    # find() returns None when nothing matches; fall back to '' instead of
    # failing with an opaque AttributeError on ``None.text``.
    title = heading.text if heading is not None else ''
    body = post.text if post is not None else ''
    return Content(url, title, body)


