import requests
from bs4 import BeautifulSoup
import json


class bs4YQ():
    """Scrape the topic list page at ``url`` and save the entries as JSON.

    Instantiating the class runs the whole pipeline: fetch the page, parse
    it with BeautifulSoup (``ParseData``) and write the result to disk
    (``WriteJson``). Progress is reported with ``print``.

    Attributes:
        url: Address of the page that is fetched.
        headers: HTTP headers sent with the request.
        res_html: Body text of the response, or ``None`` before a
            successful fetch.
        info: List of dicts with the keys ``title``, ``author``, ``url``
            and ``time``, one per parsed topic.
    """

    url = 'https://www.lmonkey.com/t'
    # NOTE(review): the original user-agent value was missing from the source
    # (leaving a syntax error); a generic desktop-browser string is used here.
    headers = {
        'user-agent': (
            'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
            'AppleWebKit/537.36 (KHTML, like Gecko) '
            'Chrome/120.0.0.0 Safari/537.36'
        ),
    }
    res_html = None
    # Class-level default kept so ``bs4YQ.info`` still exists; __init__
    # rebinds a fresh list per instance so results are never shared.
    info = []

    def __init__(self):
        """Fetch the page and, on HTTP 200, parse it and write the JSON file."""
        self.info = []
        try:
            # A timeout keeps an unresponsive server from hanging the script.
            res = requests.get(url=self.url, headers=self.headers, timeout=10)
        except requests.RequestException:
            print('请求失败')
            return

        if res.status_code != 200:
            print('请求失败')
            return

        print('请求成功')
        self.res_html = res.text
        # Report success only when both parsing and writing succeeded.
        if self.ParseData() and self.WriteJson():
            print('succeed')

    def ParseData(self):
        """Extract topic entries from ``self.res_html`` into ``self.info``.

        Returns:
            True when every topic item was parsed, False when an item lacks
            one of the expected tags or attributes (``self.info`` is then
            left unchanged).
        """
        bs = BeautifulSoup(self.res_html, 'lxml')
        lists = bs.find_all(
            'div', {'class': 'list-group-item list-group-item-action p-06'})
        parsed = []
        try:
            for item in lists:
                # Attribute filters must be a dict; the original passed a set.
                titles = item.find('div', {'class': 'topic_title mb-0 lh-180'})
                if titles is None:
                    continue
                parsed.append({
                    'title': titles.text.split('\n')[0],
                    'author': item.strong.a.text,
                    'url': item.a['href'],
                    'time': item.span['title'],
                })
        except (AttributeError, KeyError, TypeError):
            # A missing tag yields None (AttributeError / TypeError on
            # access); a missing attribute raises KeyError.
            return False
        self.info.extend(parsed)
        return True

    def WriteJson(self, path='./yq.json'):
        """Write ``self.info`` to ``path`` as UTF-8 JSON.

        Args:
            path: Destination file; defaults to ``./yq.json``.

        Returns:
            True when the file was written, False when there is nothing to
            write or the file could not be written/serialised.
        """
        if not self.info:
            print('无法获取解析数据')
            return False
        try:
            with open(path, 'w', encoding='utf-8') as fp:
                # ensure_ascii=False keeps non-ASCII titles readable in the
                # UTF-8 file instead of emitting \uXXXX escapes.
                json.dump(self.info, fp, ensure_ascii=False)
        except (OSError, TypeError, ValueError):
            return False
        return True
# Script entry point: constructing the scraper runs fetch, parse and write.
if __name__ == '__main__':
    bs4YQ()
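# This article was submitted by an internet user. The views expressed are
# solely the author's own; they do not represent the position of this site,
# which assumes no related legal liability. If you repost it, please cite the
# source. If the content infringes rights, violates laws or regulations, or is
# factually inaccurate, please click [Report Content] to file a complaint.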