写了个爬虫爬文章,就只爬到了点点!大佬们救救孩子吧...
pycharm吧
全部回复
仅看楼主
level 1
# -*- coding: utf-8 -*-
from urllib.parse import urljoin

import parsel
import requests
# Scrape every chapter linked from a novel's index page and append the text
# of each chapter to "<novel name>.txt" in the current directory.
url = "https://www.biqugee.com/book/61885/"
headers = {"User-Agent": "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/70.0.3538.25 Safari/537.36 Core/1.70.3883.400 QQBrowser/10.8.4559.400"}


def fetch_selector(page_url):
    """Download *page_url* and return its HTML wrapped in a parsel Selector.

    Every request carries the browser-like ``headers`` defined above; the
    original script sent them only for the index page, so chapter pages were
    requested with the default python-requests User-Agent.

    Raises:
        requests.HTTPError: if the server answers with a 4xx/5xx status.
        requests.RequestException: on connection problems or timeout.
    """
    response = requests.get(url=page_url, headers=headers, timeout=10)
    # Fail loudly on an error page instead of parsing it as if it were content.
    response.raise_for_status()
    # NOTE(review): assumes the site may not declare its charset in the HTTP
    # headers; falling back to the detected encoding avoids mojibake then.
    response.encoding = response.apparent_encoding
    return parsel.Selector(response.text)


selector = fetch_selector(url)
# Fall back to a fixed name so a missing <h1> does not crash on `None + ".txt"`.
novel_name = (selector.css("#info h1::text").get() or "novel").strip()
href = selector.css("#list dd a::attr(href)").getall()
# print(novel_name)
# print(href)

# Open the output once (append mode, as before) rather than once per chapter.
with open(novel_name + ".txt", mode="a", encoding="utf-8") as f:
    for link in href:
        # urljoin copes with both "/book/..." and "123.html" style hrefs,
        # whereas plain string concatenation produced "//" or a wrong path.
        link_url = urljoin(url, link)
        selector_1 = fetch_selector(link_url)
        # Chapter title.
        title = (selector_1.css(".bookname h1::text").get() or "").strip()
        # Novel content: every text node under #content.
        contents = selector_1.css("#content ::text").getall()
        # Strip each fragment once and drop the ones that are only whitespace.
        contents2 = [text for text in map(str.strip, contents) if text]
        # Write the title (previously extracted but never saved) and end the
        # chapter with a blank line so consecutive chapters do not run together.
        f.write(title + "\n" + "\n".join(contents2) + "\n\n")
2022年03月05日 08点03分 1
1