from urllib.parse import urljoin

import requests
from bs4 import BeautifulSoup
# Fetch the table of contents (chapter list) of the book.
# Result: muluList, a list of dicts with keys "id" (1-based position),
# "url" (chapter link) and "title" (text of the list item).
bookMuluUrl = "http://www.janpn.com/book/wushentianxia.html"
muluList = []
try:
    # A timeout keeps the script from hanging on a stalled connection, and
    # raise_for_status() stops an HTTP error page from being parsed as if it
    # were the chapter list.
    bookMulu = requests.get(bookMuluUrl, timeout=10)
    bookMulu.raise_for_status()
    muluContent = BeautifulSoup(bookMulu.text, "html.parser")
    chapterPanel = muluContent.find(attrs={"class": "panel-chapterlist"})
    if chapterPanel is None:
        raise ValueError("panel-chapterlist element not found")
    mulu = chapterPanel.find_all_next("li")
    for i in mulu:
        link = i.a
        # Skip list items that carry no link instead of letting a single
        # odd entry abort the whole table of contents.
        if link is None or not link.get("href"):
            continue
        muluList.append({
            "id": len(muluList) + 1,
            # urljoin leaves absolute links untouched and resolves relative
            # ones against the table-of-contents page.
            "url": urljoin(bookMuluUrl, str(link["href"])),
            "title": i.text,
        })
except (requests.RequestException, ValueError) as e:
    print("获取目录失败", e)
# Print the table of contents.
for i in muluList:
    print(i)
# Interactive reader: ask for a starting chapter ID, then print chapters one
# after another until the user answers "n", the input stream ends, a chapter
# cannot be fetched, or the last chapter has been shown.
readFlag = bool(muluList)  # nothing to read when the chapter list is empty
charpterNumber = 0
# Keep asking until the ID is a number inside 1..len(muluList); an
# unchecked 0 or negative value would silently index from the end of the list.
while readFlag and not (1 <= charpterNumber <= len(muluList)):
    try:
        charpterNumber = int(input("请输入要阅读的章节ID"))
    except ValueError:
        # Non-numeric input: ask again instead of crashing.
        charpterNumber = 0
    except EOFError:
        # Input stream closed: nobody is left to answer the prompt.
        readFlag = False

while readFlag:
    charpterUrl = muluList[charpterNumber - 1]['url']
    charpterTitle = muluList[charpterNumber - 1]['title']
    try:
        response = requests.get(charpterUrl, timeout=10)
        response.raise_for_status()
    except requests.RequestException as e:
        print("获取章节内容失败", e)
        break
    soup = BeautifulSoup(response.text, "html.parser")
    content = soup.find(id="htmlContent")
    if content is None:
        # Without this check the literal text "None" would be printed.
        print("获取章节内容失败", charpterUrl)
        break
    # Turn every <br> into a newline, then take the plain text so the
    # wrapper tag and escaped entities are not shown to the reader.
    for lineBreak in content.find_all("br"):
        lineBreak.replace_with("\n")
    story = content.get_text()
    print(charpterTitle)
    print(story)
    if charpterNumber >= len(muluList):
        # That was the last chapter; advancing would index past the list.
        break
    try:
        continueReadFlag = input("是否继续阅读按N退出").strip().lower()
    except EOFError:
        # Stop rather than keep fetching chapters with nobody at the prompt.
        break
    if continueReadFlag == "n":
        readFlag = False
    else:
        charpterNumber = charpterNumber + 1
python抓小说阅读
發表評論
所有評論
還沒有人評論,想成為第一個評論的人麼? 請在上方評論欄輸入並且點擊發布.