python抓小說閱讀

import  requests
from bs4 import BeautifulSoup

#獲取目錄
# Fetch the book's table-of-contents page and build muluList: one dict per
# chapter holding a 1-based "id", the chapter "url" and its "title".
bookMuluUrl = "http://www.janpn.com/book/wushentianxia.html"
muluList = []
try:
    # Without a timeout requests can block forever on a stalled server.
    bookMulu = requests.get(bookMuluUrl, timeout=10)
    # Treat HTTP error pages (404/500/...) as a failure instead of parsing them.
    bookMulu.raise_for_status()
    muluContent = BeautifulSoup(bookMulu.text, "html.parser")
    panel = muluContent.find(attrs={"class": "panel-chapterlist"})
    if panel is None:
        # find() returns None when nothing matches; report it rather than
        # crashing with AttributeError on the next call.
        raise LookupError("panel-chapterlist not found")
    mulu = panel.find_all_next("li")
except (requests.RequestException, LookupError) as e:
    print("獲取目錄失敗", e)
    mulu = []

for item in mulu:
    # find_all_next() returns every <li> after the panel in document order,
    # so some items may not be chapter links. Skip those individually instead
    # of aborting the whole catalog on the first one.
    link = item.a
    if link is None or not link.get("href"):
        continue
    muluList.append({
        # Ids stay consecutive so that id - 1 is always the list index.
        "id": len(muluList) + 1,
        "url": str(link["href"]),
        "title": item.text,
    })

#打印目錄
# Print the table of contents, one chapter entry (id / url / title) per line.
for chapter in muluList:
    print(chapter)


#閱讀
# Interactive reader: ask for a chapter id, print that chapter, then keep
# advancing to the next chapter until the user answers "n", input ends,
# a download fails, or the catalog runs out.
readFlag = True
try:
    charpterNumber = int(input("請輸入要閱讀的章節ID"))
except ValueError:
    # Non-numeric input: report it instead of dying with a traceback.
    print("章節ID必須是數字")
    charpterNumber = 0
    readFlag = False

while readFlag:
    # Chapter ids are 1-based. Reject out-of-range ids explicitly: 0 or a
    # negative id would otherwise wrap around via negative indexing, and an
    # id past the last chapter would raise IndexError.
    if not 1 <= charpterNumber <= len(muluList):
        print("章節ID超出範圍", charpterNumber)
        break

    chapter = muluList[charpterNumber - 1]
    charpterUrl = chapter['url']
    charpterTitle = chapter['title']

    try:
        # Without a timeout requests can block forever on a stalled server.
        response = requests.get(charpterUrl, timeout=10)
        response.raise_for_status()
    except requests.RequestException as e:
        print("獲取章節失敗", e)
        break

    soup = BeautifulSoup(response.text, "html.parser")
    content = soup.find(id="htmlContent")

    # Show which chapter is being displayed.
    print(charpterTitle)
    if content is None:
        # find() returns None when the node is missing; str(None) would
        # otherwise print the literal text "None" as the chapter body.
        print("未找到章節內容")
    else:
        story = str(content)
        print(story.replace("<br/>", "\n"))

    try:
        continueReadFlag = input("是否繼續閱讀按N退出").strip().lower()
    except EOFError:
        # No more input available: stop instead of silently paging through
        # every remaining chapter.
        break

    if continueReadFlag == "n":
        readFlag = False
    else:
        charpterNumber = charpterNumber + 1

發表評論
所有評論
還沒有人評論,想成為第一個評論的人麼? 請在上方評論欄輸入並且點擊發布.
相關文章