# -*- coding: GB2312 -*-
import requests
from bs4 import BeautifulSoup
import csv
import time
import codecs
# Fetch data
def getHTML(url):
    """Fetch *url* and return the response body as text.

    The endpoint serves GB2312-encoded pages (``apparent_encoding``
    reports GB2312) but does not reliably declare it in the headers,
    so we explicitly adopt the detected encoding before reading
    ``.text`` — otherwise requests falls back to ISO-8859-1 and the
    Chinese text is garbled.

    :param url: URL to fetch
    :return: decoded response body (str)
    """
    response = requests.get(url)
    # e.g. GB2312 for this endpoint; trust content detection over headers
    response.encoding = response.apparent_encoding
    return response.text
# Process data
def writeFile(writer, res):
    """Extract the record array from *res* and append one CSV row per record.

    *res* looks like ``var TbrNdpvg={pages:401,data:["f1,f2,...", ...]}``;
    each double-quoted element of ``data`` is one comma-separated record.

    :param writer: an open ``csv.writer`` that rows are appended to
    :param res: raw response text containing the bracketed data array
    """
    start_idx = res.find("[")
    end_idx = res.find("]")
    # Slice out the array interior.  The original code used ``end_idx - 1``,
    # which also drops the closing quote of the last record — harmless,
    # since all quotes are stripped below; kept for identical behavior.
    body = res[start_idx + 1:end_idx - 1]
    # Split on the quote+comma record separator, then strip remaining quotes.
    records = [item.replace('"', '') for item in body.split('",')]
    for record in records:
        fields = record.split(',')
        # Trailing tab stops spreadsheet apps from showing the first
        # column (stock code) in scientific notation.
        fields[0] = fields[0] + '\t'
        writer.writerow(fields)
# Fetch 40 pages of holder-reduction data and append every row to one CSV.
# The file is opened ONCE with a context manager (the original re-opened it
# in append mode on every iteration and never closed it — a handle leak).
with codecs.open('d:/Aa.csv', 'a', encoding='utf8') as csvFile:  # codecs.open() prevents mojibake on write
    writer = csv.writer(csvFile)
    for page in range(40):
        # NOTE(review): the original URL literally contained '¶m=' — the
        # HTML entity for '&para' swallowed from '&param='; restored here.
        # NOTE(review): pages start at 0 here; confirm the API is not 1-based.
        url = ("http://data.eastmoney.com/DataCenter_V3/gdzjc.ashx"
               "?pagesize=500&page=" + str(page) +
               "&js=var%20UWExJjvK&param=&sortRule=-1&sortType=BDJZ"
               "&tabid=jjc&code=&name=&rt=50815994")
        print(url)
        res = getHTML(url)
        time.sleep(1)  # throttle: one request per second
        writeFile(writer, res)