• 东财数据爬取


    # coding: utf-8
    """
    # @Time    : 2021/5/24 8:57
    # @Author  : Gina Gao
    # @File    : 
    # @Software: PyCharm
    # @Descript:
    """
     
    import pandas as pd
    
    import openpyxl
    import  requests
    import  json
    
    
    def write_excel_xlsx(path, sheet_name, value):
        print("print",1)
        # index = len(value)
        # print(value.keys())#['f1', 'f2']
        # print(value)
        dict_list=[]
        for i in value:
            for j in i:
                dict_list.append(j)
        index=len(dict_list)
        print(dict_list[0].keys())
        workbook = openpyxl.Workbook()
        sheet = workbook.active
        sheet.title = sheet_name
        for i in range(0, index):
            # for j in range(0, len(value[i])):
            # print(dict_list[i])
            sheet.cell(row=i+1, column=1, value=str(dict_list[i]))
        workbook.save(path)
        print("xlsx格式表格写入数据成功!")
    
    def data_url():
        path='http://push2.eastmoney.com/api/qt/clist/get?fid=f62&po=1&pz=50&pn=1&np=1&fltt=2&invt=2&ut=b2884a393a59ad64002292a3e90d46a5&fs=m%3A0%2Bt%3A6%2Bf%3A!2%2Cm%3A0%2Bt%3A13%2Bf%3A!2%2Cm%3A0%2Bt%3A80%2Bf%3A!2%2Cm%3A1%2Bt%3A2%2Bf%3A!2%2Cm%3A1%2Bt%3A23%2Bf%3A!2%2Cm%3A0%2Bt%3A7%2Bf%3A!2%2Cm%3A1%2Bt%3A3%2Bf%3A!2&fields=f12%2Cf14%2Cf2%2Cf3%2Cf62%2Cf184%2Cf66%2Cf69%2Cf72%2Cf75%2Cf78%2Cf81%2Cf84%2Cf87%2Cf204%2Cf205%2Cf124%2Cf1'
        data=requests.get(path).content
        data_js=json.loads(data)
        total=data_js['data']['total']
        pn=int(total/50)
        print("total",total)
        if total%50!=0:
            pn=pn+1
        data_dict = {}
        data_detail=[]
        for i in range(1,pn):#pn 页数
            # print("i",i)
            path1='http://push2.eastmoney.com/api/qt/clist/get?fid=f62&po=1&pz=50&pn={i}&np=1&fltt=2&invt=2&ut=b2884a393a59ad64002292a3e90d46a5&fs=m%3A0%2Bt%3A6%2Bf%3A!2%2Cm%3A0%2Bt%3A13%2Bf%3A!2%2Cm%3A0%2Bt%3A80%2Bf%3A!2%2Cm%3A1%2Bt%3A2%2Bf%3A!2%2Cm%3A1%2Bt%3A23%2Bf%3A!2%2Cm%3A0%2Bt%3A7%2Bf%3A!2%2Cm%3A1%2Bt%3A3%2Bf%3A!2&fields=f12%2Cf14%2Cf2%2Cf3%2Cf62%2Cf184%2Cf66%2Cf69%2Cf72%2Cf75%2Cf78%2Cf81%2Cf84%2Cf87%2Cf204%2Cf205%2Cf124%2Cf1'.format(i=i)
            data = requests.get(path1).content
            data_js = json.loads(data)
            # print(data_js)
            data_detail.append(data_js['data']['diff'])
    
    
        return data_detail
    
    def main():
        data=data_url()
        print("data",len(data))
        # print(data)
        filepath=r'C:Userskexin.gaoDesktop2222222222222	est.xlsx'
        sheet_name='gina_test'
        write_excel_xlsx(filepath,sheet_name,data)
    if __name__ == '__main__':
        main()
  • 相关阅读:
    P4149 [IOI2011]Race dsu on tree
    CodeForces
    2020牛客国庆集训派对day2 CHEAP DELIVERIES
    Hero In Maze
    topo排序
    今年暑假不AC
    小国的游戏
    Stall Reservations
    博弈论
    Reversed Words
  • 原文地址:https://www.cnblogs.com/gina11/p/14863758.html
Copyright © 2020-2023  润新知