• 遍历win10文件夹并解析json文件,按照json格式存入mongo数据库(基于python 3.6)


    import re
    import json
    from pymongo import MongoClient
    import os

    # def Write_json(data):
    # open_Json = open("1.json", "a")
    # Write_json = json.dumps(data)
    # open_Json.write(Write_json)
    # open_Json.close()

    def load_Mongo(Address, port, Process_data, Name):
    client = MongoClient(Address, port) #数据地址+端口号
    db = client.portal #数据库
    collection = db.typhoons #数据表
    # collection.find({Name})
       ret = collection.find({"ename": Name})
    if not ret or ret.count() == 0:
    collection.insert(Process_data)
    for i in collection.find({"ename": Name}):
    id = str(i['_id'])
    print('Have been stored,' + 'ObjectID:' + '' + id)

    else:
    # collection.insert(Process_data)
    for i in collection.find({"ename": Name}):
    id = str(i['_id'])
    print('Already exist,' + 'ObjectID:' + '' + id)
     
    def loadFont(address, port, Json_File):
    n = 0
    Date = []
    Info = []
    ADV= []
    LAT= []
    LON= []
    TIME= []
    WIND= []
    PR= []
    STAT = []
    Data_Header = []
    json_File = Json_File #json文件地址
    with open(json_File, encoding='utf-8') as f:
    while True:
    lines = f.readline()
    n = n+1
    if not lines:
    break
    pass

    Colon = re.findall(r':', lines, re.I)
    if Colon: #处理第一行数据
    date = re.split(r":", lines) #分割冒号
    date = date[1].replace(' ', '').replace(' ', '').replace(' ', '').replace(' ', '')
    Date.append(date)
    # print(Date)
    else:


    if n == 2:
    info = lines
    info = info.replace(' ', '').replace(' ', '').replace(' ', '')
    Info.append(info)
    else:
    if n == 3:
    Data_header = re.split(r" ", lines)
    while '' in Data_header: #移除空格
    Data_header.remove('')
    for head_Num in range(len(Data_header)):
    head_Find = re.findall(r' ', Data_header[head_Num], re.I)
    if head_Find: #查找 并删除,然后加入json文件
    Data_header[head_Num] = Data_header[head_Num].replace(' ', '').replace(' ', '').replace(' ', '')
    # json_List.setdefault(Data_header[head_Num]) #增加键值对
    Data_Header.append(Data_header[head_Num])

    else:
    head_Data = Data_header[head_Num]
    # json_List.setdefault(head_Data) #增加键值对
    Data_Header.append(head_Data)
    # Write_json(json_List) #写入json
    # print(Data_header)


    else:
    if n > 3:
    all = re.split(r" ", lines)
    while '' in all:
    all.remove('')
    ADV.append(all[0])
    LAT.append(all[1])
    LON.append(all[2])
    TIME.append(all[3])
    WIND.append(all[4])
    PR.append(all[5])
    stat = []
    for count in range(len(all)):
    if count > 5:
    stat.append(all[count])
    # print(stat)
    else:
    continue
    stat = " ".join(str(i) for i in stat) #合并数据
    stat = stat.replace(' ', '').replace(' ', '').replace(' ', '')
    STAT.append(stat)
    # print(STAT)


    #设计字典

    Addit_all = [ ]
    json_List = {'ename': '', 'is_current': 'null','enddate':'null', 'name':'null', 'sn':'null','land':[ ], 'startdate':'',
    'track':[ ] }
    json_List['startdate'] = Date[0]
    json_List['ename'] = Info[0]
    i = len(ADV)
    j = 0
    while j < i:
    # json_List ['startdate'] = TIME[j]
    addit = {}
    addit ['forecast'] = 'null'
    if STAT[j] == 'TROPICAL STORM':
    addit['type'] = 'TS'
    elif STAT[j] == 'TROPICAL DEPRESSION':
    addit['type'] = 'TD'
    else:


    addit['type'] = STAT[j]
    addit['speed'] = WIND[j]
    addit['moveDirection'] ='null'
    # addit['ADV'] = ADV[j]
    addit['longitude'] = LON[j]
    addit['latitude'] = LAT[j]
    addit ['radius10'] = 'null'
    addit['time'] = TIME[j]
    addit['radius7'] = 'null'
    addit ['pressure'] = PR[j]
    addit ['power'] = 'null'
    addit['des'] = ''
    addit['moveSpeed'] = 'null'
    Addit_all.append(addit) #将多组数据加入数组
    j = j + 1
    json_List['track'] = Addit_all
    # Write_json(json_List)
    print(json_List)
    load_Mongo(address, port, json_List, Info[0])


    List = []
    def traverse(json_Dir):
    fs = os.listdir(json_Dir)
    for file in fs:
    tmp_path = os.path.join(json_Dir, file)
    if not os.path.isdir(tmp_path):
    file_path = tmp_path
    List.append(file_path)
    # print('文件: %s' % tmp_path)
    else:
    # print('文件夹:%s' % tmp_path)
    traverse(tmp_path)
    return List

    if __name__=="__main__":
    mongo_address = '127.0.0.1' #数据库地址
    mongo_port = 27017 #数据库端口
    json_Path = 'E:Typhoon_dataData' # json总文件夹地址
    traverse(json_Path) #遍历文件夹,获取文件地址
    for json_Filenum in range(len(List)):
    loadFont(mongo_address, mongo_port, List[json_Filenum]) #载入mongo
  • 相关阅读:
    新书《JFinal极速开发实战》正式发布
    Maven转化为Dynamic Web Module
    SpringMVC——数据校验
    SpringMVC——请求映射
    Spring——Bean的命名及实例化
    js实现省市区三级联动
    MySQL数据库忘记密码
    Spring——控制反转
    SpringMVC(五)@RequestHeader和@CookieValue
    SpringMVC(四)@RequestParam
  • 原文地址:https://www.cnblogs.com/setname/p/8597357.html
Copyright © 2020-2023  润新知