import re
import json
from pymongo import MongoClient
import os
# def Write_json(data):
# open_Json = open("1.json", "a")
# Write_json = json.dumps(data)
# open_Json.write(Write_json)
# open_Json.close()
def load_Mongo(Address, port, Process_data, Name):
client = MongoClient(Address, port) #数据地址+端口号
db = client.portal #数据库
collection = db.typhoons #数据表
# collection.find({Name})
ret = collection.find({"ename": Name})
if not ret or ret.count() == 0:
collection.insert(Process_data)
for i in collection.find({"ename": Name}):
id = str(i['_id'])
print('Have been stored,' + 'ObjectID:' + '' + id)
else:
# collection.insert(Process_data)
for i in collection.find({"ename": Name}):
id = str(i['_id'])
print('Already exist,' + 'ObjectID:' + '' + id)
def loadFont(address, port, Json_File):
n = 0
Date = []
Info = []
ADV= []
LAT= []
LON= []
TIME= []
WIND= []
PR= []
STAT = []
Data_Header = []
json_File = Json_File #json文件地址
with open(json_File, encoding='utf-8') as f:
while True:
lines = f.readline()
n = n+1
if not lines:
break
pass
Colon = re.findall(r':', lines, re.I)
if Colon: #处理第一行数据
date = re.split(r":", lines) #分割冒号
date = date[1].replace('
', '').replace('
', '').replace(' ', '').replace(' ', '')
Date.append(date)
# print(Date)
else:
if n == 2:
info = lines
info = info.replace('
', '').replace('
', '').replace(' ', '')
Info.append(info)
else:
if n == 3:
Data_header = re.split(r" ", lines)
while '' in Data_header: #移除空格
Data_header.remove('')
for head_Num in range(len(Data_header)):
head_Find = re.findall(r'
', Data_header[head_Num], re.I)
if head_Find: #查找
并删除,然后加入json文件
Data_header[head_Num] = Data_header[head_Num].replace('
', '').replace('
', '').replace(' ', '')
# json_List.setdefault(Data_header[head_Num]) #增加键值对
Data_Header.append(Data_header[head_Num])
else:
head_Data = Data_header[head_Num]
# json_List.setdefault(head_Data) #增加键值对
Data_Header.append(head_Data)
# Write_json(json_List) #写入json
# print(Data_header)
else:
if n > 3:
all = re.split(r" ", lines)
while '' in all:
all.remove('')
ADV.append(all[0])
LAT.append(all[1])
LON.append(all[2])
TIME.append(all[3])
WIND.append(all[4])
PR.append(all[5])
stat = []
for count in range(len(all)):
if count > 5:
stat.append(all[count])
# print(stat)
else:
continue
stat = " ".join(str(i) for i in stat) #合并数据
stat = stat.replace('
', '').replace('
', '').replace(' ', '')
STAT.append(stat)
# print(STAT)
#设计字典
Addit_all = [ ]
json_List = {'ename': '', 'is_current': 'null','enddate':'null', 'name':'null', 'sn':'null','land':[ ], 'startdate':'',
'track':[ ] }
json_List['startdate'] = Date[0]
json_List['ename'] = Info[0]
i = len(ADV)
j = 0
while j < i:
# json_List ['startdate'] = TIME[j]
addit = {}
addit ['forecast'] = 'null'
if STAT[j] == 'TROPICAL STORM':
addit['type'] = 'TS'
elif STAT[j] == 'TROPICAL DEPRESSION':
addit['type'] = 'TD'
else:
addit['type'] = STAT[j]
addit['speed'] = WIND[j]
addit['moveDirection'] ='null'
# addit['ADV'] = ADV[j]
addit['longitude'] = LON[j]
addit['latitude'] = LAT[j]
addit ['radius10'] = 'null'
addit['time'] = TIME[j]
addit['radius7'] = 'null'
addit ['pressure'] = PR[j]
addit ['power'] = 'null'
addit['des'] = ''
addit['moveSpeed'] = 'null'
Addit_all.append(addit) #将多组数据加入数组
j = j + 1
json_List['track'] = Addit_all
# Write_json(json_List)
print(json_List)
load_Mongo(address, port, json_List, Info[0])
List = []
def traverse(json_Dir):
fs = os.listdir(json_Dir)
for file in fs:
tmp_path = os.path.join(json_Dir, file)
if not os.path.isdir(tmp_path):
file_path = tmp_path
List.append(file_path)
# print('文件: %s' % tmp_path)
else:
# print('文件夹:%s' % tmp_path)
traverse(tmp_path)
return List
if __name__=="__main__":
mongo_address = '127.0.0.1' #数据库地址
mongo_port = 27017 #数据库端口
json_Path = 'E:Typhoon_dataData' # json总文件夹地址
traverse(json_Path) #遍历文件夹,获取文件地址
for json_Filenum in range(len(List)):
loadFont(mongo_address, mongo_port, List[json_Filenum]) #载入mongo