遍历win10文件夹并解析json文件,按照json格式存入mongo数据库(基于python 3.6)

Posted Moucong

tags:

篇首语:本文由小常识网(cha138.com)小编为大家整理,主要介绍了遍历win10文件夹并解析json文件,按照json格式存入mongo数据库(基于python 3.6)相关的知识,希望对你有一定的参考价值。

import re
import json
from pymongo import MongoClient
import os

# def Write_json(data):
# open_Json = open("1.json", "a")
# Write_json = json.dumps(data)
# open_Json.write(Write_json)
# open_Json.close()

def load_Mongo(Address, port, Process_data, Name):
client = MongoClient(Address, port) #数据地址+端口号
db = client.portal #数据库
collection = db.typhoons #数据表
# collection.find({Name})
collection.insert(Process_data)
for i in collection.find({"ename": Name}):
id = str(i[‘_id‘])
print(‘已存放,‘ + ‘ObjectID:‘ + ‘‘ + id)
def loadFont(address, port, Json_File):
n = 0
Date = []
Info = []
ADV= []
LAT= []
LON= []
TIME= []
WIND= []
PR= []
STAT = []
Data_Header = []
json_File = Json_File #json文件地址
with open(json_File, encoding=‘utf-8‘) as f:
while True:
lines = f.readline()
n = n+1
if not lines:
break
pass

Colon = re.findall(r‘:‘, lines, re.I)
if Colon: #处理第一行数据
date = re.split(r":", lines) #分割冒号
date = date[1].replace(\r, ‘‘).replace(\n, ‘‘).replace(\t, ‘‘).replace(‘ ‘, ‘‘)
Date.append(date)
# print(Date)
else:


if n == 2:
info = lines
info = info.replace(\r, ‘‘).replace(\n, ‘‘).replace(\t, ‘‘)
Info.append(info)
else:
if n == 3:
Data_header = re.split(r" ", lines)
while ‘‘ in Data_header: #移除空格
Data_header.remove(‘‘)
for head_Num in range(len(Data_header)):
head_Find = re.findall(r‘\n‘, Data_header[head_Num], re.I)
if head_Find: #查找\n并删除,然后加入json文件
Data_header[head_Num] = Data_header[head_Num].replace(\r, ‘‘).replace(\n, ‘‘).replace(\t, ‘‘)
# json_List.setdefault(Data_header[head_Num]) #增加键值对
Data_Header.append(Data_header[head_Num])

else:
head_Data = Data_header[head_Num]
# json_List.setdefault(head_Data) #增加键值对
Data_Header.append(head_Data)
# Write_json(json_List) #写入json
# print(Data_header)


else:
if n > 3:
all = re.split(r" ", lines)
while ‘‘ in all:
all.remove(‘‘)
ADV.append(all[0])
LAT.append(all[1])
LON.append(all[2])
TIME.append(all[3])
WIND.append(all[4])
PR.append(all[5])
stat = []
for count in range(len(all)):
if count > 5:
stat.append(all[count])
# print(stat)
else:
continue
stat = " ".join(str(i) for i in stat) #合并数据
stat = stat.replace(\r, ‘‘).replace(\n, ‘‘).replace(\t, ‘‘)
STAT.append(stat)
# print(STAT)


#设计字典

Addit_all = [ ]
json_List = {‘ename‘: ‘‘, ‘is_current‘: ‘null‘,‘enddate‘:‘null‘, ‘name‘:‘null‘, ‘sn‘:‘null‘,‘land‘:[ ], ‘startdate‘:‘‘,
‘track‘:[ ] }
json_List[‘startdate‘] = Date[0]
json_List[‘ename‘] = Info[0]
i = len(ADV)
j = 0
while j < i:
# json_List [‘startdate‘] = TIME[j]
addit = {}
addit [‘forecast‘] = ‘null‘
if STAT[j] == ‘TROPICAL STORM‘:
addit[‘type‘] = ‘TS‘
elif STAT[j] == ‘TROPICAL DEPRESSION‘:
addit[‘type‘] = ‘TD‘
else:


addit[‘type‘] = STAT[j]
addit[‘speed‘] = WIND[j]
addit[‘moveDirection‘] =‘null‘
# addit[‘ADV‘] = ADV[j]
addit[‘longitude‘] = LON[j]
addit[‘latitude‘] = LAT[j]
addit [‘radius10‘] = ‘null‘
addit[‘time‘] = TIME[j]
addit[‘radius7‘] = ‘null‘
addit [‘pressure‘] = PR[j]
addit [‘power‘] = ‘null‘
addit[‘des‘] = ‘‘
addit[‘moveSpeed‘] = ‘null‘
Addit_all.append(addit) #将多组数据加入数组
j = j + 1
json_List[‘track‘] = Addit_all
# Write_json(json_List)
print(json_List)
load_Mongo(address, port, json_List, Info[0])


List = []
def traverse(json_Dir):
fs = os.listdir(json_Dir)
for file in fs:
tmp_path = os.path.join(json_Dir, file)
if not os.path.isdir(tmp_path):
file_path = tmp_path
List.append(file_path)
# print(‘文件: %s‘ % tmp_path)
else:
# print(‘文件夹:%s‘ % tmp_path)
traverse(tmp_path)
return List

if __name__=="__main__":
mongo_address = ‘127.0.0.1‘ #数据库地址
mongo_port = 27017 #数据库端口
json_Path = ‘E:\Typhoon_data\Data‘ # json总文件夹地址
traverse(json_Path) #遍历文件夹,获取文件地址
for json_Filenum in range(len(List)):
loadFont(mongo_address, mongo_port, List[json_Filenum]) #载入mongo


























































































































































以上是关于遍历win10文件夹并解析json文件,按照json格式存入mongo数据库(基于python 3.6)的主要内容,如果未能解决你的问题,请参考以下文章

使用Java开发 接收一个Json文件,然后解析Json 并按照特定的Csv格式转换,输出Csv格式的文件,求案例谢谢

解析连续 JSON 文件的最佳方法?

获取本地的json并展示

JS对JSON对象遍历输出的时候真的是按照顺序输出吗?

win10怎么关闭始终使用这种方式打开json

qt解析json汉字和数字一起的时候提示数据错误