批量导入
https://blog.csdn.net/weixin_42886817/article/details/100141798
查看字典中的数据:字典名['key名']
import json
import os

import pandas as pd
# Batch-import every file found in data_dir as JSON and collect the
# 'structure_data' value of each top-level record into one flat list.
structure_data = []
data_dir = 'C:/Users/10069/Desktop/结构化字段/'
all_json = os.listdir(data_dir)
for j_name in all_json:
    # The context manager closes each file as soon as it has been parsed;
    # previously every handle stayed open until garbage collection.
    # NOTE(review): no encoding is passed, so the platform default applies —
    # confirm the files decode correctly (JSON is normally UTF-8).
    with open(data_dir + j_name) as j:
        info = json.load(j)  # parse one JSON file
    # Merge the 'structure_data' dict of every record in this file.
    for k in info:
        k_values = info[k]
        structure_data.append(k_values['structure_data'])
json文件不是单个合法的JSON文档(例如每行一个JSON对象的JSON Lines格式)、直接导入报格式错误时,给pd.read_json添加lines=True按行解析,导入为数据框
# Load a line-delimited JSON file into a DataFrame.  lines=True tells pandas
# to parse the file one JSON object per line; the 'utf_8_sig' codec decodes
# UTF-8 and drops a leading byte-order mark when one is present.
a = pd.read_json(
    'C:/Users/10069/Desktop/ZTBNews_random600_predict.json',
    lines=True,
    encoding='utf_8_sig',
)
对structure_data中各个key计数
判断字典中是否存在某个key:'name' in i.keys()(等价于直接写 'name' in i)
# Number of entries in structure_data that contain an 'agencyname' key,
# regardless of its value.  Membership is tested on the dict itself, which
# is equivalent to (and cheaper than) going through .keys().
agencyname_num = sum(1 for entry in structure_data if 'agencyname' in entry)
# Number of entries whose 'bidmoney' key is present with a value other than 0
# (zero values are not counted).  .get() with a default of 0 folds the
# "key missing" and "value is 0" cases into a single lookup, so neither is
# counted.
bidmoney_num = sum(
    1 for entry in structure_data if entry.get('bidmoney', 0) != 0
)
计算相同键数的字典数
len() 函数计算字典元素个数,即键的总数
# Count the dictionaries in structure_data that hold exactly two keys
# (len() of a dict is its number of keys) and report the total.
# NOTE(review): the snippet's indentation was lost; the print is taken to run
# once, after the whole list has been scanned — confirm.
num = sum(len(entry) == 2 for entry in structure_data)
print(num)
# 0不计数
num = [0,0,0,0,0,0,0,0,0,0]
n=9 # 2-9
for i in structure_data:
if