import csv
import json
import pandas as pd
# Default input: the CSV file that main() reads when no path is passed.
csv_filename = "tmdb_5000_movies.csv"
# Default output: the JSON Lines file that main() writes (one object per row).
json_filename = "tmdb_5000_movies.json"
def main(csv_path=None, json_path=None):
    """Convert a CSV file to JSON Lines, decoding JSON-array cells.

    The first row of the CSV is used as the header. Every following row is
    written to the output as one JSON object per line, keyed by column name.
    A cell whose text starts with ``[`` is parsed as JSON so that it is
    emitted as a real array instead of a quoted string; a cell that starts
    with ``[`` but is not valid JSON is kept as its original text.

    Args:
        csv_path: Path of the CSV file to read. Defaults to the module-level
            ``csv_filename``.
        json_path: Path of the JSON Lines file to write (overwritten if it
            exists). Defaults to the module-level ``json_filename``.

    Raises:
        OSError: If either file cannot be opened.
        UnicodeDecodeError: If the input is not valid UTF-8.
    """
    if csv_path is None:
        csv_path = csv_filename
    if json_path is None:
        json_path = json_filename

    # 'utf-8-sig' reads plain UTF-8 and also drops a leading BOM, so the first
    # column name stays clean. newline='' lets the csv module handle line
    # endings itself, which is required for quoted fields containing newlines.
    with open(csv_path, 'r', encoding='utf-8-sig', newline='') as csvfile, \
            open(json_path, 'w', encoding='UTF-8') as jsonfile:
        # DictReader consumes the header row itself; no separate header pass
        # and no manual skipping of the first row is needed.
        reader = csv.DictReader(csvfile)
        for row in reader:
            for key, value in row.items():
                # Only text cells can hold an encoded JSON array. Non-string
                # values (None for short rows, a list of surplus fields for
                # long rows) are passed through untouched.
                if isinstance(value, str) and value.startswith('['):
                    try:
                        row[key] = json.loads(value)
                    except json.JSONDecodeError:
                        # Looks like an array but is not valid JSON:
                        # keep the raw text rather than dropping the row.
                        pass
            # One JSON document per line; keep non-ASCII characters readable.
            json.dump(row, jsonfile, ensure_ascii=False)
            jsonfile.write('\n')
    print("succees!")
# Run the conversion only when executed as a script, not when imported.
if __name__ == "__main__":
    main()
# Parse result: