import pandas as pd
import json
# Default input workbook and output JSONL file used when run as a script.
path = r'/Users/mac/Desktop/test_le/m.xlsx'
output_file = 'm.jsonl'


def build_record(question, faq_cell):
    """Build the JSON-serializable record for one spreadsheet row.

    Args:
        question: Value of the row's 'question' cell.
        faq_cell: Value of the row's 'faq' cell; expected to be a JSON
            string encoding a list of objects that each carry a
            "questions" key.

    Returns:
        A two-element list of the form
        ``[{"Q": question}, {"questions": [{"q": ...}, ...]}]``.

    Raises:
        json.JSONDecodeError: If ``faq_cell`` is a non-blank string that
            is not valid JSON.
        TypeError: If ``faq_cell`` is neither missing nor a str/bytes value.
        KeyError: If a decoded FAQ item has no "questions" key.
    """
    # An empty cell arrives from pandas as NaN. json.dumps would emit it as
    # a bare NaN token, which is not valid JSON, so map it to null instead.
    if pd.isna(question):
        question = None

    # A missing or blank FAQ cell means "no related questions" rather than
    # a reason to abort the whole export.
    faq_is_blank = isinstance(faq_cell, str) and not faq_cell.strip()
    if faq_is_blank or pd.isna(faq_cell):
        faq_items = []
    else:
        faq_items = json.loads(faq_cell)

    # Keep only the question text of each FAQ item, under the key 'q'.
    trimmed_qa = [{"q": item["questions"]} for item in faq_items]

    # The record is deliberately a two-element sequence, not a merged dict:
    # each output line is a JSON array holding the 'Q' object followed by
    # the 'questions' object.
    return [{"Q": question}, {"questions": trimmed_qa}]


def convert(excel_path=path, jsonl_path=output_file):
    """Convert an Excel sheet into a JSONL file, one record per row.

    The sheet must have the columns 'question' and 'faq'.

    Args:
        excel_path: Path of the Excel workbook to read.
        jsonl_path: Path of the JSONL file to write (overwritten).
    """
    # Read the workbook first so a read failure does not truncate an
    # existing output file.
    data = pd.read_excel(excel_path)
    with open(jsonl_path, 'w', encoding='utf-8') as f:
        for _, row in data.iterrows():
            record = build_record(row['question'], row['faq'])
            # ensure_ascii=False keeps non-ASCII text readable in the file.
            f.write(json.dumps(record, ensure_ascii=False) + '\n')


if __name__ == "__main__":
    convert()
把Excel变成格式规范的json/jsonl文件
最新推荐文章于 2024-07-14 16:32:48 发布