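# 环境:Python 3
# 原始表:E:\testdata\test1.csv(至少包含 ID、More_characters 两列)
# 拆分后的表:E:\testdata\test2.csv(ID、More_characters_split 两列,不写表头)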
import pandas as pd
#from pandas.core.frame import DataFrame
"""
读取文件
"""
# Load the GBK-encoded source table, then keep only the two columns used by
# the splitting step below.
rawdata = pd.read_csv(
    'E:\\testdata\\test1.csv',
    encoding="GBK",
)
rawdata2 = rawdata.loc[:, ['ID', 'More_characters']]
# Inline sample frame kept for reference (note: it uses different column names):
# df5 = pd.DataFrame(data=[(0, 'a,b'), (2, 'a,b,c'), (3, 'a')], columns=['var2', 'var3'])
"""
分割字符串
"""
# Expand every comma-separated 'More_characters' value into one [ID, item]
# row per item, with surrounding whitespace stripped from each item.
id_text_pairs = rawdata2.values.tolist()
split_rows = []
for row_id, text in id_text_pairs:
    # pandas reads an empty CSV cell as NaN (a float), which has no .split();
    # treat it as an empty string so the ID still yields exactly one row.
    if pd.isna(text):
        text = ''
    split_rows.extend([row_id, item.strip()] for item in text.split(','))
data = pd.DataFrame(split_rows, columns=['ID', 'More_characters_split'])
# The split table is written without the index and without a header row.
data.to_csv('E:\\testdata\\test2.csv', index=False, header=False)
# ---- Merge ----
# 'frames' is only referenced by the disabled pd.concat(frames) variant.
frames = [rawdata, data]
# ID is the shared column: join the original table to the split rows on it.
result2 = rawdata.merge(data, on='ID')
result2.to_csv('E:\\testdata\\test3.csv', index=False, header=True)