# Select the entries of column 'col' that are null.
# A single .loc lookup with the boolean mask replaces the chained indexing and
# the redundant `== True` comparison on the mask.
df.loc[df['col'].isnull(), 'col']
# Drop the rows whose 'result' column is null.
data_result['result'].isnull().value_counts()  # inspect how many values are null
# Index labels of the rows about to be removed (inspection only),
# e.g. [37405, 37406, 104433, 104434, 104435, 120601, 120602].
data_result.index[data_result['result'].isnull()].tolist()
# dropna removes exactly the null rows, so neither a sentinel fill value nor a
# hard-coded list of index labels is needed.
data_result = data_result.dropna(subset=['result'])
data_result = data_result.reset_index(drop=True)  # renumber the rows 0..n-1
2.创建空DataFrame，添加数据
# Build topic_df with one row per (score, topic) pair found in data_result['result'].
# Rows are collected in a plain list and the DataFrame is built once at the end:
# DataFrame.append was removed in pandas 2.0 and copied the whole frame on every call.
# NOTE(review): iterating the column visits rows in positional order, which matches the
# original label lookup data_result['result'][i] only when the index is 0..n-1 - confirm
# that reset_index(drop=True) has been applied beforehand.
topic_rows = []
for i, pairs in enumerate(data_result['result']):
    print(i)  # progress indicator
    for pair in pairs:
        # Each element is indexed as pair[0] -> score, pair[1] -> topic.
        topic_rows.append({'score': pair[0], 'topic': pair[1]})
topic_df = pd.DataFrame(topic_rows, columns=["score", "topic"])
3.数据类型转换
# Replace the 'score' column with a float-typed copy of itself.
topic_df['score'] = topic_df['score'].astype("float64")
4.两个dataframe上下合并拼接
# Stack df2 below df1, keeping each frame's own index labels.
# DataFrame.append was removed in pandas 2.0; pd.concat is its replacement.
df = pd.concat([df1, df2])
# Same vertical concatenation, but with the result's index renumbered 0..n-1.
pd.concat([a, b], axis=0, ignore_index=True)
# Column C holds, for each row, the larger of the values in columns A and B.
df["C"] = df[["A", "B"]].max(axis="columns")
6.打印输出多个变量
# Print several variables in one formatted line (f-string instead of %-formatting).
print(f"变量1:{a1} 变量2:{a2}")
原文链接:https://blog.csdn.net/kerry_55/article/details/105101420