数据处理笔记
import pandas as pd
# Read the data.
data = pd.read_csv(path, header=0) # header=0 uses the first row as the column names; for a file with no header row pass header=None (not -1)
# Rename the columns.
data.columns = ['column1', 'column2', 'column3']
# Select several columns at once (a list of names returns a DataFrame).
data_12 = data[['column1', 'column2']]
# Split the frame by column.
train = pd.read_csv(train_path, header=0) # train has five columns: 1, 2, 3, 4, 5
# The right-hand tuple is evaluated left to right: train_x is bound to the same
# object as train, then pop() removes column '5' from it in place.
train_x, train_y = train, train.pop('5') # train_x ends up with the first four columns, train_y is the last column
# Roughly equivalent to the following (note: pop() returns a Series, whereas
# train[['5']] returns a one-column DataFrame):
train = pd.read_csv(train_path, header=0)
train_x2 = train[['1', '2','3', '4']]
train_y2 = train[['5']]
# Difference: after pop() train only has four columns left, while the column
# selection above leaves train unchanged.
# Build a nested list of a given shape (e.g. an m x n matrix), every cell set to the same value
import copy
def new_list(shape, value=0):
    """Build a nested list with the given shape, filled with ``value``.

    Args:
        shape: Sequence of dimension sizes, outermost first; for example
            ``[3, 2]`` produces 3 rows of 2 elements each.
        value: Fill value for every cell. Defaults to 0.

    Returns:
        A nested list whose nesting depth equals ``len(shape)``. Every cell
        and every sub-list is an independent deep copy, so mutating one
        does not affect the others. An empty ``shape`` returns ``value``
        itself.
    """
    result = value
    # Build from the innermost dimension outwards.
    for size in reversed(shape):
        # deepcopy keeps rows independent (unlike ``[row] * size``, which
        # would repeat references to the same inner list).
        result = [copy.deepcopy(result) for _ in range(size)]
    return result
# Example: a 3 x 2 nested list filled with 1.0, i.e. [[1.0, 1.0], [1.0, 1.0], [1.0, 1.0]].
tmp_list = new_list([3,2],1.0)
1万+

被折叠的 条评论
为什么被折叠?



