1. pandas数据读取和预处理
# Read the dataset into a DataFrame, inspect it, and adjust column dtypes.
import pandas as pd

# header=None makes pandas treat the first row as data, so the column
# labels are supplied explicitly through `names`.
names = [
    "Sex",
    "Length",
    "Diameter",
    "Height",
    "Whole_weight",
    "Shucked_weight",
    "Viscera_weight",
    "Shell_weight",
    "Rings",
]
data = pd.read_csv(data_file, names=names, header=None)
print(data)  # original note: [4177 rows x 9 columns]
type(data)  # pandas.core.frame.DataFrame

# Missing-value checks.
data.isna().values.any()  # original note: False (is any value missing?)
data.isna().sum()  # number of missing values in each column
data.isna().sum().sum()  # number of missing values in the whole DataFrame

# Inspect dtypes, convert two columns, then inspect again.
data.dtypes
data["Rings"] = data["Rings"].astype("float64")  # int64 -> float64
data["Sex"] = data["Sex"].astype("category")  # object -> category
data["Sex"]
data.dtypes

# Summary statistics.
data.describe()  # all numeric columns
data["Height"].describe()  # the "Height" column only
data["Sex"].value_counts()  # frequency of each "Sex" category
torch变量size
import torch

# Build a tensor of shape (2, 3, 4) holding the integers 0..23.
X = torch.arange(2 * 3 * 4).reshape((2, 3, 4))
# len() of a tensor reports the size of its first axis (axis 0).
len(X)
# output: 2
len(X) 总是返回第 0 轴的长度。
What are the shapes of summation outputs along axis 0, 1, and 2?