STEP 1 / pandas
import pandas as pd
# Location of the CSV file to load (placeholder value).
path = 'xxx'
# The file is read without a header row, so the three column names
# are supplied explicitly.
data = pd.read_csv(
    path,
    names=['label', 'title', 'text'],
    header=None,
)
data :
STEP 2 / sklearn.model_selection.train_test_split
from sklearn.model_selection import train_test_split
# Select every row and every column of data.
# NOTE(review): this keeps column 0 (the same column used for y below)
# inside x — confirm that is intended before using X_train as model input.
x = data.iloc[:, :]
# Select every row of the first column of data.
y = data.iloc[:, 0]
# Split x and y together, holding out 40% of the rows for testing;
# the fixed random_state makes the shuffle reproducible.
X_train, X_test, y_train, y_test = train_test_split(
    x,
    y,
    random_state=0,
    test_size=0.4,
)
x (left) & y (right):
X_train :