# Code source: "Machine Learning in Action" (《机器学习实战》)
# encoding=utf-8
"""
Date:2019-07-29 10:54
User:LiYu
Email:liyu_5498@163.com
"""
from numpy import *
def file2matrix(filename):
"""读取并处理数据"""
with open(filename, 'r') as f:
linesList = f.readlines()
numberOfLines = len(linesList)
returnMat = zeros((numberOfLines, 3)) # 1000*3的全0矩阵
classLabelVector = []
index = 0
for line in linesList:
line = line.strip().split('\t')
# print(line[0:3]) # ['35018', '9.959588', '0.060020']
# print(line[-1]) # largeDoses
returnMat[index, :] = line[0:3]
classLabelVector.append(line[-1])
index += 1
# print(numberOfLines) # 1000