1. 导入 TXT 数据(以下为示例文件 data_diy.txt 的内容,首行为表头)
长度 宽度 高 类型
15 5 2 1
20 7 3 2
30 10 5 3
16 4 2 1
22 8 3 2
32 12 6 3
14 4 3 1
18 6 4 2
31 12 5 3
import numpy as np
def file2matrix(fileName):
    """Parse a whitespace-delimited text table into a feature matrix and labels.

    The first line of the file is treated as a header and is used only to
    determine the number of columns.  Every following non-blank line is one
    record: its leading ``column_count - 1`` fields become an integer row of
    the feature matrix, and its last field becomes the integer label.

    Args:
        fileName: Path of the text file to read.

    Returns:
        A tuple ``(datas, labels)`` where ``datas`` is an integer NumPy array
        with one row per record and ``labels`` is a NumPy array holding the
        label of each record, in file order.

    Raises:
        IndexError: If the file contains no lines at all (no header).
        ValueError: If a field is not a valid integer literal.
    """
    # The context manager guarantees the handle is closed even on errors.
    with open(fileName) as f:
        datasLines = f.readlines()
    print(datasLines)

    sizeColumnNumber = len(datasLines[0].split())
    featureCount = sizeColumnNumber - 1

    # Skip blank lines (e.g. a trailing newline at the end of the file) so
    # they are neither counted as records nor parsed.
    records = [
        fields
        for fields in (line.split() for line in datasLines[1:])
        if fields
    ]

    datas = np.zeros((len(records), featureCount), int)
    labels = []
    for index, fields in enumerate(records):
        datas[index, :] = [int(value) for value in fields[:featureCount]]
        labels.append(int(fields[-1]))
    return datas, np.array(labels)
# Parse the sample data file, then show the feature matrix followed by the
# label vector, each on its own line(s).
fileName = "data_diy.txt"
datas, labels = file2matrix(fileName)
print(datas, labels, sep="\n")
2. 读取 TXT 文件的三种方式:
# read(): reads through to the end of the file and returns one string.
# The with-statement closes the file as soon as the block exits.
with open('email/spam/1.txt') as f:
    emailTxt = f.read()
print(emailTxt)
# --- Codeine 15mg -- 30 for $203.70 -- VISA Only!!! --
#
# -- Codeine (Methylmorphine) is a narcotic (opioid) pain reliever
# -- We have 15mg & 30mg pills -- 30/15mg for $203.70 - 60/15mg for $385.80 - 90/15mg for $562.50 -- VISA Only!!! ---
# readline(): reads a single line and returns it as a string.
# The with-statement closes the file as soon as the block exits.
with open('email/spam/1.txt') as f:
    b = f.readline()
print(b)
# --- Codeine 15mg -- 30 for $203.70 -- VISA Only!!! --
# readlines(): reads every line and returns a list with one element per line.
# The with-statement closes the file as soon as the block exits.
with open('email/spam/1.txt') as f:
    lines = f.readlines()
print(lines)
# ['--- Codeine 15mg -- 30 for $203.70 -- VISA Only!!! --\n', '\n', '-- Codeine (Methylmorphine) is a narcotic (opioid) pain reliever\n', '-- We have 15mg & 30mg pills -- 30/15mg for $203.70 - 60/15mg for $385.80 - 90/15mg for $562.50 -- VISA Only!!! ---']