代码中用到的 gongcan.csv、test_2g.csv、train_2g.csv、test_new.csv、train_new.csv 已经上传到名为 hw3 的资源中。
import tensorflow as tf
import numpy as np
import pandas as pd
from sklearn import preprocessing
# Constants
# NOTE(review): the layer roles described below are inferred from the names
# only; confirm against the model-building code elsewhere in this file.
# Number of independent (input) variables. Presumably 6 base stations x 7
# per-station fields, matching the train_new.csv header -- TODO confirm.
X_Independent_Num = 42
# Layer 0 size is tied to the number of independent variables.
Layer0_Num = X_Independent_Num
# Sizes of layers 1-3 (presumably unit counts of successive network layers).
Layer1_Num = 20
Layer2_Num = 10
Layer3_Num = 20
def integrate_train_data(): # 综合生成最终版训练数据集
train_data_0 = np.array(pd.read_csv("train_2g.csv"))
train_data_1 = np.array(pd.read_csv("gongcan.csv"))
f_0 = open("train_new.csv", 'w')
f_0.writelines("TrajID,IMEI,IMSI,MRTime,RNCID_1,CellID_1,Longitude_1,Latitude_1,Dbm_1,AsuLevel_1,SignalLevel_1,"
"RNCID_2,CellID_2,Longitude_2,Latitude_2,Dbm_2,AsuLevel_2,SignalLevel_2,RNCID_3,CellID_3,"
"Longitude_3,Latitude_3,Dbm_3,AsuLevel_3,SignalLevel_3,RNCID_4,CellID_4,Longitude_4,Latitude_4,"
"Dbm_4,AsuLevel_4,SignalLevel_4,RNCID_5,CellID_5,Longitude_5,Latitude_5,Dbm_5,AsuLevel_5,"
"SignalLevel_5,RNCID_6,CellID_6,Longitude_6,Latitude_6,Dbm_6,AsuLevel_6,SignalLevel_6,Longitude,"
"Latitude,Altitude,Accuracy,Speed" + "\n")
for i in range(train_data_0.shape[0]):
for k in range(6):
f_0.writelines(str(train_data_0[i][k]) + ",")
for j in range(train_data_1.shape[0]):
if train_data_0[i][4] == train_data_1[j][0] and train_data_0[i][5] == train_data_1[j][1]:
f_0.writelines(str(train_data_1[j][2]) + "," + str(train_data_1[j][3]) + ",")
break
elif j == (train_data_1.shape[0] - 1):
f_0.writelines("31.29365558" + "," + "121.20186171" + ",")
# print(j)
# print(train_data_1.shape[0])
# os.system("pause")
for k in range(6, 11, 1):
f_0.writelines(str(train_data_0[i][k]) + ",")
for j in range(train_data_1.shape[0]):
if train_data_0[i][9] == train_data_1[j][0] and train_data_0[i][10] == train_data_1[j][1]:
f_0.writelines(str(train_data_1[j][2]) + "," + str(train_data_1[j][3]) + ",")
break
elif j == (train_data_1.shape[0] - 1):
f_0.writelines("31.29365558" + "," + "121.20186171" + ",")
for k in range(11, 16, 1):
f_0.writelines(str(train_data_0[i][k]) + ",")