AI day03(2020 8/1)

Numpy

import numpy as np
data = np.array([[1,2,3],
[4,5,6],[
    7,8,9
]])
data
array([[1, 2, 3],
       [4, 5, 6],
       [7, 8, 9]])

numpy 数组(ndarray)中所有元素的数据类型(dtype)必须一致
numpy.genfromtxt() 可以从文本文件中读取数据并生成数组

print(data.shape)
(3, 3)
t = data%2 == 0
t
array([[False,  True, False],
       [ True, False,  True],
       [False,  True, False]])
data[t]
array([2, 4, 6, 8])
data[data==5]
array([5])
data[data%2==1]
array([1, 3, 5, 7, 9])
tt = np.array(['wo','s','ww','wos'])
tt
array(['wo', 's', 'ww', 'wos'], dtype='<U3')
data
array([[1, 2, 3],
       [4, 5, 6],
       [7, 8, 9]])
data.sum()
45
data.sum(axis=0)
array([12, 15, 18])
data.sum(axis=1)
array([ 6, 15, 24])

axis = 1:对每一行求和(沿列方向压缩),上例结果为 [6, 15, 24]
axis = 0:对每一列求和(沿行方向压缩),上例结果为 [12, 15, 18]

# 维度数(轴的个数)
data.ndim

2
# 元素总个数
data.size
9
# 初始化:创建指定形状的全 0 / 全 1 数组(默认为浮点型)
print(np.zeros((3,4)))
print('-'*20)
print(np.ones((3,4)))
[[0. 0. 0. 0.]
 [0. 0. 0. 0.]
 [0. 0. 0. 0.]]
--------------------
[[1. 1. 1. 1.]
 [1. 1. 1. 1.]
 [1. 1. 1. 1.]]
np.arange(5,10,1)
array([5, 6, 7, 8, 9])
np.random.random((2,4))
array([[0.91888061, 0.16794386, 0.77254003, 0.72115635],
       [0.80070458, 0.76273646, 0.74992497, 0.6513706 ]])
# 在 [x, y] 区间内等间隔地取 n 个值(包含两个端点)
np.linspace(0,np.pi,1000)
array([0.        , 0.00314474, 0.00628947, 0.00943421, 0.01257895,
       0.01572369, 0.01886842, 0.02201316, 0.0251579 , 0.02830264,
       0.03144737, 0.03459211, 0.03773685, 0.04088159, 0.04402632,
       0.04717106, 0.0503158 , 0.05346054, 0.05660527, 0.05975001,
       0.06289475, 0.06603949, 0.06918422, 0.07232896, 0.0754737 ,
       0.07861843, 0.08176317, 0.08490791, 0.08805265, 0.09119738,
       0.09434212, 0.09748686, 0.1006316 , 0.10377633, 0.10692107,
       0.11006581, 0.11321055, 0.11635528, 0.11950002, 0.12264476,
       0.1257895 , 0.12893423, 0.13207897, 0.13522371, 0.13836845,
       0.14151318, 0.14465792, 0.14780266, 0.15094739, 0.15409213,
       0.15723687, 0.16038161, 0.16352634, 0.16667108, 0.16981582,
       0.17296056, 0.17610529, 0.17925003, 0.18239477, 0.18553951,
       0.18868424, 0.19182898, 0.19497372, 0.19811846, 0.20126319,
       0.20440793, 0.20755267, 0.21069741, 0.21384214, 0.21698688,
       0.22013162, 0.22327635, 0.22642109, 0.22956583, 0.23271057,
       0.2358553 , 0.23900004, 0.24214478, 0.24528952, 0.24843425,
       0.25157899, 0.25472373, 0.25786847, 0.2610132 , 0.26415794,
       0.26730268, 0.27044742, 0.27359215, 0.27673689, 0.27988163,
       0.28302637, 0.2861711 , 0.28931584, 0.29246058, 0.29560531,
       0.29875005, 0.30189479, 0.30503953, 0.30818426, 0.311329  ,
       0.31447374, 0.31761848, 0.32076321, 0.32390795, 0.32705269,
       0.33019743, 0.33334216, 0.3364869 , 0.33963164, 0.34277638,
       0.34592111, 0.34906585, 0.35221059, 0.35535533, 0.35850006,
       0.3616448 , 0.36478954, 0.36793427, 0.37107901, 0.37422375,
       0.37736849, 0.38051322, 0.38365796, 0.3868027 , 0.38994744,
       0.39309217, 0.39623691, 0.39938165, 0.40252639, 0.40567112,
       0.40881586, 0.4119606 , 0.41510534, 0.41825007, 0.42139481,
       0.42453955, 0.42768429, 0.43082902, 0.43397376, 0.4371185 ,
       0.44026323, 0.44340797, 0.44655271, 0.44969745, 0.45284218,
       0.45598692, 0.45913166, 0.4622764 , 0.46542113, 0.46856587,
       0.47171061, 0.47485535, 0.47800008, 0.48114482, 0.48428956,
       0.4874343 , 0.49057903, 0.49372377, 0.49686851, 0.50001325,
       0.50315798, 0.50630272, 0.50944746, 0.51259219, 0.51573693,
       0.51888167, 0.52202641, 0.52517114, 0.52831588, 0.53146062,
       0.53460536, 0.53775009, 0.54089483, 0.54403957, 0.54718431,
       0.55032904, 0.55347378, 0.55661852, 0.55976326, 0.56290799,
       0.56605273, 0.56919747, 0.57234221, 0.57548694, 0.57863168,
       0.58177642, 0.58492115, 0.58806589, 0.59121063, 0.59435537,
       0.5975001 , 0.60064484, 0.60378958, 0.60693432, 0.61007905,
       0.61322379, 0.61636853, 0.61951327, 0.622658  , 0.62580274,
       0.62894748, 0.63209222, 0.63523695, 0.63838169, 0.64152643,
       0.64467117, 0.6478159 , 0.65096064, 0.65410538, 0.65725011,
       0.66039485, 0.66353959, 0.66668433, 0.66982906, 0.6729738 ,
       0.67611854, 0.67926328, 0.68240801, 0.68555275, 0.68869749,
       0.69184223, 0.69498696, 0.6981317 , 0.70127644, 0.70442118,
       0.70756591, 0.71071065, 0.71385539, 0.71700013, 0.72014486,
       0.7232896 , 0.72643434, 0.72957907, 0.73272381, 0.73586855,
       0.73901329, 0.74215802, 0.74530276, 0.7484475 , 0.75159224,
       0.75473697, 0.75788171, 0.76102645, 0.76417119, 0.76731592,
       0.77046066, 0.7736054 , 0.77675014, 0.77989487, 0.78303961,
       0.78618435, 0.78932909, 0.79247382, 0.79561856, 0.7987633 ,
       0.80190803, 0.80505277, 0.80819751, 0.81134225, 0.81448698,
       0.81763172, 0.82077646, 0.8239212 , 0.82706593, 0.83021067,
       0.83335541, 0.83650015, 0.83964488, 0.84278962, 0.84593436,
       0.8490791 , 0.85222383, 0.85536857, 0.85851331, 0.86165805,
       0.86480278, 0.86794752, 0.87109226, 0.87423699, 0.87738173,
       0.88052647, 0.88367121, 0.88681594, 0.88996068, 0.89310542,
       0.89625016, 0.89939489, 0.90253963, 0.90568437, 0.90882911,
       0.91197384, 0.91511858, 0.91826332, 0.92140806, 0.92455279,
       0.92769753, 0.93084227, 0.93398701, 0.93713174, 0.94027648,
       0.94342122, 0.94656595, 0.94971069, 0.95285543, 0.95600017,
       0.9591449 , 0.96228964, 0.96543438, 0.96857912, 0.97172385,
       0.97486859, 0.97801333, 0.98115807, 0.9843028 , 0.98744754,
       0.99059228, 0.99373702, 0.99688175, 1.00002649, 1.00317123,
       1.00631597, 1.0094607 , 1.01260544, 1.01575018, 1.01889491,
       1.02203965, 1.02518439, 1.02832913, 1.03147386, 1.0346186 ,
       1.03776334, 1.04090808, 1.04405281, 1.04719755, 1.05034229,
       1.05348703, 1.05663176, 1.0597765 , 1.06292124, 1.06606598,
       1.06921071, 1.07235545, 1.07550019, 1.07864493, 1.08178966,
       1.0849344 , 1.08807914, 1.09122387, 1.09436861, 1.09751335,
       1.10065809, 1.10380282, 1.10694756, 1.1100923 , 1.11323704,
       1.11638177, 1.11952651, 1.12267125, 1.12581599, 1.12896072,
       1.13210546, 1.1352502 , 1.13839494, 1.14153967, 1.14468441,
       1.14782915, 1.15097389, 1.15411862, 1.15726336, 1.1604081 ,
       1.16355283, 1.16669757, 1.16984231, 1.17298705, 1.17613178,
       1.17927652, 1.18242126, 1.185566  , 1.18871073, 1.19185547,
       1.19500021, 1.19814495, 1.20128968, 1.20443442, 1.20757916,
       1.2107239 , 1.21386863, 1.21701337, 1.22015811, 1.22330285,
       1.22644758, 1.22959232, 1.23273706, 1.23588179, 1.23902653,
       1.24217127, 1.24531601, 1.24846074, 1.25160548, 1.25475022,
       1.25789496, 1.26103969, 1.26418443, 1.26732917, 1.27047391,
       1.27361864, 1.27676338, 1.27990812, 1.28305286, 1.28619759,
       1.28934233, 1.29248707, 1.29563181, 1.29877654, 1.30192128,
       1.30506602, 1.30821075, 1.31135549, 1.31450023, 1.31764497,
       1.3207897 , 1.32393444, 1.32707918, 1.33022392, 1.33336865,
       1.33651339, 1.33965813, 1.34280287, 1.3459476 , 1.34909234,
       1.35223708, 1.35538182, 1.35852655, 1.36167129, 1.36481603,
       1.36796077, 1.3711055 , 1.37425024, 1.37739498, 1.38053971,
       1.38368445, 1.38682919, 1.38997393, 1.39311866, 1.3962634 ,
       1.39940814, 1.40255288, 1.40569761, 1.40884235, 1.41198709,
       1.41513183, 1.41827656, 1.4214213 , 1.42456604, 1.42771078,
       1.43085551, 1.43400025, 1.43714499, 1.44028973, 1.44343446,
       1.4465792 , 1.44972394, 1.45286867, 1.45601341, 1.45915815,
       1.46230289, 1.46544762, 1.46859236, 1.4717371 , 1.47488184,
       1.47802657, 1.48117131, 1.48431605, 1.48746079, 1.49060552,
       1.49375026, 1.496895  , 1.50003974, 1.50318447, 1.50632921,
       1.50947395, 1.51261869, 1.51576342, 1.51890816, 1.5220529 ,
       1.52519763, 1.52834237, 1.53148711, 1.53463185, 1.53777658,
       1.54092132, 1.54406606, 1.5472108 , 1.55035553, 1.55350027,
       1.55664501, 1.55978975, 1.56293448, 1.56607922, 1.56922396,
       1.5723687 , 1.57551343, 1.57865817, 1.58180291, 1.58494765,
       1.58809238, 1.59123712, 1.59438186, 1.59752659, 1.60067133,
       1.60381607, 1.60696081, 1.61010554, 1.61325028, 1.61639502,
       1.61953976, 1.62268449, 1.62582923, 1.62897397, 1.63211871,
       1.63526344, 1.63840818, 1.64155292, 1.64469766, 1.64784239,
       1.65098713, 1.65413187, 1.65727661, 1.66042134, 1.66356608,
       1.66671082, 1.66985555, 1.67300029, 1.67614503, 1.67928977,
       1.6824345 , 1.68557924, 1.68872398, 1.69186872, 1.69501345,
       1.69815819, 1.70130293, 1.70444767, 1.7075924 , 1.71073714,
       1.71388188, 1.71702662, 1.72017135, 1.72331609, 1.72646083,
       1.72960557, 1.7327503 , 1.73589504, 1.73903978, 1.74218451,
       1.74532925, 1.74847399, 1.75161873, 1.75476346, 1.7579082 ,
       1.76105294, 1.76419768, 1.76734241, 1.77048715, 1.77363189,
       1.77677663, 1.77992136, 1.7830661 , 1.78621084, 1.78935558,
       1.79250031, 1.79564505, 1.79878979, 1.80193453, 1.80507926,
       1.808224  , 1.81136874, 1.81451347, 1.81765821, 1.82080295,
       1.82394769, 1.82709242, 1.83023716, 1.8333819 , 1.83652664,
       1.83967137, 1.84281611, 1.84596085, 1.84910559, 1.85225032,
       1.85539506, 1.8585398 , 1.86168454, 1.86482927, 1.86797401,
       1.87111875, 1.87426349, 1.87740822, 1.88055296, 1.8836977 ,
       1.88684243, 1.88998717, 1.89313191, 1.89627665, 1.89942138,
       1.90256612, 1.90571086, 1.9088556 , 1.91200033, 1.91514507,
       1.91828981, 1.92143455, 1.92457928, 1.92772402, 1.93086876,
       1.9340135 , 1.93715823, 1.94030297, 1.94344771, 1.94659245,
       1.94973718, 1.95288192, 1.95602666, 1.95917139, 1.96231613,
       1.96546087, 1.96860561, 1.97175034, 1.97489508, 1.97803982,
       1.98118456, 1.98432929, 1.98747403, 1.99061877, 1.99376351,
       1.99690824, 2.00005298, 2.00319772, 2.00634246, 2.00948719,
       2.01263193, 2.01577667, 2.01892141, 2.02206614, 2.02521088,
       2.02835562, 2.03150035, 2.03464509, 2.03778983, 2.04093457,
       2.0440793 , 2.04722404, 2.05036878, 2.05351352, 2.05665825,
       2.05980299, 2.06294773, 2.06609247, 2.0692372 , 2.07238194,
       2.07552668, 2.07867142, 2.08181615, 2.08496089, 2.08810563,
       2.09125037, 2.0943951 , 2.09753984, 2.10068458, 2.10382931,
       2.10697405, 2.11011879, 2.11326353, 2.11640826, 2.119553  ,
       2.12269774, 2.12584248, 2.12898721, 2.13213195, 2.13527669,
       2.13842143, 2.14156616, 2.1447109 , 2.14785564, 2.15100038,
       2.15414511, 2.15728985, 2.16043459, 2.16357932, 2.16672406,
       2.1698688 , 2.17301354, 2.17615827, 2.17930301, 2.18244775,
       2.18559249, 2.18873722, 2.19188196, 2.1950267 , 2.19817144,
       2.20131617, 2.20446091, 2.20760565, 2.21075039, 2.21389512,
       2.21703986, 2.2201846 , 2.22332934, 2.22647407, 2.22961881,
       2.23276355, 2.23590828, 2.23905302, 2.24219776, 2.2453425 ,
       2.24848723, 2.25163197, 2.25477671, 2.25792145, 2.26106618,
       2.26421092, 2.26735566, 2.2705004 , 2.27364513, 2.27678987,
       2.27993461, 2.28307935, 2.28622408, 2.28936882, 2.29251356,
       2.2956583 , 2.29880303, 2.30194777, 2.30509251, 2.30823724,
       2.31138198, 2.31452672, 2.31767146, 2.32081619, 2.32396093,
       2.32710567, 2.33025041, 2.33339514, 2.33653988, 2.33968462,
       2.34282936, 2.34597409, 2.34911883, 2.35226357, 2.35540831,
       2.35855304, 2.36169778, 2.36484252, 2.36798726, 2.37113199,
       2.37427673, 2.37742147, 2.3805662 , 2.38371094, 2.38685568,
       2.39000042, 2.39314515, 2.39628989, 2.39943463, 2.40257937,
       2.4057241 , 2.40886884, 2.41201358, 2.41515832, 2.41830305,
       2.42144779, 2.42459253, 2.42773727, 2.430882  , 2.43402674,
       2.43717148, 2.44031622, 2.44346095, 2.44660569, 2.44975043,
       2.45289516, 2.4560399 , 2.45918464, 2.46232938, 2.46547411,
       2.46861885, 2.47176359, 2.47490833, 2.47805306, 2.4811978 ,
       2.48434254, 2.48748728, 2.49063201, 2.49377675, 2.49692149,
       2.50006623, 2.50321096, 2.5063557 , 2.50950044, 2.51264518,
       2.51578991, 2.51893465, 2.52207939, 2.52522412, 2.52836886,
       2.5315136 , 2.53465834, 2.53780307, 2.54094781, 2.54409255,
       2.54723729, 2.55038202, 2.55352676, 2.5566715 , 2.55981624,
       2.56296097, 2.56610571, 2.56925045, 2.57239519, 2.57553992,
       2.57868466, 2.5818294 , 2.58497414, 2.58811887, 2.59126361,
       2.59440835, 2.59755308, 2.60069782, 2.60384256, 2.6069873 ,
       2.61013203, 2.61327677, 2.61642151, 2.61956625, 2.62271098,
       2.62585572, 2.62900046, 2.6321452 , 2.63528993, 2.63843467,
       2.64157941, 2.64472415, 2.64786888, 2.65101362, 2.65415836,
       2.6573031 , 2.66044783, 2.66359257, 2.66673731, 2.66988204,
       2.67302678, 2.67617152, 2.67931626, 2.68246099, 2.68560573,
       2.68875047, 2.69189521, 2.69503994, 2.69818468, 2.70132942,
       2.70447416, 2.70761889, 2.71076363, 2.71390837, 2.71705311,
       2.72019784, 2.72334258, 2.72648732, 2.72963206, 2.73277679,
       2.73592153, 2.73906627, 2.742211  , 2.74535574, 2.74850048,
       2.75164522, 2.75478995, 2.75793469, 2.76107943, 2.76422417,
       2.7673689 , 2.77051364, 2.77365838, 2.77680312, 2.77994785,
       2.78309259, 2.78623733, 2.78938207, 2.7925268 , 2.79567154,
       2.79881628, 2.80196102, 2.80510575, 2.80825049, 2.81139523,
       2.81453996, 2.8176847 , 2.82082944, 2.82397418, 2.82711891,
       2.83026365, 2.83340839, 2.83655313, 2.83969786, 2.8428426 ,
       2.84598734, 2.84913208, 2.85227681, 2.85542155, 2.85856629,
       2.86171103, 2.86485576, 2.8680005 , 2.87114524, 2.87428998,
       2.87743471, 2.88057945, 2.88372419, 2.88686892, 2.89001366,
       2.8931584 , 2.89630314, 2.89944787, 2.90259261, 2.90573735,
       2.90888209, 2.91202682, 2.91517156, 2.9183163 , 2.92146104,
       2.92460577, 2.92775051, 2.93089525, 2.93403999, 2.93718472,
       2.94032946, 2.9434742 , 2.94661894, 2.94976367, 2.95290841,
       2.95605315, 2.95919788, 2.96234262, 2.96548736, 2.9686321 ,
       2.97177683, 2.97492157, 2.97806631, 2.98121105, 2.98435578,
       2.98750052, 2.99064526, 2.99379   , 2.99693473, 3.00007947,
       3.00322421, 3.00636895, 3.00951368, 3.01265842, 3.01580316,
       3.0189479 , 3.02209263, 3.02523737, 3.02838211, 3.03152684,
       3.03467158, 3.03781632, 3.04096106, 3.04410579, 3.04725053,
       3.05039527, 3.05354001, 3.05668474, 3.05982948, 3.06297422,
       3.06611896, 3.06926369, 3.07240843, 3.07555317, 3.07869791,
       3.08184264, 3.08498738, 3.08813212, 3.09127686, 3.09442159,
       3.09756633, 3.10071107, 3.1038558 , 3.10700054, 3.11014528,
       3.11329002, 3.11643475, 3.11957949, 3.12272423, 3.12586897,
       3.1290137 , 3.13215844, 3.13530318, 3.13844792, 3.14159265])
# 加减乘除(+ - * /)都是逐元素运算
    # 1. 数组与数组 --> 对应位置的元素相运算
    # 2. 数组与标量 --> 标量与每个元素分别运算
# np.dot(a,b) --> 矩阵乘法运算(对二维数组等价于 a @ b)
a = np.array([[1,2],[3,4]])
b = np.array([[5,6],[7,8]])
print(a)
print(b)
np.dot(a,b)
[[1 2]
 [3 4]]
[[5 6]
 [7 8]]





array([[19, 22],
       [43, 50]])
# 指数运算:逐元素计算 e 的 x 次方(e**x)
np.exp(a)
array([[ 2.71828183,  7.3890561 ],
       [20.08553692, 54.59815003]])
# floor 向下取整(结果仍为浮点数)
np.floor(10*np.random.rand(10))
array([3., 4., 9., 6., 1., 2., 5., 1., 6., 9.])
# ravel 将矩阵转为向量(一维)
# data.T 矩阵转置
# 矩阵拼接与分割
a = np.floor(10*np.random.random((2,2)))
b = np.floor(10*np.random.random((2,2)))
print(a)
print(b)
print('*'*20)
# 水平拼接(沿列方向,axis=1):行数不变,列数相加
# 对应的分割函数为 np.hsplit
print(np.hstack((a,b)))
# 垂直拼接(沿行方向,axis=0):列数不变,行数相加
# 对应的分割函数为 np.vsplit
print(np.vstack((a,b)))
[[6. 0.]
 [0. 8.]]
[[4. 7.]
 [6. 6.]]
********************
[[6. 0. 4. 7.]
 [0. 8. 6. 6.]]
[[6. 0.]
 [0. 8.]
 [4. 7.]
 [6. 6.]]

Pandas

# 文件读取
# pd.read_csv()、pd.read_excel() 等 pd.read_* 系列函数
import pandas as pd
# 两种核心数据结构:Series(一维)和 DataFrame(二维)
# DataFrame.head():查看前 n 行(默认 5 行)
# DataFrame.tail():查看后 n 行(默认 5 行)
data = pd.DataFrame([[1,2,3,4,5,6,7,8,9,10],[2,3,4,5,6,7,8,9,10,11]])
data
   0  1  2  3  4  5  6  7   8   9
0  1  2  3  4  5  6  7  8   9  10
1  2  3  4  5  6  7  8  9  10  11
data.head()
   0  1  2  3  4  5  6  7   8   9
0  1  2  3  4  5  6  7  8   9  10
1  2  3  4  5  6  7  8  9  10  11
# 按列取
data[0]
0    1
1    2
Name: 0, dtype: int64
# 按行取
data.loc[0]
0     1
1     2
2     3
3     4
4     5
5     6
6     7
7     8
8     9
9    10
Name: 0, dtype: int64
# [列][行]:先按列标签取出一列,再按行标签取值(此处为第 2 列、第 1 行)
data[2][1]
4
# 同时取多列
data[[1,2]]
   1  2
0  2  3
1  3  4
# 按指定列(此处为列 1)的值对各行排序;inplace:是否在原数据上直接修改;ascending:是否升序
data.sort_values(1,inplace=False,ascending=False)
   0  1  2  3  4  5  6  7   8   9
1  2  3  4  5  6  7  8  9  10  11
0  1  2  3  4  5  6  7  8   9  10
data_ = pd.read_csv('data/train.csv')
data_
PassengerIdSurvivedPclassNameSexAgeSibSpParchTicketFareCabinEmbarked
0103Braund, Mr. Owen Harrismale22.010A/5 211717.2500NaNS
1211Cumings, Mrs. John Bradley (Florence Briggs Th...female38.010PC 1759971.2833C85C
2313Heikkinen, Miss. Lainafemale26.000STON/O2. 31012827.9250NaNS
3411Futrelle, Mrs. Jacques Heath (Lily May Peel)female35.01011380353.1000C123S
4503Allen, Mr. William Henrymale35.0003734508.0500NaNS
5603Moran, Mr. JamesmaleNaN003308778.4583NaNQ
6701McCarthy, Mr. Timothy Jmale54.0001746351.8625E46S
7803Palsson, Master. Gosta Leonardmale2.03134990921.0750NaNS
8913Johnson, Mrs. Oscar W (Elisabeth Vilhelmina Berg)female27.00234774211.1333NaNS
91012Nasser, Mrs. Nicholas (Adele Achem)female14.01023773630.0708NaNC
101113Sandstrom, Miss. Marguerite Rutfemale4.011PP 954916.7000G6S
111211Bonnell, Miss. Elizabethfemale58.00011378326.5500C103S
121303Saundercock, Mr. William Henrymale20.000A/5. 21518.0500NaNS
131403Andersson, Mr. Anders Johanmale39.01534708231.2750NaNS
141503Vestrom, Miss. Hulda Amanda Adolfinafemale14.0003504067.8542NaNS
151612Hewlett, Mrs. (Mary D Kingcome)female55.00024870616.0000NaNS
161703Rice, Master. Eugenemale2.04138265229.1250NaNQ
171812Williams, Mr. Charles EugenemaleNaN0024437313.0000NaNS
181903Vander Planke, Mrs. Julius (Emelia Maria Vande...female31.01034576318.0000NaNS
192013Masselmani, Mrs. FatimafemaleNaN0026497.2250NaNC
202102Fynney, Mr. Joseph Jmale35.00023986526.0000NaNS
212212Beesley, Mr. Lawrencemale34.00024869813.0000D56S
222313McGowan, Miss. Anna "Annie"female15.0003309238.0292NaNQ
232411Sloper, Mr. William Thompsonmale28.00011378835.5000A6S
242503Palsson, Miss. Torborg Danirafemale8.03134990921.0750NaNS
252613Asplund, Mrs. Carl Oscar (Selma Augusta Emilia...female38.01534707731.3875NaNS
262703Emir, Mr. Farred ChehabmaleNaN0026317.2250NaNC
272801Fortune, Mr. Charles Alexandermale19.03219950263.0000C23 C25 C27S
282913O'Dwyer, Miss. Ellen "Nellie"femaleNaN003309597.8792NaNQ
293003Todoroff, Mr. LaliomaleNaN003492167.8958NaNS
.......................................
86186202Giles, Mr. Frederick Edwardmale21.0102813411.5000NaNS
86286311Swift, Mrs. Frederick Joel (Margaret Welles Ba...female48.0001746625.9292D17S
86386403Sage, Miss. Dorothy Edith "Dolly"femaleNaN82CA. 234369.5500NaNS
86486502Gill, Mr. John Williammale24.00023386613.0000NaNS
86586612Bystrom, Mrs. (Karolina)female42.00023685213.0000NaNS
86686712Duran y More, Miss. Asuncionfemale27.010SC/PARIS 214913.8583NaNC
86786801Roebling, Mr. Washington Augustus IImale31.000PC 1759050.4958A24S
86886903van Melkebeke, Mr. PhilemonmaleNaN003457779.5000NaNS
86987013Johnson, Master. Harold Theodormale4.01134774211.1333NaNS
87087103Balkic, Mr. Cerinmale26.0003492487.8958NaNS
87187211Beckwith, Mrs. Richard Leonard (Sallie Monypeny)female47.0111175152.5542D35S
87287301Carlsson, Mr. Frans Olofmale33.0006955.0000B51 B53 B55S
87387403Vander Cruyssen, Mr. Victormale47.0003457659.0000NaNS
87487512Abelson, Mrs. Samuel (Hannah Wizosky)female28.010P/PP 338124.0000NaNC
87587613Najib, Miss. Adele Kiamie "Jane"female15.00026677.2250NaNC
87687703Gustafsson, Mr. Alfred Ossianmale20.00075349.8458NaNS
87787803Petroff, Mr. Nedeliomale19.0003492127.8958NaNS
87887903Laleff, Mr. KristomaleNaN003492177.8958NaNS
87988011Potter, Mrs. Thomas Jr (Lily Alexenia Wilson)female56.0011176783.1583C50C
88088112Shelley, Mrs. William (Imanita Parrish Hall)female25.00123043326.0000NaNS
88188203Markun, Mr. Johannmale33.0003492577.8958NaNS
88288303Dahlberg, Miss. Gerda Ulrikafemale22.000755210.5167NaNS
88388402Banfield, Mr. Frederick Jamesmale28.000C.A./SOTON 3406810.5000NaNS
88488503Sutehall, Mr. Henry Jrmale25.000SOTON/OQ 3920767.0500NaNS
88588603Rice, Mrs. William (Margaret Norton)female39.00538265229.1250NaNQ
88688702Montvila, Rev. Juozasmale27.00021153613.0000NaNS
88788811Graham, Miss. Margaret Edithfemale19.00011205330.0000B42S
88888903Johnston, Miss. Catherine Helen "Carrie"femaleNaN12W./C. 660723.4500NaNS
88989011Behr, Mr. Karl Howellmale26.00011136930.0000C148C
89089103Dooley, Mr. Patrickmale32.0003703767.7500NaNQ

891 rows × 12 columns

data_.head()
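|   | PassengerId | Survived | Pclass | Name | Sex | Age | SibSp | Parch | Ticket | Fare | Cabin | Embarked |
|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | 1 | 0 | 3 | Braund, Mr. Owen Harris | male | 22.0 | 1 | 0 | A/5 21171 | 7.2500 | NaN | S |
| 1 | 2 | 1 | 1 | Cumings, Mrs. John Bradley (Florence Briggs Th... | female | 38.0 | 1 | 0 | PC 17599 | 71.2833 | C85 | C |
| 2 | 3 | 1 | 3 | Heikkinen, Miss. Laina | female | 26.0 | 0 | 0 | STON/O2. 3101282 | 7.9250 | NaN | S |
| 3 | 4 | 1 | 1 | Futrelle, Mrs. Jacques Heath (Lily May Peel) | female | 35.0 | 1 | 0 | 113803 | 53.1000 | C123 | S |
| 4 | 5 | 0 | 3 | Allen, Mr. William Henry | male | 35.0 | 0 | 0 | 373450 | 8.0500 | NaN | S |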
age = data_['Age']
age.head()
0    22.0
1    38.0
2    26.0
3    35.0
4    35.0
Name: Age, dtype: float64
age_is_null = age.isnull()
age_is_null
0      False
1      False
2      False
3      False
4      False
5       True
6      False
7      False
8      False
9      False
10     False
11     False
12     False
13     False
14     False
15     False
16     False
17      True
18     False
19      True
20     False
21     False
22     False
23     False
24     False
25     False
26      True
27     False
28      True
29      True
       ...  
861    False
862    False
863     True
864    False
865    False
866    False
867    False
868     True
869    False
870    False
871    False
872    False
873    False
874    False
875    False
876    False
877    False
878     True
879    False
880    False
881    False
882    False
883    False
884    False
885    False
886    False
887    False
888     True
889    False
890    False
Name: Age, Length: 891, dtype: bool
age[age.notnull()]
0      22.0
1      38.0
2      26.0
3      35.0
4      35.0
6      54.0
7       2.0
8      27.0
9      14.0
10      4.0
11     58.0
12     20.0
13     39.0
14     14.0
15     55.0
16      2.0
18     31.0
20     35.0
21     34.0
22     15.0
23     28.0
24      8.0
25     38.0
27     19.0
30     40.0
33     66.0
34     28.0
35     42.0
37     21.0
38     18.0
       ... 
856    45.0
857    51.0
858    24.0
860    41.0
861    21.0
862    48.0
864    24.0
865    42.0
866    27.0
867    31.0
869     4.0
870    26.0
871    47.0
872    33.0
873    47.0
874    28.0
875    15.0
876    20.0
877    19.0
879    56.0
880    25.0
881    33.0
882    22.0
883    28.0
884    25.0
885    39.0
886    27.0
887    19.0
889    26.0
890    32.0
Name: Age, Length: 714, dtype: float64

预处理

data_.head(10)
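|   | PassengerId | Survived | Pclass | Name | Sex | Age | SibSp | Parch | Ticket | Fare | Cabin | Embarked |
|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | 1 | 0 | 3 | Braund, Mr. Owen Harris | male | 22.0 | 1 | 0 | A/5 21171 | 7.2500 | NaN | S |
| 1 | 2 | 1 | 1 | Cumings, Mrs. John Bradley (Florence Briggs Th... | female | 38.0 | 1 | 0 | PC 17599 | 71.2833 | C85 | C |
| 2 | 3 | 1 | 3 | Heikkinen, Miss. Laina | female | 26.0 | 0 | 0 | STON/O2. 3101282 | 7.9250 | NaN | S |
| 3 | 4 | 1 | 1 | Futrelle, Mrs. Jacques Heath (Lily May Peel) | female | 35.0 | 1 | 0 | 113803 | 53.1000 | C123 | S |
| 4 | 5 | 0 | 3 | Allen, Mr. William Henry | male | 35.0 | 0 | 0 | 373450 | 8.0500 | NaN | S |
| 5 | 6 | 0 | 3 | Moran, Mr. James | male | NaN | 0 | 0 | 330877 | 8.4583 | NaN | Q |
| 6 | 7 | 0 | 1 | McCarthy, Mr. Timothy J | male | 54.0 | 0 | 0 | 17463 | 51.8625 | E46 | S |
| 7 | 8 | 0 | 3 | Palsson, Master. Gosta Leonard | male | 2.0 | 3 | 1 | 349909 | 21.0750 | NaN | S |
| 8 | 9 | 1 | 3 | Johnson, Mrs. Oscar W (Elisabeth Vilhelmina Berg) | female | 27.0 | 0 | 2 | 347742 | 11.1333 | NaN | S |
| 9 | 10 | 1 | 2 | Nasser, Mrs. Nicholas (Adele Achem) | female | 14.0 | 1 | 0 | 237736 | 30.0708 | NaN | C |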
# 透视表
data_1 = data_.pivot_table(index='Pclass',values='Survived',aggfunc=np.mean)
data_1
        Survived
Pclass
1       0.629630
2       0.472826
3       0.242363
# apply()自定义函数

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值