Numpy
import numpy as np
# 3x3 integer matrix holding 1..9 in row-major order.
data = np.arange(1, 10).reshape(3, 3)
data
array([[1, 2, 3],
[4, 5, 6],
[7, 8, 9]])
NumPy 数组(ndarray)中所有元素的数据类型(dtype)必须一致;若传入混合类型,NumPy 会自动将其转换为同一种类型。
numpy.genfromtxt() 可以从文本文件(如 CSV)读取数据并生成数组,例如 np.genfromtxt('data.csv', delimiter=',')。
print(data.shape)
(3, 3)
t = data%2 == 0
t
array([[False, True, False],
[ True, False, True],
[False, True, False]])
data[t]
array([2, 4, 6, 8])
data[data==5]
array([5])
data[data%2==1]
array([1, 3, 5, 7, 9])
tt = np.array(['wo','s','ww','wos'])
tt
array(['wo', 's', 'ww', 'wos'], dtype='<U3')
data
array([[1, 2, 3],
[4, 5, 6],
[7, 8, 9]])
data.sum()
45
data.sum(axis=0)
array([12, 15, 18])
data.sum(axis=1)
array([ 6, 15, 24])
axis = 1:按行求和,每一行得到一个结果(上例为 [6, 15, 24])
axis = 0:按列求和,每一列得到一个结果(上例为 [12, 15, 18])
data.ndim
2
data.size
9
# Show a 3x4 array of zeros, a 20-dash rule, then a 3x4 array of ones,
# each on its own line(s).
print(np.zeros((3, 4)), '-' * 20, np.ones((3, 4)), sep='\n')
[[0. 0. 0. 0.]
[0. 0. 0. 0.]
[0. 0. 0. 0.]]
--------------------
[[1. 1. 1. 1.]
[1. 1. 1. 1.]
[1. 1. 1. 1.]]
np.arange(5,10,1)
array([5, 6, 7, 8, 9])
np.random.random((2,4))
array([[0.91888061, 0.16794386, 0.77254003, 0.72115635],
[0.80070458, 0.76273646, 0.74992497, 0.6513706 ]])
np.linspace(0,np.pi,1000)
array([0. , 0.00314474, 0.00628947, 0.00943421, 0.01257895,
0.01572369, 0.01886842, 0.02201316, 0.0251579 , 0.02830264,
0.03144737, 0.03459211, 0.03773685, 0.04088159, 0.04402632,
0.04717106, 0.0503158 , 0.05346054, 0.05660527, 0.05975001,
0.06289475, 0.06603949, 0.06918422, 0.07232896, 0.0754737 ,
0.07861843, 0.08176317, 0.08490791, 0.08805265, 0.09119738,
0.09434212, 0.09748686, 0.1006316 , 0.10377633, 0.10692107,
0.11006581, 0.11321055, 0.11635528, 0.11950002, 0.12264476,
0.1257895 , 0.12893423, 0.13207897, 0.13522371, 0.13836845,
0.14151318, 0.14465792, 0.14780266, 0.15094739, 0.15409213,
0.15723687, 0.16038161, 0.16352634, 0.16667108, 0.16981582,
0.17296056, 0.17610529, 0.17925003, 0.18239477, 0.18553951,
0.18868424, 0.19182898, 0.19497372, 0.19811846, 0.20126319,
0.20440793, 0.20755267, 0.21069741, 0.21384214, 0.21698688,
0.22013162, 0.22327635, 0.22642109, 0.22956583, 0.23271057,
0.2358553 , 0.23900004, 0.24214478, 0.24528952, 0.24843425,
0.25157899, 0.25472373, 0.25786847, 0.2610132 , 0.26415794,
0.26730268, 0.27044742, 0.27359215, 0.27673689, 0.27988163,
0.28302637, 0.2861711 , 0.28931584, 0.29246058, 0.29560531,
0.29875005, 0.30189479, 0.30503953, 0.30818426, 0.311329 ,
0.31447374, 0.31761848, 0.32076321, 0.32390795, 0.32705269,
0.33019743, 0.33334216, 0.3364869 , 0.33963164, 0.34277638,
0.34592111, 0.34906585, 0.35221059, 0.35535533, 0.35850006,
0.3616448 , 0.36478954, 0.36793427, 0.37107901, 0.37422375,
0.37736849, 0.38051322, 0.38365796, 0.3868027 , 0.38994744,
0.39309217, 0.39623691, 0.39938165, 0.40252639, 0.40567112,
0.40881586, 0.4119606 , 0.41510534, 0.41825007, 0.42139481,
0.42453955, 0.42768429, 0.43082902, 0.43397376, 0.4371185 ,
0.44026323, 0.44340797, 0.44655271, 0.44969745, 0.45284218,
0.45598692, 0.45913166, 0.4622764 , 0.46542113, 0.46856587,
0.47171061, 0.47485535, 0.47800008, 0.48114482, 0.48428956,
0.4874343 , 0.49057903, 0.49372377, 0.49686851, 0.50001325,
0.50315798, 0.50630272, 0.50944746, 0.51259219, 0.51573693,
0.51888167, 0.52202641, 0.52517114, 0.52831588, 0.53146062,
0.53460536, 0.53775009, 0.54089483, 0.54403957, 0.54718431,
0.55032904, 0.55347378, 0.55661852, 0.55976326, 0.56290799,
0.56605273, 0.56919747, 0.57234221, 0.57548694, 0.57863168,
0.58177642, 0.58492115, 0.58806589, 0.59121063, 0.59435537,
0.5975001 , 0.60064484, 0.60378958, 0.60693432, 0.61007905,
0.61322379, 0.61636853, 0.61951327, 0.622658 , 0.62580274,
0.62894748, 0.63209222, 0.63523695, 0.63838169, 0.64152643,
0.64467117, 0.6478159 , 0.65096064, 0.65410538, 0.65725011,
0.66039485, 0.66353959, 0.66668433, 0.66982906, 0.6729738 ,
0.67611854, 0.67926328, 0.68240801, 0.68555275, 0.68869749,
0.69184223, 0.69498696, 0.6981317 , 0.70127644, 0.70442118,
0.70756591, 0.71071065, 0.71385539, 0.71700013, 0.72014486,
0.7232896 , 0.72643434, 0.72957907, 0.73272381, 0.73586855,
0.73901329, 0.74215802, 0.74530276, 0.7484475 , 0.75159224,
0.75473697, 0.75788171, 0.76102645, 0.76417119, 0.76731592,
0.77046066, 0.7736054 , 0.77675014, 0.77989487, 0.78303961,
0.78618435, 0.78932909, 0.79247382, 0.79561856, 0.7987633 ,
0.80190803, 0.80505277, 0.80819751, 0.81134225, 0.81448698,
0.81763172, 0.82077646, 0.8239212 , 0.82706593, 0.83021067,
0.83335541, 0.83650015, 0.83964488, 0.84278962, 0.84593436,
0.8490791 , 0.85222383, 0.85536857, 0.85851331, 0.86165805,
0.86480278, 0.86794752, 0.87109226, 0.87423699, 0.87738173,
0.88052647, 0.88367121, 0.88681594, 0.88996068, 0.89310542,
0.89625016, 0.89939489, 0.90253963, 0.90568437, 0.90882911,
0.91197384, 0.91511858, 0.91826332, 0.92140806, 0.92455279,
0.92769753, 0.93084227, 0.93398701, 0.93713174, 0.94027648,
0.94342122, 0.94656595, 0.94971069, 0.95285543, 0.95600017,
0.9591449 , 0.96228964, 0.96543438, 0.96857912, 0.97172385,
0.97486859, 0.97801333, 0.98115807, 0.9843028 , 0.98744754,
0.99059228, 0.99373702, 0.99688175, 1.00002649, 1.00317123,
1.00631597, 1.0094607 , 1.01260544, 1.01575018, 1.01889491,
1.02203965, 1.02518439, 1.02832913, 1.03147386, 1.0346186 ,
1.03776334, 1.04090808, 1.04405281, 1.04719755, 1.05034229,
1.05348703, 1.05663176, 1.0597765 , 1.06292124, 1.06606598,
1.06921071, 1.07235545, 1.07550019, 1.07864493, 1.08178966,
1.0849344 , 1.08807914, 1.09122387, 1.09436861, 1.09751335,
1.10065809, 1.10380282, 1.10694756, 1.1100923 , 1.11323704,
1.11638177, 1.11952651, 1.12267125, 1.12581599, 1.12896072,
1.13210546, 1.1352502 , 1.13839494, 1.14153967, 1.14468441,
1.14782915, 1.15097389, 1.15411862, 1.15726336, 1.1604081 ,
1.16355283, 1.16669757, 1.16984231, 1.17298705, 1.17613178,
1.17927652, 1.18242126, 1.185566 , 1.18871073, 1.19185547,
1.19500021, 1.19814495, 1.20128968, 1.20443442, 1.20757916,
1.2107239 , 1.21386863, 1.21701337, 1.22015811, 1.22330285,
1.22644758, 1.22959232, 1.23273706, 1.23588179, 1.23902653,
1.24217127, 1.24531601, 1.24846074, 1.25160548, 1.25475022,
1.25789496, 1.26103969, 1.26418443, 1.26732917, 1.27047391,
1.27361864, 1.27676338, 1.27990812, 1.28305286, 1.28619759,
1.28934233, 1.29248707, 1.29563181, 1.29877654, 1.30192128,
1.30506602, 1.30821075, 1.31135549, 1.31450023, 1.31764497,
1.3207897 , 1.32393444, 1.32707918, 1.33022392, 1.33336865,
1.33651339, 1.33965813, 1.34280287, 1.3459476 , 1.34909234,
1.35223708, 1.35538182, 1.35852655, 1.36167129, 1.36481603,
1.36796077, 1.3711055 , 1.37425024, 1.37739498, 1.38053971,
1.38368445, 1.38682919, 1.38997393, 1.39311866, 1.3962634 ,
1.39940814, 1.40255288, 1.40569761, 1.40884235, 1.41198709,
1.41513183, 1.41827656, 1.4214213 , 1.42456604, 1.42771078,
1.43085551, 1.43400025, 1.43714499, 1.44028973, 1.44343446,
1.4465792 , 1.44972394, 1.45286867, 1.45601341, 1.45915815,
1.46230289, 1.46544762, 1.46859236, 1.4717371 , 1.47488184,
1.47802657, 1.48117131, 1.48431605, 1.48746079, 1.49060552,
1.49375026, 1.496895 , 1.50003974, 1.50318447, 1.50632921,
1.50947395, 1.51261869, 1.51576342, 1.51890816, 1.5220529 ,
1.52519763, 1.52834237, 1.53148711, 1.53463185, 1.53777658,
1.54092132, 1.54406606, 1.5472108 , 1.55035553, 1.55350027,
1.55664501, 1.55978975, 1.56293448, 1.56607922, 1.56922396,
1.5723687 , 1.57551343, 1.57865817, 1.58180291, 1.58494765,
1.58809238, 1.59123712, 1.59438186, 1.59752659, 1.60067133,
1.60381607, 1.60696081, 1.61010554, 1.61325028, 1.61639502,
1.61953976, 1.62268449, 1.62582923, 1.62897397, 1.63211871,
1.63526344, 1.63840818, 1.64155292, 1.64469766, 1.64784239,
1.65098713, 1.65413187, 1.65727661, 1.66042134, 1.66356608,
1.66671082, 1.66985555, 1.67300029, 1.67614503, 1.67928977,
1.6824345 , 1.68557924, 1.68872398, 1.69186872, 1.69501345,
1.69815819, 1.70130293, 1.70444767, 1.7075924 , 1.71073714,
1.71388188, 1.71702662, 1.72017135, 1.72331609, 1.72646083,
1.72960557, 1.7327503 , 1.73589504, 1.73903978, 1.74218451,
1.74532925, 1.74847399, 1.75161873, 1.75476346, 1.7579082 ,
1.76105294, 1.76419768, 1.76734241, 1.77048715, 1.77363189,
1.77677663, 1.77992136, 1.7830661 , 1.78621084, 1.78935558,
1.79250031, 1.79564505, 1.79878979, 1.80193453, 1.80507926,
1.808224 , 1.81136874, 1.81451347, 1.81765821, 1.82080295,
1.82394769, 1.82709242, 1.83023716, 1.8333819 , 1.83652664,
1.83967137, 1.84281611, 1.84596085, 1.84910559, 1.85225032,
1.85539506, 1.8585398 , 1.86168454, 1.86482927, 1.86797401,
1.87111875, 1.87426349, 1.87740822, 1.88055296, 1.8836977 ,
1.88684243, 1.88998717, 1.89313191, 1.89627665, 1.89942138,
1.90256612, 1.90571086, 1.9088556 , 1.91200033, 1.91514507,
1.91828981, 1.92143455, 1.92457928, 1.92772402, 1.93086876,
1.9340135 , 1.93715823, 1.94030297, 1.94344771, 1.94659245,
1.94973718, 1.95288192, 1.95602666, 1.95917139, 1.96231613,
1.96546087, 1.96860561, 1.97175034, 1.97489508, 1.97803982,
1.98118456, 1.98432929, 1.98747403, 1.99061877, 1.99376351,
1.99690824, 2.00005298, 2.00319772, 2.00634246, 2.00948719,
2.01263193, 2.01577667, 2.01892141, 2.02206614, 2.02521088,
2.02835562, 2.03150035, 2.03464509, 2.03778983, 2.04093457,
2.0440793 , 2.04722404, 2.05036878, 2.05351352, 2.05665825,
2.05980299, 2.06294773, 2.06609247, 2.0692372 , 2.07238194,
2.07552668, 2.07867142, 2.08181615, 2.08496089, 2.08810563,
2.09125037, 2.0943951 , 2.09753984, 2.10068458, 2.10382931,
2.10697405, 2.11011879, 2.11326353, 2.11640826, 2.119553 ,
2.12269774, 2.12584248, 2.12898721, 2.13213195, 2.13527669,
2.13842143, 2.14156616, 2.1447109 , 2.14785564, 2.15100038,
2.15414511, 2.15728985, 2.16043459, 2.16357932, 2.16672406,
2.1698688 , 2.17301354, 2.17615827, 2.17930301, 2.18244775,
2.18559249, 2.18873722, 2.19188196, 2.1950267 , 2.19817144,
2.20131617, 2.20446091, 2.20760565, 2.21075039, 2.21389512,
2.21703986, 2.2201846 , 2.22332934, 2.22647407, 2.22961881,
2.23276355, 2.23590828, 2.23905302, 2.24219776, 2.2453425 ,
2.24848723, 2.25163197, 2.25477671, 2.25792145, 2.26106618,
2.26421092, 2.26735566, 2.2705004 , 2.27364513, 2.27678987,
2.27993461, 2.28307935, 2.28622408, 2.28936882, 2.29251356,
2.2956583 , 2.29880303, 2.30194777, 2.30509251, 2.30823724,
2.31138198, 2.31452672, 2.31767146, 2.32081619, 2.32396093,
2.32710567, 2.33025041, 2.33339514, 2.33653988, 2.33968462,
2.34282936, 2.34597409, 2.34911883, 2.35226357, 2.35540831,
2.35855304, 2.36169778, 2.36484252, 2.36798726, 2.37113199,
2.37427673, 2.37742147, 2.3805662 , 2.38371094, 2.38685568,
2.39000042, 2.39314515, 2.39628989, 2.39943463, 2.40257937,
2.4057241 , 2.40886884, 2.41201358, 2.41515832, 2.41830305,
2.42144779, 2.42459253, 2.42773727, 2.430882 , 2.43402674,
2.43717148, 2.44031622, 2.44346095, 2.44660569, 2.44975043,
2.45289516, 2.4560399 , 2.45918464, 2.46232938, 2.46547411,
2.46861885, 2.47176359, 2.47490833, 2.47805306, 2.4811978 ,
2.48434254, 2.48748728, 2.49063201, 2.49377675, 2.49692149,
2.50006623, 2.50321096, 2.5063557 , 2.50950044, 2.51264518,
2.51578991, 2.51893465, 2.52207939, 2.52522412, 2.52836886,
2.5315136 , 2.53465834, 2.53780307, 2.54094781, 2.54409255,
2.54723729, 2.55038202, 2.55352676, 2.5566715 , 2.55981624,
2.56296097, 2.56610571, 2.56925045, 2.57239519, 2.57553992,
2.57868466, 2.5818294 , 2.58497414, 2.58811887, 2.59126361,
2.59440835, 2.59755308, 2.60069782, 2.60384256, 2.6069873 ,
2.61013203, 2.61327677, 2.61642151, 2.61956625, 2.62271098,
2.62585572, 2.62900046, 2.6321452 , 2.63528993, 2.63843467,
2.64157941, 2.64472415, 2.64786888, 2.65101362, 2.65415836,
2.6573031 , 2.66044783, 2.66359257, 2.66673731, 2.66988204,
2.67302678, 2.67617152, 2.67931626, 2.68246099, 2.68560573,
2.68875047, 2.69189521, 2.69503994, 2.69818468, 2.70132942,
2.70447416, 2.70761889, 2.71076363, 2.71390837, 2.71705311,
2.72019784, 2.72334258, 2.72648732, 2.72963206, 2.73277679,
2.73592153, 2.73906627, 2.742211 , 2.74535574, 2.74850048,
2.75164522, 2.75478995, 2.75793469, 2.76107943, 2.76422417,
2.7673689 , 2.77051364, 2.77365838, 2.77680312, 2.77994785,
2.78309259, 2.78623733, 2.78938207, 2.7925268 , 2.79567154,
2.79881628, 2.80196102, 2.80510575, 2.80825049, 2.81139523,
2.81453996, 2.8176847 , 2.82082944, 2.82397418, 2.82711891,
2.83026365, 2.83340839, 2.83655313, 2.83969786, 2.8428426 ,
2.84598734, 2.84913208, 2.85227681, 2.85542155, 2.85856629,
2.86171103, 2.86485576, 2.8680005 , 2.87114524, 2.87428998,
2.87743471, 2.88057945, 2.88372419, 2.88686892, 2.89001366,
2.8931584 , 2.89630314, 2.89944787, 2.90259261, 2.90573735,
2.90888209, 2.91202682, 2.91517156, 2.9183163 , 2.92146104,
2.92460577, 2.92775051, 2.93089525, 2.93403999, 2.93718472,
2.94032946, 2.9434742 , 2.94661894, 2.94976367, 2.95290841,
2.95605315, 2.95919788, 2.96234262, 2.96548736, 2.9686321 ,
2.97177683, 2.97492157, 2.97806631, 2.98121105, 2.98435578,
2.98750052, 2.99064526, 2.99379 , 2.99693473, 3.00007947,
3.00322421, 3.00636895, 3.00951368, 3.01265842, 3.01580316,
3.0189479 , 3.02209263, 3.02523737, 3.02838211, 3.03152684,
3.03467158, 3.03781632, 3.04096106, 3.04410579, 3.04725053,
3.05039527, 3.05354001, 3.05668474, 3.05982948, 3.06297422,
3.06611896, 3.06926369, 3.07240843, 3.07555317, 3.07869791,
3.08184264, 3.08498738, 3.08813212, 3.09127686, 3.09442159,
3.09756633, 3.10071107, 3.1038558 , 3.10700054, 3.11014528,
3.11329002, 3.11643475, 3.11957949, 3.12272423, 3.12586897,
3.1290137 , 3.13215844, 3.13530318, 3.13844792, 3.14159265])
# Two 2x2 integer matrices for the matrix-product demo.
a = np.array([[1, 2], [3, 4]])
b = np.array([[5, 6], [7, 8]])
print(a, b, sep='\n')
# Matrix product (not element-wise multiplication); shown as the cell result.
a @ b
[[1 2]
[3 4]]
[[5 6]
[7 8]]
array([[19, 22],
[43, 50]])
np.exp(a)
array([[ 2.71828183, 7.3890561 ],
[20.08553692, 54.59815003]])
np.floor(10*np.random.rand(10))
array([3., 4., 9., 6., 1., 2., 5., 1., 6., 9.])
# Two random 2x2 arrays of whole-number floats in the range 0..9.
a = np.floor(np.random.random((2, 2)) * 10)
b = np.floor(np.random.random((2, 2)) * 10)
print(a, b, '*' * 20, sep='\n')
# Join the arrays side by side (along columns), then one above the other (along rows).
print(np.concatenate((a, b), axis=1))
print(np.concatenate((a, b), axis=0))
[[6. 0.]
[0. 8.]]
[[4. 7.]
[6. 6.]]
********************
[[6. 0. 4. 7.]
[0. 8. 6. 6.]]
[[6. 0.]
[0. 8.]
[4. 7.]
[6. 6.]]
Pandas
import pandas as pd
# Two-row frame: row 0 holds 1..10 and row 1 holds 2..11, with default
# integer labels on both axes.
data = pd.DataFrame([list(range(start, start + 10)) for start in (1, 2)])
data
|   | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 |
|---|---|---|---|---|---|---|---|---|---|---|
| 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 |
| 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 |
data.head()
|   | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 |
|---|---|---|---|---|---|---|---|---|---|---|
| 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 |
| 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 |
data[0]
0 1
1 2
Name: 0, dtype: int64
data.loc[0]
0 1
1 2
2 3
3 4
4 5
5 6
6 7
7 8
8 9
9 10
Name: 0, dtype: int64
data[2][1]
4
data[[1,2]]
data.sort_values(1,inplace=False,ascending=False)
|   | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 |
|---|---|---|---|---|---|---|---|---|---|---|
| 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 |
| 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 |
data_ = pd.read_csv('data/train.csv')
data_
| PassengerId | Survived | Pclass | Name | Sex | Age | SibSp | Parch | Ticket | Fare | Cabin | Embarked |
---|
0 | 1 | 0 | 3 | Braund, Mr. Owen Harris | male | 22.0 | 1 | 0 | A/5 21171 | 7.2500 | NaN | S |
---|
1 | 2 | 1 | 1 | Cumings, Mrs. John Bradley (Florence Briggs Th... | female | 38.0 | 1 | 0 | PC 17599 | 71.2833 | C85 | C |
---|
2 | 3 | 1 | 3 | Heikkinen, Miss. Laina | female | 26.0 | 0 | 0 | STON/O2. 3101282 | 7.9250 | NaN | S |
---|
3 | 4 | 1 | 1 | Futrelle, Mrs. Jacques Heath (Lily May Peel) | female | 35.0 | 1 | 0 | 113803 | 53.1000 | C123 | S |
---|
4 | 5 | 0 | 3 | Allen, Mr. William Henry | male | 35.0 | 0 | 0 | 373450 | 8.0500 | NaN | S |
---|
5 | 6 | 0 | 3 | Moran, Mr. James | male | NaN | 0 | 0 | 330877 | 8.4583 | NaN | Q |
---|
6 | 7 | 0 | 1 | McCarthy, Mr. Timothy J | male | 54.0 | 0 | 0 | 17463 | 51.8625 | E46 | S |
---|
7 | 8 | 0 | 3 | Palsson, Master. Gosta Leonard | male | 2.0 | 3 | 1 | 349909 | 21.0750 | NaN | S |
---|
8 | 9 | 1 | 3 | Johnson, Mrs. Oscar W (Elisabeth Vilhelmina Berg) | female | 27.0 | 0 | 2 | 347742 | 11.1333 | NaN | S |
---|
9 | 10 | 1 | 2 | Nasser, Mrs. Nicholas (Adele Achem) | female | 14.0 | 1 | 0 | 237736 | 30.0708 | NaN | C |
---|
10 | 11 | 1 | 3 | Sandstrom, Miss. Marguerite Rut | female | 4.0 | 1 | 1 | PP 9549 | 16.7000 | G6 | S |
---|
11 | 12 | 1 | 1 | Bonnell, Miss. Elizabeth | female | 58.0 | 0 | 0 | 113783 | 26.5500 | C103 | S |
---|
12 | 13 | 0 | 3 | Saundercock, Mr. William Henry | male | 20.0 | 0 | 0 | A/5. 2151 | 8.0500 | NaN | S |
---|
13 | 14 | 0 | 3 | Andersson, Mr. Anders Johan | male | 39.0 | 1 | 5 | 347082 | 31.2750 | NaN | S |
---|
14 | 15 | 0 | 3 | Vestrom, Miss. Hulda Amanda Adolfina | female | 14.0 | 0 | 0 | 350406 | 7.8542 | NaN | S |
---|
15 | 16 | 1 | 2 | Hewlett, Mrs. (Mary D Kingcome) | female | 55.0 | 0 | 0 | 248706 | 16.0000 | NaN | S |
---|
16 | 17 | 0 | 3 | Rice, Master. Eugene | male | 2.0 | 4 | 1 | 382652 | 29.1250 | NaN | Q |
---|
17 | 18 | 1 | 2 | Williams, Mr. Charles Eugene | male | NaN | 0 | 0 | 244373 | 13.0000 | NaN | S |
---|
18 | 19 | 0 | 3 | Vander Planke, Mrs. Julius (Emelia Maria Vande... | female | 31.0 | 1 | 0 | 345763 | 18.0000 | NaN | S |
---|
19 | 20 | 1 | 3 | Masselmani, Mrs. Fatima | female | NaN | 0 | 0 | 2649 | 7.2250 | NaN | C |
---|
20 | 21 | 0 | 2 | Fynney, Mr. Joseph J | male | 35.0 | 0 | 0 | 239865 | 26.0000 | NaN | S |
---|
21 | 22 | 1 | 2 | Beesley, Mr. Lawrence | male | 34.0 | 0 | 0 | 248698 | 13.0000 | D56 | S |
---|
22 | 23 | 1 | 3 | McGowan, Miss. Anna "Annie" | female | 15.0 | 0 | 0 | 330923 | 8.0292 | NaN | Q |
---|
23 | 24 | 1 | 1 | Sloper, Mr. William Thompson | male | 28.0 | 0 | 0 | 113788 | 35.5000 | A6 | S |
---|
24 | 25 | 0 | 3 | Palsson, Miss. Torborg Danira | female | 8.0 | 3 | 1 | 349909 | 21.0750 | NaN | S |
---|
25 | 26 | 1 | 3 | Asplund, Mrs. Carl Oscar (Selma Augusta Emilia... | female | 38.0 | 1 | 5 | 347077 | 31.3875 | NaN | S |
---|
26 | 27 | 0 | 3 | Emir, Mr. Farred Chehab | male | NaN | 0 | 0 | 2631 | 7.2250 | NaN | C |
---|
27 | 28 | 0 | 1 | Fortune, Mr. Charles Alexander | male | 19.0 | 3 | 2 | 19950 | 263.0000 | C23 C25 C27 | S |
---|
28 | 29 | 1 | 3 | O'Dwyer, Miss. Ellen "Nellie" | female | NaN | 0 | 0 | 330959 | 7.8792 | NaN | Q |
---|
29 | 30 | 0 | 3 | Todoroff, Mr. Lalio | male | NaN | 0 | 0 | 349216 | 7.8958 | NaN | S |
---|
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
---|
861 | 862 | 0 | 2 | Giles, Mr. Frederick Edward | male | 21.0 | 1 | 0 | 28134 | 11.5000 | NaN | S |
---|
862 | 863 | 1 | 1 | Swift, Mrs. Frederick Joel (Margaret Welles Ba... | female | 48.0 | 0 | 0 | 17466 | 25.9292 | D17 | S |
---|
863 | 864 | 0 | 3 | Sage, Miss. Dorothy Edith "Dolly" | female | NaN | 8 | 2 | CA. 2343 | 69.5500 | NaN | S |
---|
864 | 865 | 0 | 2 | Gill, Mr. John William | male | 24.0 | 0 | 0 | 233866 | 13.0000 | NaN | S |
---|
865 | 866 | 1 | 2 | Bystrom, Mrs. (Karolina) | female | 42.0 | 0 | 0 | 236852 | 13.0000 | NaN | S |
---|
866 | 867 | 1 | 2 | Duran y More, Miss. Asuncion | female | 27.0 | 1 | 0 | SC/PARIS 2149 | 13.8583 | NaN | C |
---|
867 | 868 | 0 | 1 | Roebling, Mr. Washington Augustus II | male | 31.0 | 0 | 0 | PC 17590 | 50.4958 | A24 | S |
---|
868 | 869 | 0 | 3 | van Melkebeke, Mr. Philemon | male | NaN | 0 | 0 | 345777 | 9.5000 | NaN | S |
---|
869 | 870 | 1 | 3 | Johnson, Master. Harold Theodor | male | 4.0 | 1 | 1 | 347742 | 11.1333 | NaN | S |
---|
870 | 871 | 0 | 3 | Balkic, Mr. Cerin | male | 26.0 | 0 | 0 | 349248 | 7.8958 | NaN | S |
---|
871 | 872 | 1 | 1 | Beckwith, Mrs. Richard Leonard (Sallie Monypeny) | female | 47.0 | 1 | 1 | 11751 | 52.5542 | D35 | S |
---|
872 | 873 | 0 | 1 | Carlsson, Mr. Frans Olof | male | 33.0 | 0 | 0 | 695 | 5.0000 | B51 B53 B55 | S |
---|
873 | 874 | 0 | 3 | Vander Cruyssen, Mr. Victor | male | 47.0 | 0 | 0 | 345765 | 9.0000 | NaN | S |
---|
874 | 875 | 1 | 2 | Abelson, Mrs. Samuel (Hannah Wizosky) | female | 28.0 | 1 | 0 | P/PP 3381 | 24.0000 | NaN | C |
---|
875 | 876 | 1 | 3 | Najib, Miss. Adele Kiamie "Jane" | female | 15.0 | 0 | 0 | 2667 | 7.2250 | NaN | C |
---|
876 | 877 | 0 | 3 | Gustafsson, Mr. Alfred Ossian | male | 20.0 | 0 | 0 | 7534 | 9.8458 | NaN | S |
---|
877 | 878 | 0 | 3 | Petroff, Mr. Nedelio | male | 19.0 | 0 | 0 | 349212 | 7.8958 | NaN | S |
---|
878 | 879 | 0 | 3 | Laleff, Mr. Kristo | male | NaN | 0 | 0 | 349217 | 7.8958 | NaN | S |
---|
879 | 880 | 1 | 1 | Potter, Mrs. Thomas Jr (Lily Alexenia Wilson) | female | 56.0 | 0 | 1 | 11767 | 83.1583 | C50 | C |
---|
880 | 881 | 1 | 2 | Shelley, Mrs. William (Imanita Parrish Hall) | female | 25.0 | 0 | 1 | 230433 | 26.0000 | NaN | S |
---|
881 | 882 | 0 | 3 | Markun, Mr. Johann | male | 33.0 | 0 | 0 | 349257 | 7.8958 | NaN | S |
---|
882 | 883 | 0 | 3 | Dahlberg, Miss. Gerda Ulrika | female | 22.0 | 0 | 0 | 7552 | 10.5167 | NaN | S |
---|
883 | 884 | 0 | 2 | Banfield, Mr. Frederick James | male | 28.0 | 0 | 0 | C.A./SOTON 34068 | 10.5000 | NaN | S |
---|
884 | 885 | 0 | 3 | Sutehall, Mr. Henry Jr | male | 25.0 | 0 | 0 | SOTON/OQ 392076 | 7.0500 | NaN | S |
---|
885 | 886 | 0 | 3 | Rice, Mrs. William (Margaret Norton) | female | 39.0 | 0 | 5 | 382652 | 29.1250 | NaN | Q |
---|
886 | 887 | 0 | 2 | Montvila, Rev. Juozas | male | 27.0 | 0 | 0 | 211536 | 13.0000 | NaN | S |
---|
887 | 888 | 1 | 1 | Graham, Miss. Margaret Edith | female | 19.0 | 0 | 0 | 112053 | 30.0000 | B42 | S |
---|
888 | 889 | 0 | 3 | Johnston, Miss. Catherine Helen "Carrie" | female | NaN | 1 | 2 | W./C. 6607 | 23.4500 | NaN | S |
---|
889 | 890 | 1 | 1 | Behr, Mr. Karl Howell | male | 26.0 | 0 | 0 | 111369 | 30.0000 | C148 | C |
---|
890 | 891 | 0 | 3 | Dooley, Mr. Patrick | male | 32.0 | 0 | 0 | 370376 | 7.7500 | NaN | Q |
---|
891 rows × 12 columns
data_.head()
|   | PassengerId | Survived | Pclass | Name | Sex | Age | SibSp | Parch | Ticket | Fare | Cabin | Embarked |
|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | 1 | 0 | 3 | Braund, Mr. Owen Harris | male | 22.0 | 1 | 0 | A/5 21171 | 7.2500 | NaN | S |
| 1 | 2 | 1 | 1 | Cumings, Mrs. John Bradley (Florence Briggs Th... | female | 38.0 | 1 | 0 | PC 17599 | 71.2833 | C85 | C |
| 2 | 3 | 1 | 3 | Heikkinen, Miss. Laina | female | 26.0 | 0 | 0 | STON/O2. 3101282 | 7.9250 | NaN | S |
| 3 | 4 | 1 | 1 | Futrelle, Mrs. Jacques Heath (Lily May Peel) | female | 35.0 | 1 | 0 | 113803 | 53.1000 | C123 | S |
| 4 | 5 | 0 | 3 | Allen, Mr. William Henry | male | 35.0 | 0 | 0 | 373450 | 8.0500 | NaN | S |
age = data_['Age']
age.head()
0 22.0
1 38.0
2 26.0
3 35.0
4 35.0
Name: Age, dtype: float64
age_is_null = age.isnull()
age_is_null
0 False
1 False
2 False
3 False
4 False
5 True
6 False
7 False
8 False
9 False
10 False
11 False
12 False
13 False
14 False
15 False
16 False
17 True
18 False
19 True
20 False
21 False
22 False
23 False
24 False
25 False
26 True
27 False
28 True
29 True
...
861 False
862 False
863 True
864 False
865 False
866 False
867 False
868 True
869 False
870 False
871 False
872 False
873 False
874 False
875 False
876 False
877 False
878 True
879 False
880 False
881 False
882 False
883 False
884 False
885 False
886 False
887 False
888 True
889 False
890 False
Name: Age, Length: 891, dtype: bool
age[age.notnull()]
0 22.0
1 38.0
2 26.0
3 35.0
4 35.0
6 54.0
7 2.0
8 27.0
9 14.0
10 4.0
11 58.0
12 20.0
13 39.0
14 14.0
15 55.0
16 2.0
18 31.0
20 35.0
21 34.0
22 15.0
23 28.0
24 8.0
25 38.0
27 19.0
30 40.0
33 66.0
34 28.0
35 42.0
37 21.0
38 18.0
...
856 45.0
857 51.0
858 24.0
860 41.0
861 21.0
862 48.0
864 24.0
865 42.0
866 27.0
867 31.0
869 4.0
870 26.0
871 47.0
872 33.0
873 47.0
874 28.0
875 15.0
876 20.0
877 19.0
879 56.0
880 25.0
881 33.0
882 22.0
883 28.0
884 25.0
885 39.0
886 27.0
887 19.0
889 26.0
890 32.0
Name: Age, Length: 714, dtype: float64
预处理
data_.head(10)
|   | PassengerId | Survived | Pclass | Name | Sex | Age | SibSp | Parch | Ticket | Fare | Cabin | Embarked |
|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | 1 | 0 | 3 | Braund, Mr. Owen Harris | male | 22.0 | 1 | 0 | A/5 21171 | 7.2500 | NaN | S |
| 1 | 2 | 1 | 1 | Cumings, Mrs. John Bradley (Florence Briggs Th... | female | 38.0 | 1 | 0 | PC 17599 | 71.2833 | C85 | C |
| 2 | 3 | 1 | 3 | Heikkinen, Miss. Laina | female | 26.0 | 0 | 0 | STON/O2. 3101282 | 7.9250 | NaN | S |
| 3 | 4 | 1 | 1 | Futrelle, Mrs. Jacques Heath (Lily May Peel) | female | 35.0 | 1 | 0 | 113803 | 53.1000 | C123 | S |
| 4 | 5 | 0 | 3 | Allen, Mr. William Henry | male | 35.0 | 0 | 0 | 373450 | 8.0500 | NaN | S |
| 5 | 6 | 0 | 3 | Moran, Mr. James | male | NaN | 0 | 0 | 330877 | 8.4583 | NaN | Q |
| 6 | 7 | 0 | 1 | McCarthy, Mr. Timothy J | male | 54.0 | 0 | 0 | 17463 | 51.8625 | E46 | S |
| 7 | 8 | 0 | 3 | Palsson, Master. Gosta Leonard | male | 2.0 | 3 | 1 | 349909 | 21.0750 | NaN | S |
| 8 | 9 | 1 | 3 | Johnson, Mrs. Oscar W (Elisabeth Vilhelmina Berg) | female | 27.0 | 0 | 2 | 347742 | 11.1333 | NaN | S |
| 9 | 10 | 1 | 2 | Nasser, Mrs. Nicholas (Adele Achem) | female | 14.0 | 1 | 0 | 237736 | 30.0708 | NaN | C |
# Survival rate per passenger class: the mean of the 0/1 'Survived' column
# within each 'Pclass' group.
# The aggregation is named by the string 'mean' rather than passing np.mean:
# recent pandas releases emit a FutureWarning for the NumPy callable, while
# the string form gives the same result without the warning.
data_1 = data_.pivot_table(index='Pclass', values='Survived', aggfunc='mean')
data_1
| Pclass | Survived |
|---|---|
| 1 | 0.629630 |
| 2 | 0.472826 |
| 3 | 0.242363 |