1. 模拟数据
In [1]: import pandas as pd
In [2]: import numpy as np
In [3]: company=["A","B","C"]  # pool of company labels that each simulated row is drawn from
...:
...: data=pd.DataFrame({  # 10-row frame of simulated records; uses NumPy's global RNG and no seed is set in the cells shown, so values differ on every run
...: "company":[company[x] for x in np.random.randint(0,len(company),10)],  # 10 random indices in [0, len(company)), each mapped to its label
...: "salary":np.random.randint(5,50,10),  # 10 random integers in [5, 50) (upper bound exclusive)
...: "age":np.random.randint(15,50,10)  # 10 random integers in [15, 50) (upper bound exclusive)
...: }
...: )
In [4]: company  # echo the label list to confirm its contents
Out[4]: ['A', 'B', 'C']
In [5]: data  # display the simulated frame; the rows below are one random sample and will not match a re-run
Out[5]:
company salary age
0 C 45 18
1 B 43 33
2 A 19 21
3 B 39 21
4 A 49 28
5 A 14