import pandas as pd
# Toy data set: one row per item, with a categorical 'type' label column.
df = pd.DataFrame(
    [
        ['red', 'M', 10.1, 'type1'],
        ['blue', 'L', 12.5, 'type1'],
        ['white', 'XL', 13.3, 'type2'],
    ],
    columns=['color', 'size', 'price', 'type'],
)
print(df)

# Assign every distinct type label an integer code, in order of first
# appearance in the column.
_type_labels = df['type'].unique()
type_mapping = dict(zip(_type_labels, range(len(_type_labels))))
print(type_mapping)

# Encode: store the integer code of each row's type label in 'type_id'.
df['type_id'] = df['type'].map(type_mapping)
print(df)

# Decode: swap keys and values to get code -> label, then map the codes in
# 'type_id' back to the original labels (the column is overwritten).
inv_type_mapping = dict(zip(type_mapping.values(), type_mapping.keys()))
df['type_id'] = df['type_id'].map(inv_type_mapping)
print(df)
# result: the output of the print() calls above
# Build the same label <-> integer mapping with scikit-learn's LabelEncoder
# instead of a hand-written dictionary.
from sklearn.preprocessing import LabelEncoder

type_le = LabelEncoder()

# Encode: fit the encoder on the 'type' labels and store the resulting
# integer codes in 'type_id'.
_type_values = df['type'].values
df['type_id'] = type_le.fit_transform(_type_values)
print(df, "type_id")

# Decode: turn the integer codes in 'type_id' back into the original labels
# (the column is overwritten).
_type_codes = df['type_id'].values
df['type_id'] = type_le.inverse_transform(_type_codes)
print(df, "type_id")
# result: the output of the print() calls above