Python
파이썬_데이터 전처리 (Encoding) Data Preprocessing, GET DUMMIES, ONE HOT ENCODING, LABEL ENCODING
정문가
2020. 9. 6. 17:32
In [1]:
### LABEL ENCODING ###
# Turn each category string into an integer code with scikit-learn's
# LabelEncoder.
from sklearn.preprocessing import LabelEncoder

items = ['냉장고', '전자레인지', '컴퓨터', '선풍기', '믹서', '믹서']

encoder = LabelEncoder()
# fit_transform learns the distinct classes and encodes `items` in one call;
# the fitted `encoder` is kept so its classes can be inspected afterwards.
labels = encoder.fit_transform(items)
print(labels)
In [2]:
# Show the distinct classes learned by the fitted encoder; the position of
# each class in this array is the integer code produced by transform().
print(encoder.classes_)
In [8]:
### ONE-HOT ENCODING ###
# Two-step pipeline: strings -> integer codes (LabelEncoder) -> one-hot
# matrix (OneHotEncoder).
# NOTE: LabelEncoder is not imported here; this cell relies on the import
# made in the label-encoding cell.
from sklearn.preprocessing import OneHotEncoder
import numpy as np

items = ['냉장고', '전자레인지', '컴퓨터', '선풍기', '믹서', '믹서']

# Step 1: integer-encode the strings, then reshape to a single column
# because OneHotEncoder works on 2-D input (samples x features).
encoder = LabelEncoder()
labels = encoder.fit_transform(items).reshape(-1, 1)

# Step 2: one-hot encode the integer column.
oh_encoder = OneHotEncoder()
oh_labels = oh_encoder.fit_transform(labels)

# Convert the encoder output to a dense array so the notebook displays it.
oh_labels.toarray()
Out[8]:
In [10]:
### GET DUMMIES ###
# Build a one-column DataFrame holding the same category strings so that
# pandas can one-hot encode it.
import pandas as pd

df = pd.DataFrame(
    ['냉장고', '전자레인지', '컴퓨터', '선풍기', '믹서', '믹서'],
    columns=['item'],
)
# Preview the first rows of the frame.
df.head()
Out[10]:
In [11]:
# One-hot encode the DataFrame directly with pandas: the string column `item`
# is expanded into one indicator column per distinct value, with no separate
# label-encoding step.
pd.get_dummies(df)
Out[11]: