sklearn-onehot编码

import  numpy as np
from sklearn.preprocessing import LabelEncoder  # 将类别转变为数字
from sklearn.preprocessing import OneHotEncoder  # 对数字进行one-hot编码,向量化

# Sample categorical data: six observations drawn from four distinct classes.
x = np.array(['a', 'a', 'b', 'c', 'd', 'c'])

# LabelEncoder maps every distinct string to an integer code.
x_lab = LabelEncoder().fit_transform(x)

# OneHotEncoder expects 2-D input of shape (n_samples, n_features), so the
# 1-D code vector is viewed as a single feature column.
x_col = x_lab.reshape(-1, 1)
print(x_col)

# The original call passed `sparse=False`; that keyword was deprecated in
# scikit-learn 1.2 (renamed to `sparse_output`) and removed in 1.4, where it
# raises TypeError. Keeping the encoder's default sparse result and converting
# it with `.toarray()` yields the same dense array on old and new versions.
y_lab = OneHotEncoder().fit_transform(x_col).toarray()
print(y_lab)

猜你喜欢

转载自blog.csdn.net/huangqihao723/article/details/81220682