# Encoder
import os
import numpy as np
import pandas as pd
from sklearn.preprocessing import LabelEncoder, OneHotEncoder

# Configure the data path and load the application_train table.
dir_data = '../../data/Part01/Part01/'
f_app_train = os.path.join(dir_data, 'application_train.csv')
app_train = pd.read_csv(f_app_train)

# Keep only the weekday column, wrapped in its own single-column DataFrame,
# so the encoders below operate on exactly one feature.
sub_train = pd.DataFrame(app_train['WEEKDAY_APPR_PROCESS_START'])
print(sub_train.shape)
sub_train.head()

# Step 1: label encoding. The column is copied into a 2-D array and its only
# column is overwritten in place with the codes produced by LabelEncoder.
# NOTE(review): the column presumably holds day-name strings, which would make
# `ndata` an object-dtype array even after this assignment -- confirm.
labelencoder = LabelEncoder()
ndata = np.array(sub_train)
ndata[:, 0] = labelencoder.fit_transform(ndata[:, 0])

# Step 2: one-hot encoding of the label codes. `fit` returns the encoder
# itself, so `enc` and `oneHotCoder` refer to the same fitted object; the
# transformed output is densified with `.toarray()`.
oneHotCoder = OneHotEncoder()
enc = oneHotCoder.fit(ndata)
result = enc.transform(ndata).toarray()
print(result.shape)

# Wrap the dense one-hot matrix in a DataFrame for inspection.
test = pd.DataFrame(result)
test.head()