非常感谢你,Vivek!由于你的帮助,我已经解决了这个问题。
def data_transformation2(data, data_test, dummy):
    """Label-encode then one-hot encode the categorical columns in ``dummy``.

    Each column named in ``dummy`` is integer-encoded with a ``LabelEncoder``
    fitted on the training column only, and the same fitted mapping is applied
    to the test column so that a given category receives the same code in both
    frames. A ``OneHotEncoder`` is then fitted on the encoded training columns
    and applied to both sets.

    Args:
        data: Training table, indexed by column name (presumably a pandas
            DataFrame -- confirm against the caller). The columns listed in
            ``dummy`` are overwritten in place with their integer codes.
        data_test: Test table with the same columns; also overwritten in
            place.
        dummy: List of column names to encode.

    Returns:
        None. The one-hot matrices are only used to print their shapes.

    Raises:
        ValueError: If a test column contains a category that never occurs in
            the corresponding training column (raised by
            ``LabelEncoder.transform``).
    """
    le = LabelEncoder()

    # Encoding the columns with multiple categorical levels
    for col in dummy:
        # Fit on the training column only. Re-fitting on the test column would
        # assign codes from the test set's own sorted categories, so identical
        # categories could end up with different integers in train and test.
        le.fit(data[col])
        # Compute both transforms before assigning so the result is still
        # correct if ``data`` and ``data_test`` refer to the same object.
        train_codes = le.transform(data[col])
        test_codes = le.transform(data_test[col])
        data[col] = train_codes
        data_test[col] = test_codes

    enc = OneHotEncoder()
    dummy_data = np.array(data[dummy])
    dummy_data_test = np.array(data_test[dummy])

    # The one-hot layout is learned from the training data and reused for the
    # test data, so both matrices have the same number of columns.
    enc.fit(dummy_data)
    dummy_data = enc.transform(dummy_data).toarray()
    dummy_data_test = enc.transform(dummy_data_test).toarray()

    print(dummy_data.shape)
    print(dummy_data_test.shape)