ML- Pandas Dataframe:
X y .
(X_train, y_train) (X_test, y_test).
AUC ( ). " IndexError: " - y_train, 1-D , 2-D , . "y_train" y_train [ ""] .
import pandas as pd
from sklearn.model_selection import cross_val_score
from sklearn.model_selection import StratifiedShuffleSplit
data_X = df.drop(['y'], axis=1)
data_y = pd.DataFrame(df['y'])
rs = StratifiedShuffleSplit(n_splits=2, test_size=0.3,random_state=2)
rs.get_n_splits(data_X,data_y)
for train_index, test_index in rs.split(data_X,data_y):
X_train,X_test = data_X.iloc[train_index], data_X.iloc[test_index]
y_train,y_test = data_y.iloc[train_index], data_y.iloc[test_index]
classify_cross_val_score = cross_val_score(classify, X_train, y_train, cv=5, scoring='roc_auc').mean()
print("Classify_Cross_Val_Score ",classify_cross_val_score)
classify_cross_val_score = cross_val_score(classify, X_train, y_train['y'], cv=5, scoring='roc_auc').mean()
print("Classify_Cross_Val_Score ",classify_cross_val_score)
print(y_train.shape)
print(y_train['y'].shape)
:
Classify_Cross_Val_Score 0.7021433588790991
(31647, 1)
(31647,)
: sklearn.model_selection cross_val_score. cross_val_score sklearn.model_selection, sklearn.cross_validation, .