= pd.read_csv("../input/30-days-of-ml/train.csv") df_train
::: {#4e7e904b .cell _cell_guid=‘b1076dfc-b9ad-4769-8c92-a6c4dae69d19’ _uuid=‘8f2839f25d086af736a60e9eeb907d3b93b6e0e5’ execution=‘{“iopub.execute_input”:“2021-08-16T20:16:18.360034Z”,“iopub.status.busy”:“2021-08-16T20:16:18.358906Z”,“iopub.status.idle”:“2021-08-16T20:16:19.347479Z”,“shell.execute_reply”:“2021-08-16T20:16:19.348020Z”,“shell.execute_reply.started”:“2021-08-16T20:05:04.468564Z”}’ papermill=‘{“duration”:0.999913,“end_time”:“2021-08-16T20:16:19.348363”,“exception”:false,“start_time”:“2021-08-16T20:16:18.348450”,“status”:“completed”}’ tags=‘[]’ execution_count=1}
import numpy as np
import pandas as pd
from sklearn import model_selection
:::
"kfold"] = -1 df_train[
= model_selection.KFold(n_splits=5, shuffle=True, random_state=42)
kf for fold, (train_indicies, valid_indicies) in enumerate(kf.split(X=df_train)):
"kfold"] = fold df_train.loc[valid_indicies,
"train_folds.csv", index=False) df_train.to_csv(