Stratified Train Test Split

PHOTO EMBED

Tue May 17 2022 16:45:31 GMT+0000 (Coordinated Universal Time)

Saved by @biggusdickus #python

from sklearn.model_selection import StratifiedShuffleSplit
# Configure a single stratified shuffle split: 25% of the rows go to the
# test side, and random_state=0 pins the shuffle so reruns match.
sss = StratifiedShuffleSplit(n_splits=1, test_size=0.25, random_state=0)

# n_splits=1 means the splitter yields exactly one (train, test) pair of
# positional index arrays, so take it directly instead of looping.
# Stratification uses the "km_driven_cat" column of df.
# NOTE(review): df is defined elsewhere; presumably a pandas DataFrame
# (it is indexed with .iloc below) -- confirm against the caller.
train_index, test_index = next(sss.split(df, df["km_driven_cat"]))
train_set = df.iloc[train_index]
test_set = df.iloc[test_index]
content_copyCOPY