# patientzero/group_k_fold_example.py

## group_k_fold_example.py
from sklearn.model_selection import GroupKFold
# Number of cross-validation folds. GroupKFold requires at least this many
# distinct groups; otherwise split() raises a ValueError.
n_splits = 10
# All PNG images below data_dir, searched recursively.
# NOTE(review): data_dir is not defined in this snippet; it is presumably a
# pathlib.Path set up by the surrounding code -- confirm.
pics = list(data_dir.glob('**/*.png'))
# Matching labels: the stem of the directory that contains each image.
labels = [pic.parent.stem for pic in pics]
# Group id of each image: the second '_'-separated field of the file stem.
# Images that share a group id are never split between train and test.
# NOTE(review): a file name without '_' raises IndexError here -- confirm
# that every image follows the '<prefix>_<group>...' naming scheme.
groups = [pic.stem.split('_')[1] for pic in pics]
gkf = GroupKFold(n_splits=n_splits)

# Iterate over splits:
for train, test in gkf.split(pics, labels, groups=groups):
    # train & test contain indices for pics/labels; use them to select the
    # samples that belong to this fold.
    train_pics = [pics[i] for i in train]
    train_labels = [labels[i] for i in train]
    test_pics = [pics[i] for i in test]
    test_labels = [labels[i] for i in test]
    # do training here