Skip to content

Instantly share code, notes, and snippets.

What would you like to do?
Simple script to check if you run into ValueErrors when you do grid search with more jobs/folds than you have cores.
#!/usr/bin/env python
"""
Simple test script to see if we get ValueErrors with joblib and the current
version of Python
"""
import logging
import sys
from multiprocessing import cpu_count
import sklearn.datasets
from sklearn.grid_search import GridSearchCV
from sklearn.svm import LinearSVC
# Python 2.x backward compatibility
if sys.version_info < (3, 0):
    # Only rebind on Python 2, where ``xrange`` exists; on Python 3 the
    # builtin ``range`` is left untouched.
    range = xrange  # noqa: F821
def main():
    """Run a simple test.

    Loads the iris data set and repeatedly runs a ``GridSearchCV`` over a
    ``LinearSVC`` with more parallel jobs than the machine has cores, to see
    whether joblib raises ``ValueError`` under that load.
    """
    # initialize the logger
    # NOTE(review): the original call was cut off after the ``format``
    # argument. ``level=logging.INFO`` is reconstructed so the
    # ``logging.info`` messages below are actually emitted -- confirm.
    logging.basicConfig(format='%(asctime)s - %(levelname)s - %(message)s',
                        level=logging.INFO)

    # Load test data
    logging.info('Loading iris data...')
    iris = sklearn.datasets.load_iris()

    # Set number of folds to be 2.5 times as many cores as we have
    num_folds = int(cpu_count() * 2.5)

    # Try to grid search a whole bunch of times
    for i in range(1000):
        logging.info('Grid search run {0} out of 1000'.format(i))
        # NOTE(review): the original call was cut off after ``n_jobs``.
        # ``cv=num_folds`` and the ``fit`` on the iris data are reconstructed
        # from the "number of folds" comment above -- confirm.
        GridSearchCV(LinearSVC(), param_grid={'C': [1, 10]}, n_jobs=num_folds,
                     cv=num_folds).fit(iris.data, iris.target)
# Run the test only when executed as a script, not when imported.
if __name__ == '__main__':
    main()
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment
You can’t perform that action at this time.