
@vtalpaert
Created October 20, 2023 10:39
This gist is an overcomplicated way to reproduce `study.optimize(objective, n_trials=n_trials, n_jobs=more_than_one)` for CUDA libraries that do not play well with a background-thread context. Instead of threads, we use multiprocessing. Useful when you encounter errors such as CUDA_ERROR_ILLEGAL_ADDRESS or CUBLAS_STATUS_NOT_INITIALIZED.
import os
import time
import multiprocessing

import optuna


# Objective function; returns the score to maximize
def objective(trial):
    return 1


def optimize(study_name, n_trials, sleep):
    print(f"Starting study {study_name} for {n_trials} trials, waiting {sleep}s")
    # You need a sleep here, otherwise all processes will open the journal
    # at the same time and generate the same trial parameters
    time.sleep(sleep)
    storage = optuna.storages.JournalStorage(
        optuna.storages.JournalFileStorage(f"optuna/{study_name}.log")
    )
    # Load the existing study, do not re-create it
    study = optuna.load_study(study_name=study_name, storage=storage)
    # A single-job study keeps my CUDA library (it was pykeops) happy
    study.optimize(objective, n_trials=n_trials, n_jobs=1)


if __name__ == "__main__":
    n_trials = 1000
    n_jobs = 20
    study_name = "my-gist"
    # Don't create more jobs than CPU threads
    _n_jobs = min(n_jobs, os.cpu_count() - 1)
    # Wait between job starts
    _wait = 5  # [s]
    # Create storage
    os.makedirs("optuna", exist_ok=True)
    storage = optuna.storages.JournalStorage(
        optuna.storages.JournalFileStorage(f"optuna/{study_name}.log")
    )
    # Create the study once here; workers only load it. Adapt load_if_exists
    study = optuna.create_study(
        direction="maximize",
        study_name=study_name,
        storage=storage,
        load_if_exists=True,
    )
    multiprocessing.set_start_method("spawn")
    with multiprocessing.Pool(_n_jobs) as pool:
        # One task per worker; using range(_n_jobs) keeps the total trial
        # count at _n_jobs * int(n_trials / _n_jobs)
        pool.starmap(optimize, [
            (study_name, int(n_trials / _n_jobs), job_id * _wait)
            for job_id in range(_n_jobs)
        ])
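Note that `int(n_trials / _n_jobs)` drops any remainder, so the pool can run slightly fewer than `n_trials` trials in total (e.g. 1000 trials over 19 workers gives 19 × 52 = 988). A minimal sketch of an exact split, if that matters to you (the helper name `split_trials` is mine, not from the gist):

```python
def split_trials(n_trials, n_workers):
    # Distribute n_trials across n_workers so the counts sum exactly to n_trials;
    # the first `extra` workers get one additional trial each
    base, extra = divmod(n_trials, n_workers)
    return [base + 1 if i < extra else base for i in range(n_workers)]
```

You would then pass `split_trials(n_trials, _n_jobs)[job_id]` as the second `starmap` argument instead of `int(n_trials / _n_jobs)`.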
@vtalpaert (Author) commented:
See also https://pytorch.org/docs/stable/multiprocessing.html#spawning-subprocesses for a PyTorch-specific and simpler one-liner:

torch.multiprocessing.spawn(optimize, args=(study_name, int(n_trials / _n_jobs)), nprocs=n_jobs, join=True, daemon=False, start_method='spawn')

Note that `spawn` passes the process index as the first positional argument, so `optimize` must be adapted to accept it; the index can replace `job_id` for computing the stagger delay.
