# c-bata/generator.py

## generator.py
# Requirements:
# $ pip install optuna optuna-dashboard diffusers transformers accelerate scipy safetensors xformers botorch
#
# Process A: Launch a process that suggests new params and generates images.
# $ python generator.py
#
# Process B: Launch an Optuna Dashboard process.
# $ optuna-dashboard sqlite:///db.sqlite3 --artifact-dir ./artifact
import os
import time
import tempfile

import optuna
import torch
from optuna.trial import TrialState
from optuna.artifacts import upload_artifact, FileSystemArtifactStore
from optuna_dashboard.preferential import create_study
from optuna_dashboard.preferential.samplers.gp import PreferentialGPSampler
from optuna_dashboard import register_preference_feedback_component
from diffusers import StableDiffusionImg2ImgPipeline
from PIL import Image

# Target device and tensor dtype used for the diffusion pipeline.
device = "cuda:0"
torch_dtype = torch.float16

# Base image for img2img: read from ./input.png, scaled to 768x768, then
# converted to RGB.
init_img = Image.open("./input.png").resize((768, 768)).convert("RGB")
# Torch random generator created on `device`; passed to the pipeline call.
rng = torch.Generator(device)

# Upload destination for images (artifacts): a FileSystemArtifactStore that
# saves under the "artifact" directory located beside this script.
base_path = os.path.join(os.path.dirname(__file__), "artifact")
os.makedirs(base_path, exist_ok=True)
artifact_store = FileSystemArtifactStore(base_path=base_path)


def suggest_and_generate_image(study: optuna.Study, pipe: StableDiffusionImg2ImgPipeline, tmpdir: str) -> None:
    """Sample one trial, render its image with img2img and attach it to the trial.

    The study is asked for a new trial, the pipeline parameters and prompt
    keywords are sampled from it, the image is rendered from the module-level
    ``init_img``, saved as a PNG in ``tmpdir``, uploaded to ``artifact_store``,
    and the resulting artifact id is stored in the trial's ``"image"`` user
    attribute.

    Args:
        study: Study that is asked for the new trial.
        pipe: Img2img pipeline used to render the image.
        tmpdir: Directory in which the PNG is written before it is uploaded.
    """
    # Create an Optuna trial and sample the parameters as well as the keywords
    # that are included in the prompts.
    trial = study.ask()
    guidance_scale = trial.suggest_float("guidance_scale", 1, 50)
    strength = trial.suggest_float("strength", 0.70, 1.0)
    num_inference_steps = trial.suggest_int("num_inference_steps", 5, 100)

    prompts = [
        "a mascot character with two eyes and a mouth",
        trial.suggest_categorical("adjectives", ["cute", "funny", "memorable", "charming", "entertaining"]),
        trial.suggest_categorical("style", ["anime", "photo", "painting", ""]),
        trial.suggest_categorical("facial-expression", ["smiling", "frowning", "grinning", ""]),
    ]
    negative_prompts = [
        trial.suggest_categorical("negative-quality", ["unnatural", "low-quality", ""]),
        trial.suggest_categorical("negative-adjectives", ["dull", "boring", "unfriendly", ""]),
    ]

    # The choice "" stands for "no keyword". Drop it before joining so the
    # prompts do not contain empty ", , " segments or a bare ", ".
    prompt = ", ".join(keyword for keyword in prompts if keyword)
    negative_prompt = ", ".join(keyword for keyword in negative_prompts if keyword)

    # Run img2img.
    image = pipe(
        prompt,
        negative_prompt=negative_prompt,
        generator=rng,
        strength=strength,
        image=init_img,
        guidance_scale=guidance_scale,
        num_inference_steps=num_inference_steps,
        num_images_per_prompt=1,
    ).images[0]

    image_path = os.path.join(tmpdir, f"sample-{trial.number}.png")
    image.save(image_path)

    # Upload to the artifact store and remember the artifact id on the trial.
    artifact_id = upload_artifact(trial, image_path, artifact_store)
    trial.set_user_attr("image", artifact_id)


def main():
    """Set up the study and the img2img pipeline, then generate images forever.

    Creates (or loads, if it already exists) the "preferential_diffusion"
    study in ``sqlite:///db.sqlite3``, registers the artifact stored under the
    "image" key as the preference feedback component, loads the Stable
    Diffusion pipeline onto ``device`` and then loops without end, generating
    a new image whenever the study reports that one should be generated.
    """
    preferential_study = create_study(
        study_name="preferential_diffusion",
        storage="sqlite:///db.sqlite3",
        sampler=PreferentialGPSampler(),
        load_if_exists=True,
        n_generate=3,
    )
    register_preference_feedback_component(
        preferential_study,
        component_type="artifact",
        artifact_key="image",
    )

    sd_pipeline = StableDiffusionImg2ImgPipeline.from_pretrained(
        "stabilityai/stable-diffusion-2-1",
        torch_dtype=torch_dtype,
    ).to(device)
    sd_pipeline.enable_xformers_memory_efficient_attention()

    # Start preferential optimization. Images are staged in a temporary
    # directory that lives as long as the loop does.
    with tempfile.TemporaryDirectory() as workdir:
        while True:
            if preferential_study.should_generate():
                suggest_and_generate_image(preferential_study, sd_pipeline, workdir)
            else:
                # Nothing to generate right now; sleep briefly to avoid a busy loop.
                time.sleep(0.1)


# Start the generator loop only when this file is executed as a script.
if __name__ == "__main__":
    main()
	# Requirements:
	# $ pip install optuna optuna-dashboard diffusers transformers accelerate scipy safetensors xformers botorch
	#
	# Process A: Launch a process that suggests new params and generates images.
	# $ python generator.py
	#
	# Process B: Launch an Optuna Dashboard process.
	# $ optuna-dashboard sqlite:///db.sqlite3 --artifact-dir ./artifact
	import os
	import time
	import tempfile

	import optuna
	import torch
	from optuna.trial import TrialState
	from optuna.artifacts import upload_artifact, FileSystemArtifactStore
	from optuna_dashboard.preferential import create_study
	from optuna_dashboard.preferential.samplers.gp import PreferentialGPSampler
	from optuna_dashboard import register_preference_feedback_component
	from diffusers import StableDiffusionImg2ImgPipeline
	from PIL import Image

	# Target device and tensor dtype used for the diffusion pipeline.
	device = "cuda:0"
	torch_dtype = torch.float16

	# Base image for img2img: read from ./input.png, scaled to 768x768, then
	# converted to RGB.
	init_img = Image.open("./input.png").resize((768, 768)).convert("RGB")
	# Torch random generator created on `device`; passed to the pipeline call.
	rng = torch.Generator(device)

	# Upload destination for images (artifacts): a FileSystemArtifactStore that
	# saves under the "artifact" directory located beside this script.
	base_path = os.path.join(os.path.dirname(__file__), "artifact")
	os.makedirs(base_path, exist_ok=True)
	artifact_store = FileSystemArtifactStore(base_path=base_path)


	def suggest_and_generate_image(study: optuna.Study, pipe: StableDiffusionImg2ImgPipeline, tmpdir: str) -> None:
		"""Sample one trial, render its image with img2img and attach it to the trial.

		The study is asked for a new trial, the pipeline parameters and prompt
		keywords are sampled from it, the image is rendered from the module-level
		``init_img``, saved as a PNG in ``tmpdir``, uploaded to ``artifact_store``,
		and the resulting artifact id is stored in the trial's ``"image"`` user
		attribute.

		Args:
			study: Study that is asked for the new trial.
			pipe: Img2img pipeline used to render the image.
			tmpdir: Directory in which the PNG is written before it is uploaded.
		"""
		# Create an Optuna trial and sample the parameters as well as the keywords
		# that are included in the prompts.
		trial = study.ask()
		guidance_scale = trial.suggest_float("guidance_scale", 1, 50)
		strength = trial.suggest_float("strength", 0.70, 1.0)
		num_inference_steps = trial.suggest_int("num_inference_steps", 5, 100)

		prompts = [
			"a mascot character with two eyes and a mouth",
			trial.suggest_categorical("adjectives", ["cute", "funny", "memorable", "charming", "entertaining"]),
			trial.suggest_categorical("style", ["anime", "photo", "painting", ""]),
			trial.suggest_categorical("facial-expression", ["smiling", "frowning", "grinning", ""]),
		]
		negative_prompts = [
			trial.suggest_categorical("negative-quality", ["unnatural", "low-quality", ""]),
			trial.suggest_categorical("negative-adjectives", ["dull", "boring", "unfriendly", ""]),
		]

		# The choice "" stands for "no keyword". Drop it before joining so the
		# prompts do not contain empty ", , " segments or a bare ", ".
		prompt = ", ".join(keyword for keyword in prompts if keyword)
		negative_prompt = ", ".join(keyword for keyword in negative_prompts if keyword)

		# Run img2img.
		image = pipe(
			prompt,
			negative_prompt=negative_prompt,
			generator=rng,
			strength=strength,
			image=init_img,
			guidance_scale=guidance_scale,
			num_inference_steps=num_inference_steps,
			num_images_per_prompt=1,
		).images[0]

		image_path = os.path.join(tmpdir, f"sample-{trial.number}.png")
		image.save(image_path)

		# Upload to the artifact store and remember the artifact id on the trial.
		artifact_id = upload_artifact(trial, image_path, artifact_store)
		trial.set_user_attr("image", artifact_id)


	def main():
		"""Set up the study and the img2img pipeline, then generate images forever.

		Creates (or loads, if it already exists) the "preferential_diffusion"
		study in ``sqlite:///db.sqlite3``, registers the artifact stored under the
		"image" key as the preference feedback component, loads the Stable
		Diffusion pipeline onto ``device`` and then loops without end, generating
		a new image whenever the study reports that one should be generated.
		"""
		study = create_study(
			study_name="preferential_diffusion",
			storage="sqlite:///db.sqlite3",
			sampler=PreferentialGPSampler(),
			load_if_exists=True,
			n_generate=3,
		)
		register_preference_feedback_component(study, component_type="artifact", artifact_key="image")

		pipe = StableDiffusionImg2ImgPipeline.from_pretrained(
			"stabilityai/stable-diffusion-2-1",
			torch_dtype=torch_dtype,
		)
		pipe = pipe.to(device)
		pipe.enable_xformers_memory_efficient_attention()

		# Start preferential optimization. Images are staged in a temporary
		# directory that lives as long as the loop does.
		with tempfile.TemporaryDirectory() as tmpdir:
			while True:
				if not study.should_generate():
					time.sleep(0.1)  # Avoid busy-loop
					continue
				suggest_and_generate_image(study, pipe, tmpdir)


	# Start the generator loop only when this file is executed as a script.
	if __name__ == '__main__':
		main()