|
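"""Launch a small random hyperparameter search for the colors model on Lightning Studio.

Builds the full Cartesian product of hyperparameter values, samples NUM_JOBS
combinations, and submits one `newmain.py fit` run per combination through the
Studio "jobs" plugin.
"""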
import subprocess  # noqa: F401  (kept for the optional local subprocess.run path below)
import sys
from random import sample, seed

import numpy as np  # noqa: F401  (used only by the commented-out value grids below)

from lightning_sdk import Machine, Studio

# Fix the RNG seed for consistency of randomly sampled experiments.
seed(19920921)

# Random-search budget: how many sampled configurations to submit as jobs.
NUM_JOBS = 10

# Define the ranges or sets of values for each hyperparameter.
# alpha_values = list(np.round(np.linspace(2, 4, 21), 4))
# learning_rate_values = list(np.round(np.logspace(-5, -3, 21), 5))
learning_rate_values = [1e-3]
# learning_rate_values = [5e-4]

# alpha_values = [0, 0.25, 0.5, 0.75, 1]  # alpha = 0 is unsupervised; alpha = 1 is supervised.
alpha_values = [0, 0.1]
widths = [2**k for k in range(4, 13)]  # 16 through 4096
depths = [1, 2, 4, 8, 16]
dropouts = [0, 0.25, 0.5]
# widths, depths = [512], [4]

batch_size_values = [256]
max_epochs_values = [420]  # at 12 fps, around 35 s
seeds = list(range(21, 1992))

optimizers = [
    # "Adagrad",
    "Adam",
    "SGD",
    # "AdamW",
    # "LBFGS",
    # "RAdam",
    # "RMSprop",
    # "Adadelta",
]

# Generate all possible combinations of hyperparameters (full Cartesian product).
all_params = [
    (alpha, lr, bs, me, s, w, d, opt, dr)
    for alpha in alpha_values
    for lr in learning_rate_values
    for bs in batch_size_values
    for me in max_epochs_values
    for s in seeds
    for w in widths
    for d in depths
    for opt in optimizers
    for dr in dropouts
]
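
# With the values above this grid has 2 * 1971 * 9 * 5 * 2 * 3 = 1,064,340 entries.
# The comprehension is equivalent to itertools.product (sketch, not used here):
# from itertools import product
# all_params = list(
#     product(alpha_values, learning_rate_values, batch_size_values,
#             max_epochs_values, seeds, widths, depths, optimizers, dropouts)
# )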

# Perform a random search within the budget: sample NUM_JOBS configurations
# without replacement (min() guards against a grid smaller than the budget).
search_params = sample(all_params, min(NUM_JOBS, len(all_params)))

# Early-stopping flags that can be appended to the command below, currently disabled:
# --trainer.callbacks+ lightning.pytorch.callbacks.EarlyStopping \
# --trainer.callbacks.init_args.monitor hp_metric \

for idx, params in enumerate(search_params):
    a, lr, bs, me, s, w, d, opt, dr = params
    # cmd = f"cd ~/colors && python main.py --alpha {a} --lr {lr} --bs {bs} --max_epochs {me} --seed {s} --width {w}"
    cmd = f"""
    cd ~/colors && python newmain.py fit \
        --seed_everything {s} \
        --data.batch_size {bs} \
        --data.train_size 0 \
        --data.val_size 10000 \
        --model.alpha {a} \
        --model.width {w} \
        --model.depth {d} \
        --model.bias true \
        --model.loop true \
        --model.transform tanh \
        --model.dropout {dr} \
        --trainer.min_epochs 10 \
        --trainer.max_epochs {me} \
        --trainer.log_every_n_steps 3 \
        --trainer.check_val_every_n_epoch 1 \
        --trainer.limit_val_batches 50 \
        --trainer.callbacks callbacks.SaveImageCallback \
        --trainer.callbacks.init_args.final_dir out \
        --trainer.callbacks.init_args.save_interval 1 \
        --optimizer torch.optim.{opt} \
        --optimizer.init_args.lr {lr} \
        --trainer.callbacks+ lightning.pytorch.callbacks.LearningRateFinder
    """
    # Optional LR-scheduler flags, currently disabled:
    # --lr_scheduler lightning.pytorch.cli.ReduceLROnPlateau \
    # --lr_scheduler.init_args.monitor hp_metric \
    # --lr_scheduler.init_args.factor 0.05 \
    # --lr_scheduler.init_args.patience 5 \
    # --lr_scheduler.init_args.cooldown 10 \
    # --lr_scheduler.init_args.verbose true

    print(f"Running {params}: {cmd}")

    try:
        studio = Studio("colors-animate-jobs")
        studio.install_plugin("jobs")
        job_plugin = studio.installed_plugins["jobs"]
        job_name = f"colors-animate-20240303-{idx}"
        # Submit the command as a named job on a T4 machine.
        job_plugin.run(cmd, machine=Machine.T4, name=job_name)

        # Or run the command locally and wait for it to complete:
        # subprocess.run(cmd, shell=True, check=True)
    except KeyboardInterrupt:
        print("Interrupted by user")
        sys.exit(1)
    # except subprocess.CalledProcessError:
    #     pass