Base Configurations

We can integrate tyro.cli() into common configuration patterns: here, we select one of multiple possible base configurations, create a subcommand for each, and then use the CLI to either override existing values or fill in missing ones.

from dataclasses import dataclass
from typing import Callable, Literal

from torch import nn

import tyro


@dataclass(frozen=True)
class AdamOptimizer:
    learning_rate: float = 1e-3
    betas: tuple[float, float] = (0.9, 0.999)


@dataclass(frozen=True)
class ExperimentConfig:
    # Dataset to run experiment on.
    dataset: Literal["mnist", "imagenet-50"]

    # Optimizer parameters.
    optimizer: AdamOptimizer

    # Model size.
    num_layers: int
    units: int

    # Batch size.
    batch_size: int

    # Total number of training steps.
    train_steps: int

    # Random seed. This is helpful for making sure that our experiments are all
    # reproducible!
    seed: int

    # Activation to use. Not specifiable via the commandline.
    activation: Callable[[], nn.Module]


# Note that we could also define this config library using separate YAML files (similar
# to `config_path`/`config_name` in Hydra), but staying in Python enables seamless type
# checking + IDE support.
Configs = tyro.extras.subcommand_type_from_defaults(
    {
        "small": ExperimentConfig(
            dataset="mnist",
            optimizer=AdamOptimizer(),
            batch_size=2048,
            num_layers=4,
            units=64,
            train_steps=30_000,
            seed=0,
            activation=nn.ReLU,
        ),
        "big": ExperimentConfig(
            dataset="imagenet-50",
            optimizer=AdamOptimizer(),
            batch_size=32,
            num_layers=8,
            units=256,
            train_steps=100_000,
            seed=0,
            activation=nn.GELU,
        ),
    }
)

if __name__ == "__main__":
    config = tyro.cli(Configs)
    print(config)
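
As a hypothetical extension (not part of the example above), the parsed config can feed directly into ordinary training code, with full type checking and IDE support on every field. A minimal sketch, assuming the ExperimentConfig and Configs definitions above; make_mlp and the input/output sizes are illustrative placeholders:

import torch
from torch import nn

import tyro


def make_mlp(config: ExperimentConfig) -> nn.Sequential:
    # Build a toy MLP from the parsed config. The 28*28 input and 10-class
    # output are placeholders; a real script would derive them from
    # config.dataset.
    layers: list[nn.Module] = []
    in_features = 28 * 28
    for _ in range(config.num_layers):
        layers.append(nn.Linear(in_features, config.units))
        layers.append(config.activation())
        in_features = config.units
    layers.append(nn.Linear(in_features, 10))
    return nn.Sequential(*layers)


if __name__ == "__main__":
    config = tyro.cli(Configs)
    torch.manual_seed(config.seed)
    model = make_mlp(config)
    print(model)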

python 03_config_systems/01_base_configs.py --help
usage: 01_base_configs.py [-h] {small,big}

╭─ options ──────────────────────────────────────────╮
│ -h, --help         show this help message and exit │
╰────────────────────────────────────────────────────╯
╭─ subcommands ──────────────────────────────────────╮
│ {small,big}                                        │
│     small                                          │
│     big                                            │
╰────────────────────────────────────────────────────╯

python 03_config_systems/01_base_configs.py small --help
usage: 01_base_configs.py small [-h] [SMALL OPTIONS]

╭─ options ──────────────────────────────────────────────────────────────────╮
│ -h, --help              show this help message and exit                    │
│ --dataset {mnist,imagenet-50}                                              │
│                         Dataset to run experiment on. (default: mnist)     │
│ --num-layers INT        Model size. (default: 4)                           │
│ --units INT             Model size. (default: 64)                          │
│ --batch-size INT        Batch size. (default: 2048)                        │
│ --train-steps INT       Total number of training steps. (default: 30000)   │
│ --seed INT              Random seed. This is helpful for making sure that  │
│                         our experiments are all reproducible! (default: 0) │
│ --activation {fixed}    Activation to use. Not specifiable via the         │
│                         commandline. (fixed to: <class                     │
│                         'torch.nn.modules.activation.ReLU'>)               │
╰────────────────────────────────────────────────────────────────────────────╯
╭─ optimizer options ────────────────────────────────────────────────────────╮
│ Optimizer parameters.                                                      │
│ ────────────────────────────────────────────                               │
│ --optimizer.learning-rate FLOAT                                            │
│                         (default: 0.001)                                   │
│ --optimizer.betas FLOAT FLOAT                                              │
│                         (default: 0.9 0.999)                               │
╰────────────────────────────────────────────────────────────────────────────╯

python 03_config_systems/01_base_configs.py small --seed 94720
ExperimentConfig(dataset='mnist', optimizer=AdamOptimizer(learning_rate=0.001, betas=(0.9, 0.999)), num_layers=4, units=64, batch_size=2048, train_steps=30000, seed=94720, activation=<class 'torch.nn.modules.activation.ReLU'>)
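
Nested fields can be overridden with dotted flags in the same way; for example (output not shown here), the learning rate in the small config could be changed with:

python 03_config_systems/01_base_configs.py small --optimizer.learning-rate 3e-4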

python 03_config_systems/01_base_configs.py big --help
usage: 01_base_configs.py big [-h] [BIG OPTIONS]

╭─ options ──────────────────────────────────────────────────────────────────╮
│ -h, --help              show this help message and exit                    │
│ --dataset {mnist,imagenet-50}                                              │
│                         Dataset to run experiment on. (default:            │
│                         imagenet-50)                                       │
│ --num-layers INT        Model size. (default: 8)                           │
│ --units INT             Model size. (default: 256)                         │
│ --batch-size INT        Batch size. (default: 32)                          │
│ --train-steps INT       Total number of training steps. (default: 100000)  │
│ --seed INT              Random seed. This is helpful for making sure that  │
│                         our experiments are all reproducible! (default: 0) │
│ --activation {fixed}    Activation to use. Not specifiable via the         │
│                         commandline. (fixed to: <class                     │
│                         'torch.nn.modules.activation.GELU'>)               │
╰────────────────────────────────────────────────────────────────────────────╯
╭─ optimizer options ────────────────────────────────────────────────────────╮
│ Optimizer parameters.                                                      │
│ ────────────────────────────────────────────                               │
│ --optimizer.learning-rate FLOAT                                            │
│                         (default: 0.001)                                   │
│ --optimizer.betas FLOAT FLOAT                                              │
│                         (default: 0.9 0.999)                               │
╰────────────────────────────────────────────────────────────────────────────╯

python 03_config_systems/01_base_configs.py big --seed 94720
ExperimentConfig(dataset='imagenet-50', optimizer=AdamOptimizer(learning_rate=0.001, betas=(0.9, 0.999)), num_layers=8, units=256, batch_size=32, train_steps=100000, seed=94720, activation=<class 'torch.nn.modules.activation.GELU'>)