experiments.configs.utils

experiments/configs/utils.py
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100	import copy from configs.algorithm import algorithm_defaults from configs.data_loader import loader_defaults from configs.datasets import dataset_defaults from configs.model import model_defaults from configs.scheduler import scheduler_defaults def populate_defaults(config): """Populates hyperparameters with defaults implied by choices of other hyperparameters.""" orig_config = copy.deepcopy(config) assert config.dataset is not None, 'dataset must be specified' assert config.algorithm is not None, 'algorithm must be specified' # implied defaults from choice of dataset config = populate_config( config, dataset_defaults[config.dataset] ) # implied defaults from choice of algorithm config = populate_config( config, algorithm_defaults[config.algorithm] ) # implied defaults from choice of loader config = populate_config( config, loader_defaults ) # implied defaults from choice of model if config.model: config = populate_config( config, model_defaults[config.model], ) # implied defaults from choice of scheduler if config.scheduler: config = populate_config( config, scheduler_defaults[config.scheduler] ) # misc implied defaults if config.groupby_fields is None: config.no_group_logging = True config.no_group_logging = bool(config.no_group_logging) # basic checks required_fields = [ 'split_scheme', 'train_loader', 'uniform_over_groups', 'batch_size', 'eval_loader', 'model', 'loss_function', 'val_metric', 'val_metric_decreasing', 'n_epochs', 'optimizer', 'lr', 'weight_decay', ] for field in required_fields: assert getattr(config, field) is not None, f"Must manually specify {field} for this setup." # data loader validations # we only raise this error if the train_loader is standard, and # n_groups_per_batch or distinct_groups are # specified by the user (instead of populated as a default) if config.train_loader == 'standard': if orig_config.n_groups_per_batch is not None: raise ValueError( "n_groups_per_batch cannot be specified if the data loader is 'standard'. Consider using a 'group' data loader instead.") if orig_config.distinct_groups is not None: raise ValueError( "distinct_groups cannot be specified if the data loader is 'standard'. Consider using a 'group' data loader instead.") return config def populate_config(config, template: dict, force_compatibility=False): """Populates missing (key, val) pairs in config with (key, val) in template. Example usage: populate config with defaults Args: - config: namespace - template: dict - force_compatibility: option to raise errors if config.key != template[key] """ if template is None: return config d_config = vars(config) for key, val in template.items(): if not isinstance(val, dict): # config[key] expected to be a non-index-able if key not in d_config or d_config[key] is None: d_config[key] = val elif d_config[key] != val and force_compatibility: raise ValueError(f"Argument {key} must be set to {val}") else: # config[key] expected to be a kwarg dict for kwargs_key, kwargs_val in val.items(): if kwargs_key not in d_config[key] or d_config[key][kwargs_key] is None: d_config[key][kwargs_key] = kwargs_val elif d_config[key][kwargs_key] != kwargs_val and force_compatibility: raise ValueError(f"Argument {key}[{kwargs_key}] must be set to {val}") return config

experiments/configs/utils.py

import copy

from configs.algorithm import algorithm_defaults
from configs.data_loader import loader_defaults
from configs.datasets import dataset_defaults
from configs.model import model_defaults
from configs.scheduler import scheduler_defaults


def populate_defaults(config):
    """Populates hyperparameters with defaults implied by choices
    of other hyperparameters."""

    orig_config = copy.deepcopy(config)
    assert config.dataset is not None, 'dataset must be specified'
    assert config.algorithm is not None, 'algorithm must be specified'

    # implied defaults from choice of dataset
    config = populate_config(
        config,
        dataset_defaults[config.dataset]
    )

    # implied defaults from choice of algorithm
    config = populate_config(
        config,
        algorithm_defaults[config.algorithm]
    )

    # implied defaults from choice of loader
    config = populate_config(
        config,
        loader_defaults
    )
    # implied defaults from choice of model
    if config.model: config = populate_config(
        config,
        model_defaults[config.model],
    )

    # implied defaults from choice of scheduler
    if config.scheduler: config = populate_config(
        config,
        scheduler_defaults[config.scheduler]
    )

    # misc implied defaults
    if config.groupby_fields is None:
        config.no_group_logging = True
    config.no_group_logging = bool(config.no_group_logging)

    # basic checks
    required_fields = [
        'split_scheme', 'train_loader', 'uniform_over_groups', 'batch_size', 'eval_loader', 'model', 'loss_function',
        'val_metric', 'val_metric_decreasing', 'n_epochs', 'optimizer', 'lr', 'weight_decay',
    ]
    for field in required_fields:
        assert getattr(config, field) is not None, f"Must manually specify {field} for this setup."

    # data loader validations
    # we only raise this error if the train_loader is standard, and
    # n_groups_per_batch or distinct_groups are
    # specified by the user (instead of populated as a default)
    if config.train_loader == 'standard':
        if orig_config.n_groups_per_batch is not None:
            raise ValueError(
                "n_groups_per_batch cannot be specified if the data loader is 'standard'. Consider using a 'group' data loader instead.")
        if orig_config.distinct_groups is not None:
            raise ValueError(
                "distinct_groups cannot be specified if the data loader is 'standard'. Consider using a 'group' data loader instead.")

    return config


def populate_config(config, template: dict, force_compatibility=False):
    """Populates missing (key, val) pairs in config with (key, val) in template.
    Example usage: populate config with defaults
    Args:
        - config: namespace
        - template: dict
        - force_compatibility: option to raise errors if config.key != template[key]
    """
    if template is None:
        return config

    d_config = vars(config)
    for key, val in template.items():
        if not isinstance(val, dict):  # config[key] expected to be a non-index-able
            if key not in d_config or d_config[key] is None:
                d_config[key] = val
            elif d_config[key] != val and force_compatibility:
                raise ValueError(f"Argument {key} must be set to {val}")

        else:  # config[key] expected to be a kwarg dict
            for kwargs_key, kwargs_val in val.items():
                if kwargs_key not in d_config[key] or d_config[key][kwargs_key] is None:
                    d_config[key][kwargs_key] = kwargs_val
                elif d_config[key][kwargs_key] != kwargs_val and force_compatibility:
                    raise ValueError(f"Argument {key}[{kwargs_key}] must be set to {val}")
    return config