parse_tools.py

import argparse

top_usage = """
Usage: train.py {new|resume} [options]

train.py new [options] 
   -- train a new model
train.py resume [options]
   -- resume training from .ckpt file 
"""

test_usage = """
Usage: test.py {inverter} [options]

test.py inverter [options]
   -- generate samples from the mfcc_inverter model
"""


# Training options common to both "new" and "resume" training modes
def train_parser():
    train = argparse.ArgumentParser(add_help=False)

    # integer arguments
    iargs = [ 
        ('nb', 'n-batch', None),
        ('nw', 'n-win-batch', 100),
        ('ms', 'max-steps', 1e20),
        ('si', 'save-interval', 1000),
        ('pi', 'progress-interval', 1),
        ('rnd', 'random-seed', 2507),
        # VAE-specific Bottleneck
        ('fn', 'bn-free-nats', 9)
    ]
    

    # other arguments
    args = [ 
        ('hw', 'hwtype', str, None, 'STR', 'GPU'),
        ('lrs', 'learning-rate-steps', int, '+', 'INT', [0, 4e6, 6e6, 8e6]),
        ('lrr', 'learning-rate-rates', float, '+', 'FLOAT', [4e-4, 2e-4, 1e-4, 5e-5]),
        ('aws', 'bn-anneal-weight-steps', int, '+',
            'INT', [0, 2e3, 4e3, 6e3, 8e3, 1e4, 2e4, 3e4, 4e4, 5e4, 6e4]),
        ('awv', 'bn-anneal-weight-vals', float, '+',
            'FLOAT', [0, 0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1.0]
            )
    ]

    # help messages
    hmsg = {
        'nb': 'Batch size',
        'nw': '# of consecutive window samples in one slice',
        'ms': 'Maximum number of training steps',
        'si': 'Save a checkpoint after this many steps each time',
        'pi': 'Print a progress message at this interval',
        'rnd': 'Random seed for weights initialization etc',
        'fn': 'number of free nats in KL divergence that are not penalized',
        'hw': 'Harware target, one of CPU, GPU, or TPU',
        'lrs': 'Learning rate starting steps to apply --learning-rate-rates',
        'lrr': 'Each of these learning rates will be applied at the '
                'corresponding value for --learning-rate-steps',
        'aws': 'Learning rate starting steps to apply --anneal-weight-vals',
        'awv': 'Each of these anneal weights will be applied at the '
               'corresponding step for --anneal-weight-steps'
    }

    for sopt, lopt, t, n, meta, d in args:
        train.add_argument('--' + lopt, '-' + sopt, type=t, nargs=n,
                metavar=meta, default=d, help=hmsg[sopt])

    for sopt, lopt, d in iargs:
        train.add_argument('--' + lopt, '-' + sopt, type=int, nargs=None,
                metavar='INT', default=d, help=hmsg[sopt])

    train.add_argument('ckpt_template', type=str,
            metavar='CHECKPOINT_TEMPLATE',
            help="Full or relative path, including a filename template, containing "
            "a single %%, which will be replaced by the step number.")

    return train

# Complete parser for cold-start mode
def cold_parser():
    tp = train_parser()
    cold = argparse.ArgumentParser(parents=[tp])

    cold.add_argument('--arch-file', '-af', type=str, metavar='ARCH_FILE',
            help='INI file specifying architectural parameters')
    cold.add_argument('--train-file', '-tf', type=str, metavar='TRAIN_FILE',
            help='INI file specifying training and other hyperparameters')

    # Preprocessing parameters
    cold.add_argument('--pre-sample-rate', '-sr', type=int, metavar='INT', default=16000,
            help='# samples per second in input wav files')
    cold.add_argument('--pre-mfcc-win-sz', '-wl', type=int, metavar='INT', default=400,
            help='size of the MFCC window length in timesteps')
    cold.add_argument('--pre-mfcc-hop-sz', '-hl', type=int, metavar='INT', default=160,
            help='size of the hop length for MFCC preprocessing, in timesteps')
    cold.add_argument('--pre-n-mels', '-nm', type=int, metavar='INT', default=80,
            help='number of mel frequency values to calculate')
    cold.add_argument('--pre-n-mfcc', '-nf', type=int, metavar='INT', default=13,
            help='number of mfcc values to calculate')
    cold.prog += ' new'

    # Encoder architectural parameters
    cold.add_argument('--enc-n-out', '-no', type=int, metavar='INT', default=768,
            help='number of output channels')

    cold.add_argument('--global-model', '-gm', type=str, metavar='STR',
            default='autoencoder',
            help='type of model (autoencoder or mfcc_inverter)')

    # Bottleneck architectural parameters
    cold.add_argument('--bn-type', '-bt', type=str, metavar='STR',
            default='none',
            help='bottleneck type (one of "ae", "vae", "vqvae", or "none")')
    cold.add_argument('--bn-n-out', '-bo', type=int, metavar='INT', default=64,
            help='number of output channels for the bottleneck')
    cold.add_argument('--bn-vq-gamma', '-vqb', type=float, metavar='FLOAT', default=0.25,
            help='beta multiplier for commitment loss term, Eq 3 from Chorowski et al.')
    cold.add_argument('--bn-vq-n-embed', '-vqn', type=int, metavar='INT', default=4096,
            help='number of embedding vectors, K, in section 3.1 of VQVAE paper')

    # Parameters exclusive to Mfcc Inverter
    cold.add_argument('--mi-n-lc-in', '-mli', type=int, metavar='INT', default=-1,
            help='decoder number of local conditioning input channels')

    # Decoder architectural parameters (also used for mfccInverter)
    cold.add_argument('--jitter-prob', '-jp', type=float, metavar='FLOAT',
            default=0.12,
            help='replacement probability for time-jitter regularization')
    cold.add_argument('--dec-filter-sz', '-dfs', type=int, metavar='INT', default=2,
            help='decoder number of dilation kernel elements')
    # !!! This is set equal to --bn-n-out
    cold.add_argument('--dec-n-lc-out', '-dlo', type=int, metavar='INT', default=-1,
            help='decoder number of local conditioning output channels')
    cold.add_argument('--dec-n-res', '-dnr', type=int, metavar='INT', default=-1,
            help='decoder number of residual channels')
    cold.add_argument('--dec-n-dil', '-dnd', type=int, metavar='INT', default=-1,
            help='decoder number of dilation channels')
    cold.add_argument('--dec-n-skp', '-dns', type=int, metavar='INT', default=-1,
            help='decoder number of skip channels')
    cold.add_argument('--dec-n-post', '-dnp', type=int, metavar='INT', default=-1,
            help='decoder number of post-processing channels')
    cold.add_argument('--dec-n-quant', '-dnq', type=int, metavar='INT', 
            help='decoder number of input channels')
    cold.add_argument('--dec-n-blocks', '-dnb', type=int, metavar='INT',
            help='decoder number of dilation blocks')
    cold.add_argument('--dec-n-block-layers', '-dnl', type=int, metavar='INT', 
            help='decoder number of power-of-two dilated '
            'convolutions in each layer')
    cold.add_argument('--dec-n-global-embed', '-dng', type=int, metavar='INT',
            help='decoder number of global embedding channels')

    # MFCC parameters
    cold.add_argument('--win-size', '-ws', type=int, metavar='INT',
            default=400,
            help='Number of timesteps used to calculate MFCC coefficients')
    cold.add_argument('--hop-size', '-hs', type=int, metavar='INT',
            default=160,
            help='Number of timesteps to hop between consecutive MFCC coefficients')

    # positional arguments
    cold.add_argument('dat_file', type=str, metavar='DAT_FILE',
            help='File created by preprocess.py')
    return cold

# Complete parser for resuming from Checkpoint
def resume_parser():
    tp = train_parser()
    resume = argparse.ArgumentParser(parents=[tp], add_help=True)
    resume.add_argument('ckpt_file', type=str, metavar='CHECKPOINT_FILE',
            help="""Checkpoint file generated from a previous run.  Restores model
            architecture, model parameters, and data generator state.""")
    resume.add_argument('dat_file', type=str, metavar='DAT_FILE',
            help='File created by preprocess.py')
    resume.prog += ' resume'
    return resume


def wav_gen_parser():
    wp = argparse.ArgumentParser(parents=[])
    wp.add_argument('ckpt_file', type=str, metavar='CHECKPOINT_FILE',
            help="""Checkpoint file generated from a previous run.  Restores model
            architecture, model parameters, and data generator state.""")
    wp.add_argument('dat_file', type=str, metavar='DAT_FILE',
            help='File created by preprocess.py')
    wp.add_argument('--dec-n-replicas', '-nsr', type=int, metavar='INT',
            default=1,
            help='Number of output to generate for each input datum')
    wp.add_argument('--output-dir', '-od', type=str, metavar='STR',
            default='.',
            help="Directory to write output .wav files")
    wp.add_argument('--hwtype', '-hw', type=str, metavar='STR',
            default='GPU',
            help='Hardware type (GPU, TPU-single or TPU)')
    wp.add_argument('--jit-script-path', '-js', type=str, metavar='STR',
            default=None,
            help='If provided, save jit script for the wavenet model here, and exit')
    wp.add_argument('--data-write-tmpl', '-dw', type=str, metavar='STR',
            default=None,
            help='If provided, save data batch tensors here')
    wp.add_argument('--n-timesteps', '-nt', type=int, metavar='INT',
            default=None,
            help='If provided, only infer for this many timesteps')

    return wp


def two_stage_parse(cold_parser, args=None):  
    '''wrapper for parse_args for overriding options from file'''
    default_opts = cold_parser.parse_args(args)

    cli_parser = argparse.ArgumentParser(parents=[cold_parser], add_help=False)
    dests = {co.dest:argparse.SUPPRESS for co in cli_parser._actions}
    cli_parser.set_defaults(**dests)
    cli_parser._defaults = {} # hack to overcome bug in set_defaults
    cli_opts = cli_parser.parse_args(args)

    # Each option follows the rule:
    # Use JSON file setting if present.  Otherwise, use command-line argument,
    # Otherwise, use command-line default
    import json
    try:
        with open(cli_opts.arch_file) as fp:
            arch_opts = json.load(fp)
    except AttributeError:
        arch_opts = {} 
    except FileNotFoundError:
        print("Error: Couldn't open arch parameters file {}".format(cli_opts.arch_file))
        exit(1)

    try:
        with open(cli_opts.train_file) as fp:
            train_opts = json.load(fp)
    except AttributeError:
        train_opts = {}
    except FileNotFoundError:
        print("Error: Couldn't open train parameters file {}".format(cli_opts.train_file))
        exit(1)

    # Override with command-line settings, then defaults
    merged_opts = vars(default_opts)
    merged_opts.update(arch_opts)
    merged_opts.update(train_opts)
    merged_opts.update(vars(cli_opts))

    # Convert back to a Namespace object
    return argparse.Namespace(**merged_opts) 
    # return cli_opts


def get_prefixed_items(d, pfx):
    '''select all items whose keys start with pfx, and strip that prefix'''
    return { k[len(pfx):]:v for k,v in d.items() if k.startswith(pfx) }