mittagessen
diff --git a/‎kraken/ketos/__init__.py‎
Lines changed: 38 additions & 17 deletions b/‎kraken/ketos/__init__.py‎
Lines changed: 38 additions & 17 deletions
diff --git a/‎kraken/ketos/dataset.py‎
Lines changed: 1 addition & 1 deletion b/‎kraken/ketos/dataset.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎kraken/ketos/pretrain.py‎
Lines changed: 57 additions & 103 deletions b/‎kraken/ketos/pretrain.py‎
Lines changed: 57 additions & 103 deletions
@@ -29,6 +29,7 @@
 from kraken.registry import PRECISIONS
 
 from .dataset import compile
+from .util import _load_config
 from .pretrain import pretrain
 from .recognition import test, train
 from .repo import publish
@@ -45,41 +46,61 @@
 # raise default max image size to 20k * 20k pixels
 Image.MAX_IMAGE_PIXELS = 20000 ** 2
 
+from kraken.configs import (Config,
+                            TrainingDataConfig,
+                            VGSLRecognitionTrainingConfig,
+                            VGSLRecognitionTrainingDataConfig,
+                            BLLASegmentationTrainingConfig,
+                            BLLASegmentationTrainingDataConfig)
+
+@click.group(context_settings=dict(show_default=True,
+                                   default_map={**Config().__dict__,
+                                                **TrainingDataConfig().__dict__,
+                                                'train': {**VGSLRecognitionTrainingConfig().__dict__, **VGSLRecognitionTrainingDataConfig().__dict__},
+                                                'test': VGSLRecognitionTrainingDataConfig().__dict__,
+                                                'segtrain': {**BLLASegmentationTrainingConfig().__dict__, **BLLASegmentationTrainingDataConfig().__dict__},
+                                                'segtest': {**BLLASegmentationTrainingConfig().__dict__, **BLLASegmentationTrainingDataConfig().__dict__}}))
 
-@click.group()
 @click.version_option()
 @click.pass_context
 @click.option('-v', '--verbose', default=0, count=True)
-@click.option('-d', '--device', default='cpu', show_default=True,
+@click.option('-d', '--device', show_default=True,
               help='Select device to use (cpu, cuda:0, cuda:1, ...)')
 @click.option('--precision',
-              show_default=True,
-              default='32-true',
               type=click.Choice(PRECISIONS),
               help='Numerical precision to use for training. Default is 32-bit single-point precision.')
-@click.option('--workers', show_default=True, default=1, type=click.IntRange(0), help='Number of data loading worker processes.')
-@click.option('--threads', show_default=True, default=1, type=click.IntRange(1), help='Maximum size of OpenMP/BLAS thread pool.')
+@click.option('--workers', 'num_workers', type=click.IntRange(0), help='Number of data loading worker processes.')
+@click.option('--threads', 'num_threads', type=click.IntRange(1), help='Maximum size of OpenMP/BLAS thread pool.')
 @click.option('-s', '--seed', default=None, type=click.INT,
               help='Seed for numpy\'s and torch\'s RNG. Set to a fixed value to '
                    'ensure reproducible random splits of data')
-@click.option('-r', '--deterministic/--no-deterministic', default=False,
+@click.option('-r', '--deterministic/--no-deterministic',
               help="Enables deterministic training. If no seed is given and enabled the seed will be set to 42.")
-def cli(ctx, verbose, device, precision, workers, threads, seed, deterministic):
-    ctx.meta['deterministic'] = False if not deterministic else 'warn'
-    if seed:
+@click.option('--config',
+              type=click.File(mode='r', lazy=True),
+              help="Path to configuration file.",
+              callback=_load_config,
+              is_eager=True,
+              expose_value=False,
+              required=False)
+def cli(ctx, **kwargs):
+    params = ctx.params
+
+    ctx.meta['deterministic'] = False if not params['deterministic'] else 'warn'
+    if params['seed']:
         from lightning.pytorch import seed_everything
         seed_everything(seed, workers=True)
-    elif deterministic:
+    elif params['deterministic']:
         from lightning.pytorch import seed_everything
         seed_everything(42, workers=True)
 
-    ctx.meta['verbose'] = verbose
-    ctx.meta['device'] = device
-    ctx.meta['precision'] = precision
-    ctx.meta['workers'] = workers
-    ctx.meta['threads'] = threads
+    ctx.meta['verbose'] = params.get('verbose')
+    ctx.meta['device'] = params.get('device')
+    ctx.meta['precision'] = params.get('precision')
+    ctx.meta['num_workers'] = params.get('num_workers')
+    ctx.meta['num_threads'] = params.get('num_threads')
 
-    log.set_logger(logger, level=30 - min(10 * verbose, 20))
+    log.set_logger(logger, level=30 - min(10 * params['verbose'], 20))
 
 
 cli.add_command(compile)
 
@@ -92,7 +92,7 @@ def _update_bar(advance, total):
         arrow_dataset.build_binary_dataset(ground_truth,
                                            output,
                                            format_type,
-                                           ctx.meta['workers'],
+                                           ctx.meta['num_workers'],
                                            save_splits,
                                            random_split,
                                            force_type,
 
@@ -24,8 +24,6 @@
 from PIL import Image
 
 from kraken.registry import OPTIMIZERS, SCHEDULERS, STOPPERS
-from kraken.lib.default_specs import (RECOGNITION_PRETRAIN_HYPER_PARAMS,
-                                      RECOGNITION_SPEC)
 
 from .util import _expand_gt, _validate_manifests, message, to_ptl_device
 
@@ -38,136 +36,118 @@
 
 @click.command('pretrain')
 @click.pass_context
-@click.option('-B', '--batch-size', show_default=True, type=click.INT,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['batch_size'], help='batch sample size')
-@click.option('--pad', show_default=True, type=click.INT,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['pad'],
-              help='Left and right padding around lines')
-@click.option('-o', '--output', show_default=True, type=click.Path(), default='model', help='Output model file')
-@click.option('-s', '--spec', show_default=True, default=RECOGNITION_SPEC,
-              help='VGSL spec of the network to train.')
-@click.option('-i', '--load', show_default=True, type=click.Path(exists=True,
-              readable=True), help='Load existing file to continue training')
-@click.option('-F', '--freq', show_default=True, default=RECOGNITION_PRETRAIN_HYPER_PARAMS['freq'], type=click.FLOAT,
+@click.option('-B', '--batch-size', type=int, help='batch sample size')
+@click.option('--pad', 'padding', type=int, help='Left and right padding around lines')
+@click.option('-o', '--output', 'checkpoint_path', type=click.Path(), help='Output checkpoint path')
+@click.option('-s', '--spec', help='VGSL spec of the network to train.')
+@click.option('-i', '--load', type=click.Path(exists=True, readable=True),
+              help='Load existing file to continue training')
+@click.option('-F',
+              '--freq',
+              type=float,
               help='Model saving and report generation frequency in epochs '
                    'during training. If frequency is >1 it must be an integer, '
                    'i.e. running validation every n-th epoch.')
 @click.option('-q',
               '--quit',
-              show_default=True,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['quit'],
               type=click.Choice(STOPPERS),
               help='Stop condition for training. Set to `early` for early stooping or `fixed` for fixed number of epochs')
 @click.option('-N',
               '--epochs',
-              show_default=True,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['epochs'],
+              type=int,
               help='Number of epochs to train for')
 @click.option('--min-epochs',
-              show_default=True,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['min_epochs'],
+              type=int,
               help='Minimal number of epochs to train for when using early stopping.')
 @click.option('--lag',
-              show_default=True,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['lag'],
+              type=int,
               help='Number of evaluations (--report frequency) to wait before stopping training without improvement')
 @click.option('--min-delta',
-              show_default=True,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['min_delta'],
-              type=click.FLOAT,
+              type=float,
               help='Minimum improvement between epochs to reset early stopping. Default is scales the delta by the best loss')
 @click.option('--optimizer',
-              show_default=True,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['optimizer'],
               type=click.Choice(OPTIMIZERS),
               help='Select optimizer')
-@click.option('-r', '--lrate', show_default=True, default=RECOGNITION_PRETRAIN_HYPER_PARAMS['lrate'], help='Learning rate')
-@click.option('-m', '--momentum', show_default=True, default=RECOGNITION_PRETRAIN_HYPER_PARAMS['momentum'], help='Momentum')
-@click.option('-w', '--weight-decay', show_default=True, type=float,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['weight_decay'], help='Weight decay')
-@click.option('--warmup', show_default=True, type=float,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['warmup'], help='Number of samples to ramp up to `lrate` initial learning rate.')
+@click.option('-r',
+              '--lrate',
+              type=float,
+              help='Learning rate')
+@click.option('-m',
+              '--momentum',
+              type=float,
+              help='Momentum')
+@click.option('-w',
+              '--weight-decay',
+              type=float, help='Weight decay')
+@click.option('--warmup',
+              type=float,
+              help='Number of samples to ramp up to `lrate` initial learning rate.')
 @click.option('--schedule',
-              show_default=True,
               type=click.Choice(SCHEDULERS),
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['schedule'],
               help='Set learning rate scheduler. For 1cycle, cycle length is determined by the `--epoch` option.')
 @click.option('-g',
               '--gamma',
-              show_default=True,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['gamma'],
+              type=float,
               help='Decay factor for exponential, step, and reduceonplateau learning rate schedules')
 @click.option('-ss',
               '--step-size',
-              show_default=True,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['step_size'],
+              type=int,
               help='Number of validation runs between learning rate decay for exponential and step LR schedules')
 @click.option('--sched-patience',
-              show_default=True,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['rop_patience'],
+              'rop_patience',
+              type=int,
               help='Minimal number of validation runs between LR reduction for reduceonplateau LR schedule.')
 @click.option('--cos-max',
-              show_default=True,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['cos_t_max'],
+              'cos_max_t',
+              type=int,
               help='Epoch of minimal learning rate for cosine LR scheduler.')
 @click.option('--cos-min-lr',
-              show_default=True,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['cos_min_lr'],
+              type=float,
               help='Minimal final learning rate for cosine LR scheduler.')
-@click.option('-p', '--partition', show_default=True, default=0.9,
+@click.option('-p',
+              '--partition',
+              type=float,
               help='Ground truth data partition ratio between train/validation set')
-@click.option('--fixed-splits/--ignore-fixed-splits', show_default=True, default=False,
+@click.option('--fixed-splits/--ignore-fixed-splits', default=False,
               help='Whether to honor fixed splits in binary datasets.')
-@click.option('-t', '--training-files', show_default=True, default=None, multiple=True,
+@click.option('-t', '--training-files', default=None, multiple=True,
               callback=_validate_manifests, type=click.File(mode='r', lazy=True),
               help='File(s) with additional paths to training data')
-@click.option('-e', '--evaluation-files', show_default=True, default=None, multiple=True,
+@click.option('-e', '--evaluation-files', default=None, multiple=True,
               callback=_validate_manifests, type=click.File(mode='r', lazy=True),
               help='File(s) with paths to evaluation data. Overrides the `-p` parameter')
-@click.option('--load-hyper-parameters/--no-load-hyper-parameters', show_default=True, default=False,
+@click.option('--load-hyper-parameters/--no-load-hyper-parameters', default=False,
               help='When loading an existing model, retrieve hyperparameters from the model')
-@click.option('--force-binarization/--no-binarization', show_default=True,
-              default=False, help='Forces input images to be binary, otherwise '
-              'the appropriate color format will be auto-determined through the '
-              'network specification. Will be ignored in `path` mode.')
-@click.option('-f', '--format-type', type=click.Choice(['path', 'xml', 'alto', 'page', 'binary']), default='path',
+@click.option('-f', '--format-type', type=click.Choice(['path', 'xml', 'alto', 'page', 'binary']),
               help='Sets the training data format. In ALTO and PageXML mode all '
               'data is extracted from xml files containing both line definitions and a '
               'link to source images. In `path` mode arguments are image files '
               'sharing a prefix up to the last extension with `.gt.txt` text files '
               'containing the transcription. In binary mode files are datasets '
               'files containing pre-extracted text lines.')
 @click.option('--augment/--no-augment',
-              show_default=True,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['augment'],
               help='Enable image augmentation')
-@click.option('-mw', '--mask-width', show_default=True,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['mask_width'],
+@click.option('-mw',
+              '--mask-width',
+              type=int,
               help='Width of sampled masks at scale of the sampled tensor, e.g. '
                    '4X subsampling in convolutional layers with mask width 3 results '
                    'in an effective mask width of 12.')
-@click.option('-mp', '--mask-probability',
-              show_default=True,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['mask_prob'],
+@click.option('-mp',
+              '--mask-probability',
+              type=float,
               help='Probability of a particular position being the start position of a mask.')
-@click.option('-nn', '--num-negatives',
-              show_default=True,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['num_negatives'],
+@click.option('-nn',
+              '--num-negatives',
+              type=int,
               help='Number of negative samples for the contrastive loss.')
-@click.option('-lt', '--logit-temp',
-              show_default=True,
-              default=RECOGNITION_PRETRAIN_HYPER_PARAMS['logit_temp'],
+@click.option('-lt',
+              '--logit-temp',
+              type=float,
               help='Multiplicative factor for the logits used in contrastive loss.')
+@click.option('--legacy-polygons', default=False, is_flag=True, help='Use the legacy polygon extractor.')
 @click.argument('ground_truth', nargs=-1, callback=_expand_gt, type=click.Path(exists=False, dir_okay=False))
-@click.option('--legacy-polygons', show_default=True, default=False, is_flag=True, help='Use the legacy polygon extractor.')
-def pretrain(ctx, batch_size, pad, output, spec, load, freq, quit, epochs,
-             min_epochs, lag, min_delta, optimizer, lrate, momentum,
-             weight_decay, warmup, schedule, gamma, step_size, sched_patience,
-             cos_max, cos_min_lr, partition, fixed_splits, training_files,
-             evaluation_files, load_hyper_parameters,
-             force_binarization, format_type, augment, mask_probability,
-             mask_width, num_negatives, logit_temp, ground_truth,
-             legacy_polygons):
+def pretrain(ctx, **kwargs):
     """
     Trains a model from image-text pairs.
     """
@@ -188,32 +168,6 @@ def pretrain(ctx, batch_size, pad, output, spec, load, freq, quit, epochs,
                                      RecognitionPretrainModel)
     from kraken.lib.train import KrakenTrainer
 
-    hyper_params = RECOGNITION_PRETRAIN_HYPER_PARAMS.copy()
-    hyper_params.update({'freq': freq,
-                         'pad': pad,
-                         'batch_size': batch_size,
-                         'quit': quit,
-                         'epochs': epochs,
-                         'min_epochs': min_epochs,
-                         'lag': lag,
-                         'min_delta': min_delta,
-                         'optimizer': optimizer,
-                         'lrate': lrate,
-                         'momentum': momentum,
-                         'weight_decay': weight_decay,
-                         'warmup': warmup,
-                         'schedule': schedule,
-                         'gamma': gamma,
-                         'step_size': step_size,
-                         'rop_patience': sched_patience,
-                         'cos_t_max': cos_max,
-                         'cos_min_lr': cos_min_lr,
-                         'augment': augment,
-                         'mask_prob': mask_probability,
-                         'mask_width': mask_width,
-                         'num_negatives': num_negatives,
-                         'logit_temp': logit_temp})
-
     # disable automatic partition when given evaluation set explicitly
     if evaluation_files:
         partition = 1
@@ -250,7 +204,7 @@ def pretrain(ctx, batch_size, pad, output, spec, load, freq, quit, epochs,
                                      evaluation_data=evaluation_files,
                                      partition=partition,
                                      binary_dataset_split=fixed_splits,
-                                     num_workers=ctx.meta['workers'],
+                                     num_workers=ctx.meta['num_workers'],
                                      height=model.height,
                                      width=model.width,
                                      channels=model.channels,