# Global run settings. The meanings noted below are inferred from the key
# names only; confirm against the code that loads this file.
class_dim: 100  # presumably the number of output classes
total_images: 50000  # presumably the size of the training set
epochs: 1000
topk: 5  # presumably the k used for top-k accuracy reporting
save_model_dir: ./output/
# Canonical lowercase boolean; parses to the same value as `True` under
# YAML 1.1 and the YAML 1.2 core schema, and is also accepted by strict loaders.
use_gpu: true
model_type: cls_distill

# Learning-rate configuration. Presumably `function` selects the schedule and
# `params` holds its arguments; the loader is not shown here, so confirm.
LEARNING_RATE:
    function: 'Cosine'
    params:
        lr: 0.001
        # NOTE(review): confirm that the 'Cosine' schedule actually consumes
        # warmup_epoch; if the loader ignores unknown params, this has no effect.
        warmup_epoch: 5

# Optimizer configuration. Presumably `function` selects the optimizer and
# `params` is handed to it; confirm against the loader.
OPTIMIZER:
    function: 'Momentum'
    params:
        momentum: 0.9
    # `regularizer` is a sibling of `params`, not nested inside it.
    regularizer:
        function: 'L2'
        # Plain decimal float (2e-05); presumably the weight-decay coefficient.
        factor: 0.00002

# Training-phase data settings.
# NOTE(review): confirm whether batch_size is the global batch or per device.
TRAIN:
    batch_size: 1280
    num_workers: 4

# Validation-phase data settings; uses a much smaller batch_size than TRAIN.
# NOTE(review): confirm whether batch_size is the global batch or per device.
VALID:
    batch_size: 64
    num_workers: 4