| aa: rand-m9-mstd0.5-inc1 |
| amp: false |
| amp_dtype: float16 |
| amp_impl: native |
| aot_autograd: false |
| aug_repeats: 0 |
| aug_splits: 0 |
| batch_size: 148 |
| bce_loss: false |
| bce_target_thresh: null |
| bn_eps: null |
| bn_momentum: null |
| channels_last: false |
| checkpoint_hist: 10 |
| class_map: '' |
| clip_grad: null |
| clip_mode: norm |
| color_jitter: 0.4 |
| cooldown_epochs: 0 |
| crop_pct: null |
| cutmix: 0.0 |
| cutmix_minmax: null |
| data: null |
| data_dir: /scratch/imagenet/ |
| dataset: torch/folder |
| dataset_download: false |
| decay_epochs: 90 |
| decay_milestones: |
| - 90 |
| - 180 |
| - 270 |
| decay_rate: 0.1 |
| dist_bn: reduce |
| drop: 0.1 |
| drop_block: null |
| drop_connect: null |
| drop_path: 0.1 |
| epoch_repeats: 0.0 |
| epochs: 300 |
| eval_metric: top1 |
| experiment: vits_gem1.25_supervised_ep300 |
| fast_norm: false |
| fuser: '' |
| gp: null |
| grad_checkpointing: false |
| hflip: 0.5 |
| img_size: null |
| in_chans: null |
| initial_checkpoint: '' |
| input_size: null |
| interpolation: '' |
| jsd_loss: false |
| layer_decay: null |
| local_rank: 0 |
| log_interval: 50 |
| log_wandb: false |
| lr: 0.0005 |
| lr_base: 0.1 |
| lr_base_scale: '' |
| lr_base_size: 256 |
| lr_cycle_decay: 0.5 |
| lr_cycle_limit: 1 |
| lr_cycle_mul: 1.0 |
| lr_k_decay: 1.0 |
| lr_noise: null |
| lr_noise_pct: 0.67 |
| lr_noise_std: 1.0 |
| mean: null |
| min_lr: 0 |
| mixup: 0.2 |
| mixup_mode: batch |
| mixup_off_epoch: 0 |
| mixup_prob: 1.0 |
| mixup_switch_prob: 0.5 |
| model: vit_small_patch16_224 |
| model_ema: true |
| model_ema_decay: 0.99996 |
| model_ema_force_cpu: false |
| model_kwargs: {} |
| momentum: 0.9 |
| no_aug: false |
| no_ddp_bb: false |
| no_prefetcher: false |
| no_resume_opt: false |
| num_classes: null |
| opt: adamw |
| opt_betas: null |
| opt_eps: null |
| opt_kwargs: {} |
| output: /scratch/bill.psomas/logs/ |
| patience_epochs: 10 |
| pin_mem: false |
| pretrained: false |
| ratio: |
| - 0.75 |
| - 1.3333333333333333 |
| recount: 1 |
| recovery_interval: 0 |
| remode: pixel |
| reprob: 0.25 |
| resplit: false |
| resume: '' |
| save_images: false |
| scale: |
| - 0.08 |
| - 1.0 |
| sched: cosine |
| sched_on_updates: false |
| seed: 42 |
| smoothing: 0.1 |
| split_bn: false |
| start_epoch: null |
| std: null |
| subset: -1 |
| sync_bn: false |
| torchcompile: null |
| torchscript: false |
| train_interpolation: random |
| train_split: train |
| tta: 0 |
| use_multi_epochs_loader: false |
| val_split: validation |
| validation_batch_size: null |
| vflip: 0.0 |
| warmup_epochs: 5 |
| warmup_lr: 1.0e-06 |
| warmup_prefix: false |
| weight_decay: 0.05 |
| worker_seeding: all |
| workers: 8 |
|
|