| arch: vit_small | |
| backend: nccl | |
| batch_size_per_gpu: 100 | |
| clip_grad: 0.0 | |
| data_path: /path/to/imagenet/ | |
| dist_url: env:// | |
| drop_path_rate: 0.1 | |
| epochs: 100 | |
| eval_every: 30 | |
| freeze_last_layer: 1 | |
| gamma: 1.25 | |
| global_crops_scale: | |
| - 0.25 | |
| - 1.0 | |
| local_crops_number: 6 | |
| local_crops_scale: | |
| - 0.05 | |
| - 0.25 | |
| local_rank: 0 | |
| lr: 0.0005 | |
| min_lr: 1.0e-05 | |
| mode: simpool | |
| momentum_teacher: 0.996 | |
| nb_knn: | |
| - 10 | |
| - 20 | |
| - 100 | |
| - 200 | |
| norm_last_layer: false | |
| num_workers: 10 | |
| optimizer: adamw | |
| out_dim: 65536 | |
| output_dir: /path/to/output/ | |
| patch_size: 16 | |
| saveckp_freq: 20 | |
| seed: 0 | |
| subset: -1 | |
| teacher_temp: 0.07 | |
| temperature: 0.07 | |
| use_bn_in_head: false | |
| use_fp16: false | |
| warmup_epochs: 10 | |
| warmup_teacher_temp: 0.04 | |
| warmup_teacher_temp_epochs: 30 | |
| weight_decay: 0.04 | |
| weight_decay_end: 0.4 | |