diff --git a/README_revenge.md b/README_revenge.md index 322e9e5..0a69075 100644 --- a/README_revenge.md +++ b/README_revenge.md @@ -78,18 +78,1330 @@ Training on ImageNet-1k: ``` python run_with_submitit.py --model deit_small_patch16_LS --data-path /path/to/imagenet --batch 256 --lr 4e-3 --epochs 800 --weight-decay 0.05 --sched cosine --input-size 224 --reprob 0.0 --node 1 --gpu 8 --smoothing 0.0 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt fusedlamb --warmup-lr 1e-6 --mixup .8 --drop-path 0.05 --cutmix 1.0 --unscale-lr --repeated-aug--bce-loss --color-jitter 0.3 --ThreeAugment ``` +
+ + logs + + +epoch 0: 0.1 + +epoch 5: 2.008 + +epoch 10: 9.258 + +epoch 15: 16.356 + +epoch 20: 24.752 + +epoch 25: 31.84 + +epoch 30: 38.52 + +epoch 35: 44.0 + +epoch 40: 48.034 + +epoch 45: 51.834 + +epoch 50: 53.628 + +epoch 55: 55.828 + +epoch 60: 57.12 + +epoch 65: 58.504 + +epoch 70: 59.218 + +epoch 75: 60.732 + +epoch 80: 60.98 + +epoch 85: 61.36 + +epoch 90: 61.842 + +epoch 95: 62.772 + +epoch 100: 63.122 + +epoch 105: 63.838 + +epoch 110: 63.902 + +epoch 115: 64.51 + +epoch 120: 64.822 + +epoch 125: 64.916 + +epoch 130: 65.518 + +epoch 135: 65.68 + +epoch 140: 65.796 + +epoch 145: 66.12 + +epoch 150: 66.18 + +epoch 155: 66.14 + +epoch 160: 66.666 + +epoch 165: 66.798 + +epoch 170: 66.974 + +epoch 175: 67.238 + +epoch 180: 67.446 + +epoch 185: 67.478 + +epoch 190: 67.656 + +epoch 195: 67.304 + +epoch 200: 67.9 + +epoch 205: 67.826 + +epoch 210: 68.372 + +epoch 215: 68.458 + +epoch 220: 68.764 + +epoch 225: 69.116 + +epoch 230: 69.016 + +epoch 235: 69.49 + +epoch 240: 69.296 + +epoch 245: 69.522 + +epoch 250: 69.678 + +epoch 255: 70.048 + +epoch 260: 69.648 + +epoch 265: 70.404 + +epoch 270: 70.232 + +epoch 275: 70.38 + +epoch 280: 70.726 + +epoch 285: 70.8 + +epoch 290: 70.844 + +epoch 295: 71.15 + +epoch 300: 71.56 + +epoch 305: 71.54 + +epoch 310: 71.538 + +epoch 315: 71.73 + +epoch 320: 72.144 + +epoch 325: 72.068 + +epoch 330: 72.182 + +epoch 335: 72.286 + +epoch 340: 72.434 + +epoch 345: 73.072 + +epoch 350: 72.998 + +epoch 355: 72.96 + +epoch 360: 73.062 + +epoch 365: 73.296 + +epoch 370: 73.85 + +epoch 375: 73.614 + +epoch 380: 73.934 + +epoch 385: 74.064 + +epoch 390: 74.35 + +epoch 395: 74.032 + +epoch 400: 74.446 + +epoch 405: 74.52 + +epoch 410: 74.736 + +epoch 415: 74.908 + +epoch 420: 75.154 + +epoch 425: 75.226 + +epoch 430: 75.556 + +epoch 435: 75.716 + +epoch 440: 75.612 + +epoch 445: 76.014 + +epoch 450: 75.798 + +epoch 455: 76.156 + +epoch 460: 76.268 + +epoch 465: 76.344 + +epoch 470: 76.656 + +epoch 475: 76.54 + +epoch 480: 76.572 + +epoch 485: 76.864 + +epoch 490: 77.142 + +epoch 495: 77.146 + +epoch 500: 77.664 + +epoch 505: 77.442 + +epoch 510: 77.72 + +epoch 515: 77.482 + +epoch 520: 77.788 + +epoch 525: 77.92 + +epoch 530: 78.172 + +epoch 535: 78.258 + +epoch 540: 78.44 + +epoch 545: 78.454 + +epoch 550: 78.522 + +epoch 555: 78.648 + +epoch 560: 78.574 + +epoch 565: 78.826 + +epoch 570: 78.874 + +epoch 575: 79.194 + +epoch 580: 78.97 + +epoch 585: 79.498 + +epoch 590: 79.432 + +epoch 595: 79.474 + +epoch 600: 79.6 + +epoch 605: 79.594 + +epoch 610: 79.934 + +epoch 615: 79.84 + +epoch 620: 79.916 + +epoch 625: 80.058 + +epoch 630: 80.038 + +epoch 635: 80.106 + +epoch 640: 80.302 + +epoch 645: 80.234 + +epoch 650: 80.388 + +epoch 655: 80.41 + +epoch 660: 80.47 + +epoch 665: 80.568 + +epoch 670: 80.57 + +epoch 675: 80.85 + +epoch 680: 80.862 + +epoch 685: 80.872 + +epoch 690: 80.918 + +epoch 695: 80.912 + +epoch 700: 81.012 + +epoch 705: 81.098 + +epoch 710: 81.042 + +epoch 715: 81.112 + +epoch 720: 81.154 + +epoch 725: 81.23 + +epoch 730: 81.118 + +epoch 735: 81.264 + +epoch 740: 81.24 + +epoch 745: 81.242 + +epoch 750: 81.21 + +epoch 755: 81.258 + +epoch 760: 81.342 + +epoch 765: 81.296 + +epoch 770: 81.33 + +epoch 775: 81.314 + +epoch 780: 81.312 + +epoch 785: 81.314 + +epoch 790: 81.334 + +epoch 795: 81.352 + +epoch 800: 81.376 +
``` python run_with_submitit.py --model deit_base_patch16_LS --data-path /path/to/imagenet --batch 256 --lr 3e-3 --epochs 800 --weight-decay 0.05 --sched cosine --input-size 192 --reprob 0.0 --node 1 --gpu 8 --smoothing 0.0 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt fusedlamb --warmup-lr 1e-6 --mixup .8 --drop-path 0.2 --cutmix 1.0 --unscale-lr --repeated-aug --bce-loss --color-jitter 0.3 --ThreeAugment ``` +
+ + logs + + +epoch 0: 0.1 +epoch 5: 2.838 + +epoch 10: 10.308 + +epoch 15: 17.292 + +epoch 20: 25.55 + +epoch 25: 33.436 + +epoch 30: 40.38 + +epoch 35: 45.446 + +epoch 40: 50.766 + +epoch 45: 54.162 + +epoch 50: 56.572 + +epoch 55: 58.8 + +epoch 60: 60.496 + +epoch 65: 61.994 + +epoch 70: 62.904 + +epoch 75: 64.06 + +epoch 80: 65.224 + +epoch 85: 65.718 + +epoch 90: 66.012 + +epoch 95: 66.984 + +epoch 100: 67.198 + +epoch 105: 67.864 + +epoch 110: 68.098 + +epoch 115: 68.568 + +epoch 120: 69.208 + +epoch 125: 69.448 + +epoch 130: 69.286 + +epoch 135: 69.568 + +epoch 140: 70.282 + +epoch 145: 70.396 + +epoch 150: 70.46 + +epoch 155: 70.844 + +epoch 160: 70.852 + +epoch 165: 71.33 + +epoch 170: 71.56 + +epoch 175: 71.784 + +epoch 180: 71.798 + +epoch 185: 72.162 + +epoch 190: 72.14 + +epoch 195: 72.082 + +epoch 200: 72.978 + +epoch 205: 72.562 + +epoch 210: 72.714 + +epoch 215: 73.006 + +epoch 220: 73.02 + +epoch 225: 73.466 + +epoch 230: 73.62 + +epoch 235: 73.656 + +epoch 240: 73.754 + +epoch 245: 73.718 + +epoch 250: 73.806 + +epoch 255: 74.182 + +epoch 260: 74.276 + +epoch 265: 74.592 + +epoch 270: 74.752 + +epoch 275: 74.86 + +epoch 280: 74.88 + +epoch 285: 75.044 + +epoch 290: 75.154 + +epoch 295: 75.482 + +epoch 300: 75.332 + +epoch 305: 75.548 + +epoch 310: 75.79 + +epoch 315: 75.832 + +epoch 320: 76.11 + +epoch 325: 76.27 + +epoch 330: 76.102 + +epoch 335: 76.556 + +epoch 340: 76.468 + +epoch 345: 76.514 + +epoch 350: 76.84 + +epoch 355: 77.128 + +epoch 360: 77.1 + +epoch 365: 76.99 + +epoch 370: 77.588 + +epoch 375: 77.336 + +epoch 380: 77.444 + +epoch 385: 77.924 + +epoch 390: 77.766 + +epoch 395: 77.756 + +epoch 400: 78.004 + +epoch 405: 78.238 + +epoch 410: 78.376 + +epoch 415: 78.45 + +epoch 420: 78.62 + +epoch 425: 78.628 + +epoch 430: 78.828 + +epoch 435: 78.92 + +epoch 440: 78.902 + +epoch 445: 78.994 + +epoch 450: 79.086 + +epoch 455: 79.206 + +epoch 460: 79.422 + +epoch 465: 79.394 + +epoch 470: 79.556 + +epoch 475: 79.736 + +epoch 480: 79.69 + +epoch 485: 79.978 + +epoch 490: 80.108 + +epoch 495: 80.162 + +epoch 500: 80.23 + +epoch 505: 80.346 + +epoch 510: 80.378 + +epoch 515: 80.488 + +epoch 520: 80.638 + +epoch 525: 80.666 + +epoch 530: 80.694 + +epoch 535: 80.798 + +epoch 540: 80.866 + +epoch 545: 81.024 + +epoch 550: 81.266 + +epoch 555: 81.028 + +epoch 560: 81.27 + +epoch 565: 81.306 + +epoch 570: 81.384 + +epoch 575: 81.474 + +epoch 580: 81.42 + +epoch 585: 81.53 + +epoch 590: 81.578 + +epoch 595: 81.726 + +epoch 600: 81.75 + +epoch 605: 81.672 + +epoch 610: 81.86 + +epoch 615: 82.006 + +epoch 620: 81.926 + +epoch 625: 81.806 + +epoch 630: 81.968 + +epoch 635: 82.104 + +epoch 640: 82.184 + +epoch 645: 82.202 + +epoch 650: 82.262 + +epoch 655: 82.224 + +epoch 660: 82.256 + +epoch 665: 82.284 + +epoch 670: 82.38 + +epoch 675: 82.438 + +epoch 680: 82.498 + +epoch 685: 82.554 + +epoch 690: 82.552 + +epoch 695: 82.648 + +epoch 700: 82.548 + +epoch 705: 82.702 + +epoch 710: 82.64 + +epoch 715: 82.598 + +epoch 720: 82.7 + +epoch 725: 82.686 + +epoch 730: 82.718 + +epoch 735: 82.71 + +epoch 740: 82.748 + +epoch 745: 82.784 + +epoch 750: 82.736 + +epoch 755: 82.77 + +epoch 760: 82.808 + +epoch 765: 82.754 + +epoch 770: 82.766 + +epoch 775: 82.798 + +epoch 780: 82.784 + +epoch 785: 82.802 + +epoch 790: 82.858 + +epoch 795: 82.866 + +epoch 800: 82.82 + +
+ + ``` python run_with_submitit.py --model deit_large_patch16_LS --data-path /path/to/imagenet --batch 64 --lr 3e-3 --epochs 800 --weight-decay 0.05 --sched cosine --input-size 192 --reprob 0.0 --node 4 --gpu 8 --smoothing 0.0 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt fusedlamb --warmup-lr 1e-6 --mixup .8 --drop-path 0.45 --cutmix 1.0 --unscale-lr --repeated-aug --bce-loss --color-jitter 0.3 --ThreeAugment ``` +
+ + logs + + +epoch 0: 0.092 + +epoch 5: 2.961 + +epoch 10: 9.847 + +epoch 15: 16.421 + +epoch 20: 24.51 + +epoch 25: 31.918 + +epoch 30: 39.016 + +epoch 35: 44.352 + +epoch 40: 49.568 + +epoch 45: 53.111 + +epoch 50: 55.806 + +epoch 55: 58.831 + +epoch 60: 60.379 + +epoch 65: 62.038 + +epoch 70: 63.162 + +epoch 75: 64.655 + +epoch 80: 65.499 + +epoch 85: 66.191 + +epoch 90: 66.557 + +epoch 95: 67.462 + +epoch 100: 68.096 + +epoch 105: 68.636 + +epoch 110: 68.924 + +epoch 115: 69.534 + +epoch 120: 70.024 + +epoch 125: 70.527 + +epoch 130: 70.783 + +epoch 135: 71.007 + +epoch 140: 71.211 + +epoch 145: 71.559 + +epoch 150: 71.819 + +epoch 155: 72.241 + +epoch 160: 72.095 + +epoch 165: 72.553 + +epoch 170: 72.945 + +epoch 175: 72.831 + +epoch 180: 73.313 + +epoch 185: 73.476 + +epoch 190: 73.534 + +epoch 195: 73.305 + +epoch 200: 73.85 + +epoch 205: 74.24 + +epoch 210: 74.34 + +epoch 215: 74.492 + +epoch 220: 74.67 + +epoch 225: 74.854 + +epoch 230: 74.94 + +epoch 235: 74.848 + +epoch 240: 75.082 + +epoch 245: 75.572 + +epoch 250: 75.698 + +epoch 255: 75.568 + +epoch 260: 75.948 + +epoch 265: 75.79 + +epoch 270: 76.116 + +epoch 275: 76.312 + +epoch 280: 76.322 + +epoch 285: 76.751 + +epoch 290: 76.891 + +epoch 295: 76.999 + +epoch 300: 77.251 + +epoch 305: 77.139 + +epoch 310: 77.207 + +epoch 315: 77.501 + +epoch 320: 77.467 + +epoch 325: 77.871 + +epoch 330: 77.689 + +epoch 335: 77.895 + +epoch 340: 78.013 + +epoch 345: 78.291 + +epoch 350: 78.295 + +epoch 355: 78.555 + +epoch 360: 78.877 + +epoch 365: 78.799 + +epoch 370: 79.163 + +epoch 375: 79.127 + +epoch 380: 79.319 + +epoch 385: 79.283 + +epoch 390: 79.239 + +epoch 395: 79.575 + +epoch 400: 79.617 + +epoch 405: 79.75 + +epoch 410: 79.95 + +epoch 415: 80.028 + +epoch 420: 80.21 + +epoch 425: 80.234 + +epoch 430: 80.42 + +epoch 435: 80.516 + +epoch 440: 80.802 + +epoch 445: 80.718 + +epoch 450: 80.878 + +epoch 455: 80.926 + +epoch 460: 81.118 + +epoch 465: 81.326 + +epoch 470: 81.298 + +epoch 475: 81.546 + +epoch 480: 81.626 + +epoch 485: 81.662 + +epoch 490: 81.624 + +epoch 495: 81.83 + +epoch 500: 81.854 + +epoch 505: 81.904 + +epoch 510: 82.192 + +epoch 515: 82.0 + +epoch 520: 82.112 + +epoch 525: 82.286 + +epoch 530: 82.318 + +epoch 535: 82.402 + +epoch 540: 82.514 + +epoch 545: 82.58 + +epoch 550: 82.626 + +epoch 555: 82.75 + +epoch 560: 82.762 + +epoch 565: 82.835 + +epoch 570: 83.019 + +epoch 575: 82.977 + +epoch 580: 83.033 + +epoch 585: 83.191 + +epoch 590: 83.145 + +epoch 595: 83.303 + +epoch 600: 83.313 + +epoch 605: 83.285 + +epoch 610: 83.443 + +epoch 615: 83.515 + +epoch 620: 83.517 + +epoch 625: 83.425 + +epoch 630: 83.487 + +epoch 635: 83.641 + +epoch 640: 83.635 + +epoch 645: 83.581 + +epoch 650: 83.667 + +epoch 655: 83.537 + +epoch 660: 83.669 + +epoch 665: 83.603 + +epoch 670: 83.775 + +epoch 675: 83.769 + +epoch 680: 83.703 + +epoch 685: 83.741 + +epoch 690: 83.737 + +epoch 695: 83.839 + +epoch 700: 83.873 + +epoch 705: 83.963 + +epoch 710: 83.929 + +epoch 715: 83.877 + +epoch 720: 83.919 + +epoch 725: 83.927 + +epoch 730: 83.943 + +epoch 735: 83.991 + +epoch 740: 84.037 + +epoch 745: 83.969 + +epoch 750: 83.941 + +epoch 755: 84.009 + +epoch 760: 84.009 + +epoch 765: 84.039 + +epoch 770: 84.047 + +epoch 775: 84.007 + +epoch 780: 83.995 + +epoch 785: 84.031 + +epoch 790: 84.031 + +epoch 795: 84.049 + +epoch 800: 84.024 + +
+ ``` python run_with_submitit.py --model deit_huge_patch14_LS --data-path /path/to/imagenet --batch 64 --lr 3e-3 --epochs 800 --weight-decay 0.05 --sched cosine --input-size 160 --reprob 0.0 --node 4 --gpu 8 --smoothing 0.0 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt fusedlamb --warmup-lr 1e-6 --mixup .8 --drop-path 0.6 --cutmix 1.0 --unscale-lr --repeated-aug --bce-loss --color-jitter 0.3 --ThreeAugment ``` +
+ + logs + + +epoch 0: 0.062 + +epoch 5: 2.553 + +epoch 10: 8.143 + +epoch 15: 13.69 + +epoch 20: 19.48 + +epoch 25: 25.138 + +epoch 30: 30.98 + +epoch 35: 35.323 + +epoch 40: 40.369 + +epoch 45: 44.196 + +epoch 50: 47.299 + +epoch 55: 50.34 + +epoch 60: 52.623 + +epoch 65: 54.659 + +epoch 70: 56.062 + +epoch 75: 57.616 + +epoch 80: 58.977 + +epoch 85: 59.841 + +epoch 90: 60.899 + +epoch 95: 61.578 + +epoch 100: 62.444 + +epoch 105: 63.266 + +epoch 110: 63.598 + +epoch 115: 64.008 + +epoch 120: 64.867 + +epoch 125: 65.447 + +epoch 130: 65.621 + +epoch 135: 66.247 + +epoch 140: 66.597 + +epoch 145: 67.422 + +epoch 150: 67.266 + +epoch 155: 67.77 + +epoch 160: 67.966 + +epoch 165: 68.492 + +epoch 170: 68.84 + +epoch 175: 68.996 + +epoch 180: 69.322 + +epoch 185: 69.654 + +epoch 190: 69.816 + +epoch 195: 69.628 + +epoch 200: 70.276 + +epoch 205: 70.601 + +epoch 210: 70.879 + +epoch 215: 70.991 + +epoch 220: 71.069 + +epoch 225: 71.605 + +epoch 230: 71.439 + +epoch 235: 71.983 + +epoch 240: 72.033 + +epoch 245: 72.319 + +epoch 250: 72.567 + +epoch 255: 72.537 + +epoch 260: 73.025 + +epoch 265: 73.249 + +epoch 270: 73.205 + +epoch 275: 73.281 + +epoch 280: 73.556 + +epoch 285: 73.848 + +epoch 290: 73.974 + +epoch 295: 74.332 + +epoch 300: 74.044 + +epoch 305: 74.54 + +epoch 310: 74.576 + +epoch 315: 74.756 + +epoch 320: 75.01 + +epoch 325: 75.146 + +epoch 330: 75.42 + +epoch 335: 75.566 + +epoch 340: 75.764 + +epoch 345: 75.932 + +epoch 350: 76.132 + +epoch 355: 76.212 + +epoch 360: 76.426 + +epoch 365: 76.43 + +epoch 370: 76.953 + +epoch 375: 76.755 + +epoch 380: 77.125 + +epoch 385: 77.437 + +epoch 390: 77.227 + +epoch 395: 77.505 + +epoch 400: 77.715 + +epoch 405: 77.833 + +epoch 410: 77.801 + +epoch 415: 78.339 + +epoch 420: 78.231 + +epoch 425: 78.491 + +epoch 430: 78.541 + +epoch 435: 78.651 + +epoch 440: 78.877 + +epoch 445: 79.009 + +epoch 450: 79.079 + +epoch 455: 79.409 + +epoch 460: 79.365 + +epoch 465: 79.513 + +epoch 470: 79.782 + +epoch 475: 79.8 + +epoch 480: 79.938 + +epoch 485: 79.938 + +epoch 490: 80.01 + +epoch 495: 80.148 + +epoch 500: 80.348 + +epoch 505: 80.51 + +epoch 510: 80.79 + +epoch 515: 80.722 + +epoch 520: 80.72 + +epoch 525: 80.872 + +epoch 530: 81.276 + +epoch 535: 80.992 + +epoch 540: 81.354 + +epoch 545: 81.264 + +epoch 550: 81.312 + +epoch 555: 81.474 + +epoch 560: 81.46 + +epoch 565: 81.652 + +epoch 570: 81.634 + +epoch 575: 81.75 + +epoch 580: 81.868 + +epoch 585: 81.972 + +epoch 590: 81.924 + +epoch 595: 82.09 + +epoch 600: 82.236 + +epoch 605: 82.174 + +epoch 610: 82.36 + +epoch 615: 82.526 + +epoch 620: 82.47 + +epoch 625: 82.534 + +epoch 630: 82.678 + +epoch 635: 82.55 + +epoch 640: 82.716 + +epoch 645: 82.726 + +epoch 650: 82.825 + +epoch 655: 82.903 + +epoch 660: 82.913 + +epoch 665: 82.965 + +epoch 670: 83.003 + +epoch 675: 82.995 + +epoch 680: 82.989 + +epoch 685: 83.013 + +epoch 690: 83.047 + +epoch 695: 83.137 + +epoch 700: 83.241 + +epoch 705: 83.147 + +epoch 710: 83.207 + +epoch 715: 83.187 + +epoch 720: 83.307 + +epoch 725: 83.319 + +epoch 730: 83.371 + +epoch 735: 83.309 + +epoch 740: 83.259 + +epoch 745: 83.335 + +epoch 750: 83.389 + +epoch 755: 83.373 + +epoch 760: 83.357 + +epoch 765: 83.425 + +epoch 770: 83.367 + +epoch 775: 83.433 + +epoch 780: 83.387 + +epoch 785: 83.387 + +epoch 790: 83.449 + +epoch 795: 83.449 + +epoch 800: 83.484 +
finetuning for ViT-B, L and H at resolution 224x224: @@ -97,27 +1409,125 @@ finetuning for ViT-B, L and H at resolution 224x224: python run_with_submitit.py --model deit_base_patch16_LS --data-path /path/to/imagenet --batch 64 --lr 1e-5 --epochs 20 --weight-decay 0.1 --sched cosine --input-size 224 --reprob 0.0 --node 1 --gpu 8 --smoothing 0.1 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt adamw --warmup-lr 1e-6 --mixup .8 --drop-path 0.2 --cutmix 1.0 --unscale-lr --aa rand-m9-mstd0.5-inc1 --no-repeated-aug --finetune model_path ``` +
+ + logs + + +epoch 0: 83.448 + +epoch 5: 83.71 + +epoch 10: 83.788 + +epoch 15: 83.826 + +epoch 20: 83.802 + +
+ ``` python run_with_submitit.py --model deit_large_patch16_LS --data-path /path/to/imagenet --batch 64 --lr 1e-5 --epochs 20 --weight-decay 0.1 --sched cosine --input-size 224 --reprob 0.0 --node 1 --gpu 8 --smoothing 0.1 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt adamw --warmup-lr 1e-6 --mixup .8 --drop-path 0.45 --cutmix 1.0 --unscale-lr --aa rand-m9-mstd0.5-inc1 --no-repeated-aug --finetune model_path ``` +
+ + logs + + +epoch 0: 84.458 + +epoch 5: 84.716 + +epoch 10: 84.826 + +epoch 15: 84.796 + +epoch 20: 84.862 + +
+ ``` python run_with_submitit.py --model deit_huge_patch14_LS --data-path /path/to/imagenet --batch 32 --lr 1e-5 --epochs 20 --weight-decay 0.1 --sched cosine --input-size 224 --reprob 0.0 --node 2 --gpu 8 --smoothing 0.1 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt adamw --warmup-lr 1e-6 --mixup .8 --drop-path 0.55 --cutmix 1.0 --unscale-lr --aa rand-m9-mstd0.5-inc1 --no-repeated-aug --finetune model_path ``` +
+ + logs + + +epoch 0: 84.328 + +epoch 5: 85.028 + +epoch 10: 85.128 + +epoch 15: 85.184 + +epoch 20: 85.218 + +
finetuning for ViT-S, B and L at resolution 384x384: ``` python run_with_submitit.py --model deit_small_patch16_LS --data-path /path/to/imagenet --batch 64 --lr 1e-5 --epochs 20 --weight-decay 0.1 --sched cosine --input-size 384 --reprob 0.0 --node 1 --gpu 8 --smoothing 0.1 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt adamw --warmup-lr 1e-6 --mixup .8 --drop-path 0.0 --cutmix 1.0 --unscale-lr --no-repeated-aug --aa rand-m9-mstd0.5-inc1 --finetune model_path ``` +
+ + logs + + +epoch 0: 82.134 + +epoch 5: 83.256 + +epoch 10: 83.452 + +epoch 15: 83.428 + +epoch 20: 83.422 + +
``` python run_with_submitit.py --model deit_base_patch16_LS --data-path /path/to/imagenet --batch 32 --lr 1e-5 --epochs 20 --weight-decay 0.1 --sched cosine --input-size 384 --reprob 0.0 --node 2 --gpu 8 --smoothing 0.1 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt adamw --warmup-lr 1e-6 --mixup .8 --drop-path 0.15 --cutmix 1.0 --unscale-lr --no-repeated-aug --aa rand-m9-mstd0.5-inc1 --finetune model_path ``` +
+ + logs + + +epoch 0: 84.296 + +epoch 5: 84.968 + +epoch 10: 85.002 + +epoch 15: 84.986 + +epoch 20: 85.076 + +
``` python run_with_submitit.py --model deit_large_patch16_LS --data-path /path/to/imagenet --batch 16 --lr 1e-5 --epochs 20 --weight-decay 0.1 --sched cosine --input-size 384 --reprob 0.0 --node 4 --gpu 8 --smoothing 0.1 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt adamw --warmup-lr 1e-6 --mixup .8 --drop-path 0.4 --cutmix 1.0 --unscale-lr --no-repeated-aug --aa rand-m9-mstd0.5-inc1 --finetune model_path ``` +
+ + logs + + +epoch 0: 84.691 + +epoch 5: 85.458 + +epoch 10: 85.736 + +epoch 15: 85.794 + +epoch 20: 85.812 + +
Training on ImageNet-21k: @@ -127,36 +1537,510 @@ It is possible to train with a batch size of 4096 with a learning rate of 0.0015 python run_with_submitit.py --model deit_small_patch16_LS --data-path /path/to/imagenet --batch 128 --lr 0.001 --epochs 240 --weight-decay 0.02 --sched cosine --input-size 224 --reprob 0.0 --node 2 --gpu 8 --smoothing 0.1 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt fusedlamb --warmup-lr 1e-6 --mixup 0 --drop-path 0.05 --cutmix 1.0 --unscale-lr --no-repeated-aug --color-jitter 0.3 --ThreeAugment --src ``` +
+ + logs + + +epoch 0: 0.0 + +epoch 5: 8.105 + +epoch 10: 32.78 + +epoch 15: 41.501 + +epoch 20: 44.226 + +epoch 25: 45.172 + +epoch 30: 45.991 + +epoch 35: 47.491 + +epoch 40: 47.151 + +epoch 45: 47.923 + +epoch 50: 48.327 + +epoch 55: 48.039 + +epoch 60: 48.325 + +epoch 65: 48.972 + +epoch 70: 49.1 + +epoch 75: 49.572 + +epoch 80: 49.368 + +epoch 85: 50.138 + +epoch 90: 49.82 + +epoch 95: 50.33 + +epoch 100: 50.748 + +epoch 105: 50.624 + +epoch 110: 50.63 + +epoch 115: 50.458 + +epoch 120: 51.13 + +epoch 125: 51.184 + +epoch 130: 51.871 + +epoch 135: 51.931 + +epoch 140: 51.791 + +epoch 145: 52.369 + +epoch 150: 52.409 + +epoch 155: 52.449 + +epoch 160: 52.499 + +epoch 165: 52.723 + +epoch 170: 53.267 + +epoch 175: 53.413 + +epoch 180: 53.373 + +epoch 185: 53.481 + +epoch 190: 53.321 + +epoch 195: 53.945 + +epoch 200: 53.913 + +epoch 205: 53.791 + +epoch 210: 54.111 + +epoch 215: 53.963 + +epoch 220: 54.057 + +epoch 225: 54.045 + +epoch 230: 54.107 + +epoch 235: 54.143 + +epoch 240: 54.12 + +
+ ``` python run_with_submitit.py --model deit_base_patch16_LS --data-path /path/to/imagenet --batch 64 --lr 0.001 --epochs 240 --weight-decay 0.02 --sched cosine --input-size 224 --reprob 0.0 --node 4 --gpu 8 --smoothing 0.1 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt fusedlamb --warmup-lr 1e-6 --mixup 0 --drop-path 0.1 --cutmix 1.0 --unscale-lr --no-repeated-aug --color-jitter 0.3 --ThreeAugment --src ``` +
+ + logs + + +epoch 0: 0.0 + +epoch 5: 14.083 + +epoch 10: 40.471 + +epoch 15: 46.165 + +epoch 20: 48.88 + +epoch 25: 49.576 + +epoch 30: 50.562 + +epoch 35: 51.402 + +epoch 40: 51.681 + +epoch 45: 51.799 + +epoch 50: 52.783 + +epoch 55: 52.457 + +epoch 60: 52.675 + +epoch 65: 53.413 + +epoch 70: 53.029 + +epoch 75: 53.679 + +epoch 80: 53.265 + +epoch 85: 53.295 + +epoch 90: 53.811 + +epoch 95: 54.467 + +epoch 100: 54.223 + +epoch 105: 55.15 + +epoch 110: 55.112 + +epoch 115: 54.605 + +epoch 120: 54.826 + +epoch 125: 55.006 + +epoch 130: 55.244 + +epoch 135: 55.628 + +epoch 140: 55.344 + +epoch 145: 55.78 + +epoch 150: 55.896 + +epoch 155: 55.756 + +epoch 160: 56.002 + +epoch 165: 56.072 + +epoch 170: 56.472 + +epoch 175: 56.278 + +epoch 180: 56.442 + +epoch 185: 56.47 + +epoch 190: 56.298 + +epoch 195: 56.49 + +epoch 200: 56.64 + +epoch 205: 56.396 + +epoch 210: 56.678 + +epoch 215: 56.652 + +epoch 220: 56.444 + +epoch 225: 56.446 + +epoch 230: 56.512 + +epoch 235: 56.586 + +epoch 240: 56.462 + +
``` python run_with_submitit.py --model deit_large_patch16_LS --data-path /path/to/imagenet --batch 64 --lr 0.001 --epochs 240 --weight-decay 0.02 --sched cosine --input-size 224 --reprob 0.0 --node 4 --gpu 8 --smoothing 0.1 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt fusedlamb --warmup-lr 1e-6 --mixup 0 --drop-path 0.3 --cutmix 1.0 --unscale-lr --no-repeated-aug --color-jitter 0.3 --ThreeAugment --src ``` +
+ + logs + + +epoch 0: 0.0 + +epoch 5: 18.702 + +epoch 10: 43.678 + +epoch 15: 48.805 + +epoch 20: 51.103 + +epoch 25: 51.852 + +epoch 30: 52.725 + +epoch 35: 53.211 + +epoch 40: 53.82 + +epoch 45: 54.136 + +epoch 50: 55.141 + +epoch 55: 54.302 + +epoch 60: 55.085 + +epoch 65: 55.099 + +epoch 70: 55.113 + +epoch 75: 55.792 + +epoch 80: 55.493 + +epoch 85: 55.782 + +epoch 90: 55.567 + +epoch 95: 55.896 + +epoch 100: 56.132 + +epoch 105: 55.936 + +epoch 110: 56.498 + +epoch 115: 56.264 + +epoch 120: 56.45 + +epoch 125: 56.568 + +epoch 130: 56.734 + +epoch 135: 57.083 + +epoch 140: 56.915 + +epoch 145: 57.197 + +epoch 150: 56.999 + +epoch 155: 56.929 + +epoch 160: 57.211 + +epoch 165: 57.219 + +epoch 170: 57.623 + +epoch 175: 57.329 + +epoch 180: 57.243 + +epoch 185: 57.523 + +epoch 190: 57.257 + +epoch 195: 57.391 + +epoch 200: 57.343 + +epoch 205: 57.211 + +epoch 210: 57.437 + +epoch 215: 57.471 + +epoch 220: 57.481 + +epoch 225: 57.417 + +epoch 230: 57.439 + +epoch 235: 57.497 + +epoch 240: 57.412 + +
+ ``` python run_with_submitit.py --model deit_huge_patch14_LS --data-path /path/to/imagenet --batch 64 --lr 0.001 --epochs 90 --weight-decay 0.02 --sched cosine --input-size 128 --reprob 0.0 --node 4 --gpu 8 --smoothing 0.1 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt fusedlamb --warmup-lr 1e-6 --mixup 0 --drop-path 0.5 --cutmix 1.0 --unscale-lr --no-repeated-aug --color-jitter 0.3 --ThreeAugment --src ``` + +
+ + logs + + +epoch 0: 0.0 + +epoch 5: 31.292 + +epoch 10: 45.668 + +epoch 15: 48.563 + +epoch 20: 50.37 + +epoch 25: 51.143 + +epoch 30: 52.518 + +epoch 35: 53.205 + +epoch 40: 53.459 + +epoch 45: 54.482 + +epoch 50: 55.956 + +epoch 55: 55.872 + +epoch 60: 56.658 + +epoch 65: 57.173 + +epoch 70: 57.525 + +epoch 75: 57.882 + +epoch 80: 57.761 + +epoch 85: 58.006 + +epoch 90: 57.952 + +
+ finetuning on ImageNet-1k: ``` python run_with_submitit.py --model deit_small_patch16_LS --data-path /path/to/imagenet --batch 128 --lr 0.0003 --epochs 50 --weight-decay 0.02 --sched cosine --input-size 224 --reprob 0.0 --node 2 --gpu 8 --smoothing 0.1 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt fusedlamb --warmup-lr 1e-6 --mixup 0 --drop-path 0.05 --cutmix 1.0 --unscale-lr --no-repeated-aug --color-jitter 0.3 --ThreeAugment --src ``` +
+ + logs + + +epoch 0: 0.13 + +epoch 5: 79.023 + +epoch 10: 80.952 + +epoch 15: 81.68 + +epoch 20: 82.178 + +epoch 25: 82.436 + +epoch 30: 82.678 + +epoch 35: 82.925 + +epoch 40: 82.963 + +epoch 45: 83.053 + +epoch 50: 83.074 +
+ ``` python run_with_submitit.py --model deit_base_patch16_LS --data-path /path/to/imagenet --batch 64 --lr 0.0003 --epochs 50 --weight-decay 0.02 --sched cosine --input-size 224 --reprob 0.0 --node 4 --gpu 8 --smoothing 0.1 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt fusedlamb --warmup-lr 1e-6 --mixup 0 --drop-path 0.15 --cutmix 1.0 --unscale-lr --no-repeated-aug --color-jitter 0.3 --ThreeAugment --src ``` +
+ + logs + + +epoch 0: 0.11 + +epoch 5: 83.445 + +epoch 10: 84.677 + +epoch 15: 85.211 + +epoch 20: 85.265 + +epoch 25: 85.333 + +epoch 30: 85.437 + +epoch 35: 85.675 + +epoch 40: 85.671 + +epoch 45: 85.707 + +epoch 50: 85.698 + +
+ ``` python run_with_submitit.py --model deit_large_patch16_LS --data-path /path/to/imagenet --batch 64 --lr 0.0003 --epochs 50 --weight-decay 0.02 --sched cosine --input-size 224 --reprob 0.0 --node 4 --gpu 8 --smoothing 0.1 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt fusedlamb --warmup-lr 1e-6 --mixup 0 --drop-path 0.4 --cutmix 1.0 --unscale-lr --no-repeated-aug --color-jitter 0.3 --ThreeAugment --src ``` +
+ + logs + + +epoch 0: 0.106 + +epoch 5: 85.427 + +epoch 10: 86.362 + +epoch 15: 86.624 + +epoch 20: 86.696 + +epoch 25: 86.826 + +epoch 30: 86.83 + +epoch 35: 86.954 + +epoch 40: 86.944 + +epoch 45: 86.934 + +epoch 50: 86.98 + +
+ ``` python run_with_submitit.py --model deit_huge_patch14_LS --data-path /path/to/imagenet --batch 64 --lr 0.0003 --epochs 50 --weight-decay 0.02 --sched cosine --input-size 224 --reprob 0.0 --node 4 --gpu 8 --smoothing 0.1 --warmup-epochs 5 --drop 0.0 --nb-classes 1000 --seed 0 --opt fusedlamb --warmup-lr 1e-6 --mixup 0 --drop-path 0.45 --cutmix 1.0 --unscale-lr --no-repeated-aug --color-jitter 0.3 --ThreeAugment --src ``` +
+ + logs + + +epoch 0: 0.126 + +epoch 5: 84.681 + +epoch 10: 86.291 + +epoch 15: 86.753 + +epoch 20: 86.827 + +epoch 25: 86.903 + +epoch 30: 87.126 + +epoch 35: 87.056 + +epoch 40: 87.11 + +epoch 45: 87.154 + +epoch 50: 87.184 +
+ # License This repository is released under the Apache 2.0 license as found in the [LICENSE](LICENSE) file.