| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367 |
- Collections:
- - Name: MAE
- Metadata:
- Training Data: ImageNet-1k
- Training Techniques:
- - AdamW
- Training Resources: 8x A100-80G GPUs
- Architecture:
- - ViT
- Paper:
- Title: Masked Autoencoders Are Scalable Vision Learners
- URL: https://arxiv.org/abs/2111.06377
- README: configs/mae/README.md
- Models:
- - Name: mae_vit-base-p16_8xb512-amp-coslr-300e_in1k
- Metadata:
- Epochs: 300
- Batch Size: 4096
- FLOPs: 17581972224
- Parameters: 111907840
- Training Data: ImageNet-1k
- In Collection: MAE
- Results: null
- Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-base-p16_8xb512-fp16-coslr-300e_in1k/mae_vit-base-p16_8xb512-coslr-300e-fp16_in1k_20220829-c2cf66ba.pth
- Config: configs/mae/mae_vit-base-p16_8xb512-amp-coslr-300e_in1k.py
- Downstream:
- - vit-base-p16_mae-300e-pre_8xb2048-linear-coslr-90e_in1k
- - vit-base-p16_mae-300e-pre_8xb128-coslr-100e_in1k
- - Name: mae_vit-base-p16_8xb512-amp-coslr-400e_in1k
- Metadata:
- Epochs: 400
- Batch Size: 4096
- FLOPs: 17581972224
- Parameters: 111907840
- Training Data: ImageNet-1k
- In Collection: MAE
- Results: null
- Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-base-p16_8xb512-fp16-coslr-400e_in1k/mae_vit-base-p16_8xb512-coslr-400e-fp16_in1k_20220825-bc79e40b.pth
- Config: configs/mae/mae_vit-base-p16_8xb512-amp-coslr-400e_in1k.py
- Downstream:
- - vit-base-p16_mae-400e-pre_8xb2048-linear-coslr-90e_in1k
- - vit-base-p16_mae-400e-pre_8xb128-coslr-100e_in1k
- - Name: mae_vit-base-p16_8xb512-amp-coslr-800e_in1k
- Metadata:
- Epochs: 800
- Batch Size: 4096
- FLOPs: 17581972224
- Parameters: 111907840
- Training Data: ImageNet-1k
- In Collection: MAE
- Results: null
- Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-base-p16_8xb512-fp16-coslr-800e_in1k/mae_vit-base-p16_8xb512-coslr-800e-fp16_in1k_20220825-5d81fbc4.pth
- Config: configs/mae/mae_vit-base-p16_8xb512-amp-coslr-800e_in1k.py
- Downstream:
- - vit-base-p16_mae-800e-pre_8xb2048-linear-coslr-90e_in1k
- - vit-base-p16_mae-800e-pre_8xb128-coslr-100e_in1k
- - Name: mae_vit-base-p16_8xb512-amp-coslr-1600e_in1k
- Metadata:
- Epochs: 1600
- Batch Size: 4096
- FLOPs: 17581972224
- Parameters: 111907840
- Training Data: ImageNet-1k
- In Collection: MAE
- Results: null
- Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-base-p16_8xb512-fp16-coslr-1600e_in1k/mae_vit-base-p16_8xb512-fp16-coslr-1600e_in1k_20220825-f7569ca2.pth
- Config: configs/mae/mae_vit-base-p16_8xb512-amp-coslr-1600e_in1k.py
- Downstream:
- - vit-base-p16_mae-1600e-pre_8xb2048-linear-coslr-90e_in1k
- - vit-base-p16_mae-1600e-pre_8xb128-coslr-100e_in1k
- - Name: mae_vit-large-p16_8xb512-amp-coslr-400e_in1k
- Metadata:
- Epochs: 400
- Batch Size: 4096
- FLOPs: 61603111936
- Parameters: 329541888
- Training Data: ImageNet-1k
- In Collection: MAE
- Results: null
- Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-large-p16_8xb512-fp16-coslr-400e_in1k/mae_vit-large-p16_8xb512-fp16-coslr-400e_in1k_20220825-b11d0425.pth
- Config: configs/mae/mae_vit-large-p16_8xb512-amp-coslr-400e_in1k.py
- Downstream:
- - vit-large-p16_mae-400e-pre_8xb2048-linear-coslr-90e_in1k
- - vit-large-p16_mae-400e-pre_8xb128-coslr-50e_in1k
- - Name: mae_vit-large-p16_8xb512-amp-coslr-800e_in1k
- Metadata:
- Epochs: 800
- Batch Size: 4096
- FLOPs: 61603111936
- Parameters: 329541888
- Training Data: ImageNet-1k
- In Collection: MAE
- Results: null
- Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-large-p16_8xb512-fp16-coslr-800e_in1k/mae_vit-large-p16_8xb512-fp16-coslr-800e_in1k_20220825-df72726a.pth
- Config: configs/mae/mae_vit-large-p16_8xb512-amp-coslr-800e_in1k.py
- Downstream:
- - vit-large-p16_mae-800e-pre_8xb2048-linear-coslr-90e_in1k
- - vit-large-p16_mae-800e-pre_8xb128-coslr-50e_in1k
- - Name: mae_vit-large-p16_8xb512-amp-coslr-1600e_in1k
- Metadata:
- Epochs: 1600
- Batch Size: 4096
- FLOPs: 61603111936
- Parameters: 329541888
- Training Data: ImageNet-1k
- In Collection: MAE
- Results: null
- Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-large-p16_8xb512-fp16-coslr-1600e_in1k/mae_vit-large-p16_8xb512-fp16-coslr-1600e_in1k_20220825-cc7e98c9.pth
- Config: configs/mae/mae_vit-large-p16_8xb512-amp-coslr-1600e_in1k.py
- Downstream:
- - vit-large-p16_mae-1600e-pre_8xb2048-linear-coslr-90e_in1k
- - vit-large-p16_mae-1600e-pre_8xb128-coslr-50e_in1k
- - Name: mae_vit-huge-p16_8xb512-amp-coslr-1600e_in1k
- Metadata:
- Epochs: 1600
- Batch Size: 4096
- FLOPs: 167400741120
- Parameters: 657074508
- Training Data: ImageNet-1k
- In Collection: MAE
- Results: null
- Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-huge-p16_8xb512-fp16-coslr-1600e_in1k/mae_vit-huge-p16_8xb512-fp16-coslr-1600e_in1k_20220916-ff848775.pth
- Config: configs/mae/mae_vit-huge-p14_8xb512-amp-coslr-1600e_in1k.py
- Downstream:
- - vit-huge-p14_mae-1600e-pre_8xb128-coslr-50e_in1k
- - vit-huge-p14_mae-1600e-pre_32xb8-coslr-50e_in1k-448px
- - Name: vit-base-p16_mae-300e-pre_8xb128-coslr-100e_in1k
- Metadata:
- Epochs: 100
- Batch Size: 1024
- FLOPs: 17581215744
- Parameters: 86566120
- Training Data: ImageNet-1k
- In Collection: MAE
- Results:
- - Task: Image Classification
- Dataset: ImageNet-1k
- Metrics:
- Top 1 Accuracy: 83.1
- Weights: null
- Config: configs/mae/benchmarks/vit-base-p16_8xb128-coslr-100e_in1k.py
- - Name: vit-base-p16_mae-400e-pre_8xb128-coslr-100e_in1k
- Metadata:
- Epochs: 100
- Batch Size: 1024
- FLOPs: 17581215744
- Parameters: 86566120
- Training Data: ImageNet-1k
- In Collection: MAE
- Results:
- - Task: Image Classification
- Dataset: ImageNet-1k
- Metrics:
- Top 1 Accuracy: 83.3
- Weights: null
- Config: configs/mae/benchmarks/vit-base-p16_8xb128-coslr-100e_in1k.py
- - Name: vit-base-p16_mae-800e-pre_8xb128-coslr-100e_in1k
- Metadata:
- Epochs: 100
- Batch Size: 1024
- FLOPs: 17581215744
- Parameters: 86566120
- Training Data: ImageNet-1k
- In Collection: MAE
- Results:
- - Task: Image Classification
- Dataset: ImageNet-1k
- Metrics:
- Top 1 Accuracy: 83.3
- Weights: null
- Config: configs/mae/benchmarks/vit-base-p16_8xb128-coslr-100e_in1k.py
- - Name: vit-base-p16_mae-1600e-pre_8xb128-coslr-100e_in1k
- Metadata:
- Epochs: 100
- Batch Size: 1024
- FLOPs: 17581215744
- Parameters: 86566120
- Training Data: ImageNet-1k
- In Collection: MAE
- Results:
- - Task: Image Classification
- Dataset: ImageNet-1k
- Metrics:
- Top 1 Accuracy: 83.5
- Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-base-p16_8xb512-fp16-coslr-1600e_in1k/vit-base-p16_ft-8xb128-coslr-100e_in1k/vit-base-p16_ft-8xb128-coslr-100e_in1k_20220825-cf70aa21.pth
- Config: configs/mae/benchmarks/vit-base-p16_8xb128-coslr-100e_in1k.py
- - Name: vit-base-p16_mae-300e-pre_8xb2048-linear-coslr-90e_in1k
- Metadata:
- Epochs: 90
- Batch Size: 16384
- FLOPs: 17581972992
- Parameters: 86567656
- Training Data: ImageNet-1k
- In Collection: MAE
- Results:
- - Task: Image Classification
- Dataset: ImageNet-1k
- Metrics:
- Top 1 Accuracy: 60.8
- Weights: null
- Config: configs/mae/benchmarks/vit-base-p16_8xb2048-linear-coslr-90e_in1k.py
- - Name: vit-base-p16_mae-400e-pre_8xb2048-linear-coslr-90e_in1k
- Metadata:
- Epochs: 90
- Batch Size: 16384
- FLOPs: 17581972992
- Parameters: 86567656
- Training Data: ImageNet-1k
- In Collection: MAE
- Results:
- - Task: Image Classification
- Dataset: ImageNet-1k
- Metrics:
- Top 1 Accuracy: 62.5
- Weights: null
- Config: configs/mae/benchmarks/vit-base-p16_8xb2048-linear-coslr-90e_in1k.py
- - Name: vit-base-p16_mae-800e-pre_8xb2048-linear-coslr-90e_in1k
- Metadata:
- Epochs: 90
- Batch Size: 16384
- FLOPs: 17581972992
- Parameters: 86567656
- Training Data: ImageNet-1k
- In Collection: MAE
- Results:
- - Task: Image Classification
- Dataset: ImageNet-1k
- Metrics:
- Top 1 Accuracy: 65.1
- Weights: null
- Config: configs/mae/benchmarks/vit-base-p16_8xb2048-linear-coslr-90e_in1k.py
- - Name: vit-base-p16_mae-1600e-pre_8xb2048-linear-coslr-90e_in1k
- Metadata:
- Epochs: 90
- Batch Size: 16384
- FLOPs: 17581972992
- Parameters: 86567656
- Training Data: ImageNet-1k
- In Collection: MAE
- Results:
- - Task: Image Classification
- Dataset: ImageNet-1k
- Metrics:
- Top 1 Accuracy: 67.1
- Weights: null
- Config: configs/mae/benchmarks/vit-base-p16_8xb2048-linear-coslr-90e_in1k.py
- - Name: vit-large-p16_mae-400e-pre_8xb128-coslr-50e_in1k
- Metadata:
- Epochs: 50
- Batch Size: 1024
- FLOPs: 61602103296
- Parameters: 304324584
- Training Data: ImageNet-1k
- In Collection: MAE
- Results:
- - Task: Image Classification
- Dataset: ImageNet-1k
- Metrics:
- Top 1 Accuracy: 85.2
- Weights: null
- Config: configs/mae/benchmarks/vit-large-p16_8xb128-coslr-50e_in1k.py
- - Name: vit-large-p16_mae-800e-pre_8xb128-coslr-50e_in1k
- Metadata:
- Epochs: 50
- Batch Size: 1024
- FLOPs: 61602103296
- Parameters: 304324584
- Training Data: ImageNet-1k
- In Collection: MAE
- Results:
- - Task: Image Classification
- Dataset: ImageNet-1k
- Metrics:
- Top 1 Accuracy: 85.4
- Weights: null
- Config: configs/mae/benchmarks/vit-large-p16_8xb128-coslr-50e_in1k.py
- - Name: vit-large-p16_mae-1600e-pre_8xb128-coslr-50e_in1k
- Metadata:
- Epochs: 50
- Batch Size: 1024
- FLOPs: 61602103296
- Parameters: 304324584
- Training Data: ImageNet-1k
- In Collection: MAE
- Results:
- - Task: Image Classification
- Dataset: ImageNet-1k
- Metrics:
- Top 1 Accuracy: 85.7
- Weights: null
- Config: configs/mae/benchmarks/vit-large-p16_8xb128-coslr-50e_in1k.py
- - Name: vit-large-p16_mae-400e-pre_8xb2048-linear-coslr-90e_in1k
- Metadata:
- Epochs: 90
- Batch Size: 16384
- FLOPs: 61603112960
- Parameters: 304326632
- Training Data: ImageNet-1k
- In Collection: MAE
- Results:
- - Task: Image Classification
- Dataset: ImageNet-1k
- Metrics:
- Top 1 Accuracy: 70.7
- Weights: null
- Config: configs/mae/benchmarks/vit-large-p16_8xb2048-linear-coslr-90e_in1k.py
- - Name: vit-large-p16_mae-800e-pre_8xb2048-linear-coslr-90e_in1k
- Metadata:
- Epochs: 90
- Batch Size: 16384
- FLOPs: 61603112960
- Parameters: 304326632
- Training Data: ImageNet-1k
- In Collection: MAE
- Results:
- - Task: Image Classification
- Dataset: ImageNet-1k
- Metrics:
- Top 1 Accuracy: 73.7
- Weights: null
- Config: configs/mae/benchmarks/vit-large-p16_8xb2048-linear-coslr-90e_in1k.py
- - Name: vit-large-p16_mae-1600e-pre_8xb2048-linear-coslr-90e_in1k
- Metadata:
- Epochs: 90
- Batch Size: 16384
- FLOPs: 61603112960
- Parameters: 304326632
- Training Data: ImageNet-1k
- In Collection: MAE
- Results:
- - Task: Image Classification
- Dataset: ImageNet-1k
- Metrics:
- Top 1 Accuracy: 75.5
- Weights: null
- Config: configs/mae/benchmarks/vit-large-p16_8xb2048-linear-coslr-90e_in1k.py
- - Name: vit-huge-p14_mae-1600e-pre_8xb128-coslr-50e_in1k
- Metadata:
- Epochs: 50
- Batch Size: 1024
- FLOPs: 167399096320
- Parameters: 632043240
- Training Data: ImageNet-1k
- In Collection: MAE
- Results:
- - Task: Image Classification
- Dataset: ImageNet-1k
- Metrics:
- Top 1 Accuracy: 86.9
- Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-huge-p16_8xb512-fp16-coslr-1600e_in1k/vit-huge-p16_ft-8xb128-coslr-50e_in1k/vit-huge-p16_ft-8xb128-coslr-50e_in1k_20220916-0bfc9bfd.pth
- Config: configs/mae/benchmarks/vit-huge-p14_8xb128-coslr-50e_in1k.py
- - Name: vit-huge-p14_mae-1600e-pre_32xb8-coslr-50e_in1k-448px
- Metadata:
- Epochs: 50
- Batch Size: 256
- FLOPs: 732131983360
- Parameters: 633026280
- Training Data: ImageNet-1k
- In Collection: MAE
- Results:
- - Task: Image Classification
- Dataset: ImageNet-1k
- Metrics:
- Top 1 Accuracy: 87.3
- Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-huge-p16_8xb512-fp16-coslr-1600e_in1k/vit-huge-p16_ft-32xb8-coslr-50e_in1k-448/vit-huge-p16_ft-32xb8-coslr-50e_in1k-448_20220916-95b6a0ce.pth
- Config: configs/mae/benchmarks/vit-huge-p14_32xb8-coslr-50e_in1k-448px.py
|