metafile.yml 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367
  1. Collections:
  2. - Name: MAE
  3. Metadata:
  4. Training Data: ImageNet-1k
  5. Training Techniques:
  6. - AdamW
  7. Training Resources: 8x A100-80G GPUs
  8. Architecture:
  9. - ViT
  10. Paper:
  11. Title: Masked Autoencoders Are Scalable Vision Learners
  12. URL: https://arxiv.org/abs/2111.06377
  13. README: configs/mae/README.md
  14. Models:
  15. - Name: mae_vit-base-p16_8xb512-amp-coslr-300e_in1k
  16. Metadata:
  17. Epochs: 300
  18. Batch Size: 4096
  19. FLOPs: 17581972224
  20. Parameters: 111907840
  21. Training Data: ImageNet-1k
  22. In Collection: MAE
  23. Results: null
  24. Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-base-p16_8xb512-fp16-coslr-300e_in1k/mae_vit-base-p16_8xb512-coslr-300e-fp16_in1k_20220829-c2cf66ba.pth
  25. Config: configs/mae/mae_vit-base-p16_8xb512-amp-coslr-300e_in1k.py
  26. Downstream:
  27. - vit-base-p16_mae-300e-pre_8xb2048-linear-coslr-90e_in1k
  28. - vit-base-p16_mae-300e-pre_8xb128-coslr-100e_in1k
  29. - Name: mae_vit-base-p16_8xb512-amp-coslr-400e_in1k
  30. Metadata:
  31. Epochs: 400
  32. Batch Size: 4096
  33. FLOPs: 17581972224
  34. Parameters: 111907840
  35. Training Data: ImageNet-1k
  36. In Collection: MAE
  37. Results: null
  38. Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-base-p16_8xb512-fp16-coslr-400e_in1k/mae_vit-base-p16_8xb512-coslr-400e-fp16_in1k_20220825-bc79e40b.pth
  39. Config: configs/mae/mae_vit-base-p16_8xb512-amp-coslr-400e_in1k.py
  40. Downstream:
  41. - vit-base-p16_mae-400e-pre_8xb2048-linear-coslr-90e_in1k
  42. - vit-base-p16_mae-400e-pre_8xb128-coslr-100e_in1k
  43. - Name: mae_vit-base-p16_8xb512-amp-coslr-800e_in1k
  44. Metadata:
  45. Epochs: 800
  46. Batch Size: 4096
  47. FLOPs: 17581972224
  48. Parameters: 111907840
  49. Training Data: ImageNet-1k
  50. In Collection: MAE
  51. Results: null
  52. Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-base-p16_8xb512-fp16-coslr-800e_in1k/mae_vit-base-p16_8xb512-coslr-800e-fp16_in1k_20220825-5d81fbc4.pth
  53. Config: configs/mae/mae_vit-base-p16_8xb512-amp-coslr-800e_in1k.py
  54. Downstream:
  55. - vit-base-p16_mae-800e-pre_8xb2048-linear-coslr-90e_in1k
  56. - vit-base-p16_mae-800e-pre_8xb128-coslr-100e_in1k
  57. - Name: mae_vit-base-p16_8xb512-amp-coslr-1600e_in1k
  58. Metadata:
  59. Epochs: 1600
  60. Batch Size: 4096
  61. FLOPs: 17581972224
  62. Parameters: 111907840
  63. Training Data: ImageNet-1k
  64. In Collection: MAE
  65. Results: null
  66. Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-base-p16_8xb512-fp16-coslr-1600e_in1k/mae_vit-base-p16_8xb512-fp16-coslr-1600e_in1k_20220825-f7569ca2.pth
  67. Config: configs/mae/mae_vit-base-p16_8xb512-amp-coslr-1600e_in1k.py
  68. Downstream:
  69. - vit-base-p16_mae-1600e-pre_8xb2048-linear-coslr-90e_in1k
  70. - vit-base-p16_mae-1600e-pre_8xb128-coslr-100e_in1k
  71. - Name: mae_vit-large-p16_8xb512-amp-coslr-400e_in1k
  72. Metadata:
  73. Epochs: 400
  74. Batch Size: 4096
  75. FLOPs: 61603111936
  76. Parameters: 329541888
  77. Training Data: ImageNet-1k
  78. In Collection: MAE
  79. Results: null
  80. Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-large-p16_8xb512-fp16-coslr-400e_in1k/mae_vit-large-p16_8xb512-fp16-coslr-400e_in1k_20220825-b11d0425.pth
  81. Config: configs/mae/mae_vit-large-p16_8xb512-amp-coslr-400e_in1k.py
  82. Downstream:
  83. - vit-large-p16_mae-400e-pre_8xb2048-linear-coslr-90e_in1k
  84. - vit-large-p16_mae-400e-pre_8xb128-coslr-50e_in1k
  85. - Name: mae_vit-large-p16_8xb512-amp-coslr-800e_in1k
  86. Metadata:
  87. Epochs: 800
  88. Batch Size: 4096
  89. FLOPs: 61603111936
  90. Parameters: 329541888
  91. Training Data: ImageNet-1k
  92. In Collection: MAE
  93. Results: null
  94. Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-large-p16_8xb512-fp16-coslr-800e_in1k/mae_vit-large-p16_8xb512-fp16-coslr-800e_in1k_20220825-df72726a.pth
  95. Config: configs/mae/mae_vit-large-p16_8xb512-amp-coslr-800e_in1k.py
  96. Downstream:
  97. - vit-large-p16_mae-800e-pre_8xb2048-linear-coslr-90e_in1k
  98. - vit-large-p16_mae-800e-pre_8xb128-coslr-50e_in1k
  99. - Name: mae_vit-large-p16_8xb512-amp-coslr-1600e_in1k
  100. Metadata:
  101. Epochs: 1600
  102. Batch Size: 4096
  103. FLOPs: 61603111936
  104. Parameters: 329541888
  105. Training Data: ImageNet-1k
  106. In Collection: MAE
  107. Results: null
  108. Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-large-p16_8xb512-fp16-coslr-1600e_in1k/mae_vit-large-p16_8xb512-fp16-coslr-1600e_in1k_20220825-cc7e98c9.pth
  109. Config: configs/mae/mae_vit-large-p16_8xb512-amp-coslr-1600e_in1k.py
  110. Downstream:
  111. - vit-large-p16_mae-1600e-pre_8xb2048-linear-coslr-90e_in1k
  112. - vit-large-p16_mae-1600e-pre_8xb128-coslr-50e_in1k
  113. - Name: mae_vit-huge-p16_8xb512-amp-coslr-1600e_in1k
  114. Metadata:
  115. Epochs: 1600
  116. Batch Size: 4096
  117. FLOPs: 167400741120
  118. Parameters: 657074508
  119. Training Data: ImageNet-1k
  120. In Collection: MAE
  121. Results: null
  122. Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-huge-p16_8xb512-fp16-coslr-1600e_in1k/mae_vit-huge-p16_8xb512-fp16-coslr-1600e_in1k_20220916-ff848775.pth
  123. Config: configs/mae/mae_vit-huge-p14_8xb512-amp-coslr-1600e_in1k.py
  124. Downstream:
  125. - vit-huge-p14_mae-1600e-pre_8xb128-coslr-50e_in1k
  126. - vit-huge-p14_mae-1600e-pre_32xb8-coslr-50e_in1k-448px
  127. - Name: vit-base-p16_mae-300e-pre_8xb128-coslr-100e_in1k
  128. Metadata:
  129. Epochs: 100
  130. Batch Size: 1024
  131. FLOPs: 17581215744
  132. Parameters: 86566120
  133. Training Data: ImageNet-1k
  134. In Collection: MAE
  135. Results:
  136. - Task: Image Classification
  137. Dataset: ImageNet-1k
  138. Metrics:
  139. Top 1 Accuracy: 83.1
  140. Weights: null
  141. Config: configs/mae/benchmarks/vit-base-p16_8xb128-coslr-100e_in1k.py
  142. - Name: vit-base-p16_mae-400e-pre_8xb128-coslr-100e_in1k
  143. Metadata:
  144. Epochs: 100
  145. Batch Size: 1024
  146. FLOPs: 17581215744
  147. Parameters: 86566120
  148. Training Data: ImageNet-1k
  149. In Collection: MAE
  150. Results:
  151. - Task: Image Classification
  152. Dataset: ImageNet-1k
  153. Metrics:
  154. Top 1 Accuracy: 83.3
  155. Weights: null
  156. Config: configs/mae/benchmarks/vit-base-p16_8xb128-coslr-100e_in1k.py
  157. - Name: vit-base-p16_mae-800e-pre_8xb128-coslr-100e_in1k
  158. Metadata:
  159. Epochs: 100
  160. Batch Size: 1024
  161. FLOPs: 17581215744
  162. Parameters: 86566120
  163. Training Data: ImageNet-1k
  164. In Collection: MAE
  165. Results:
  166. - Task: Image Classification
  167. Dataset: ImageNet-1k
  168. Metrics:
  169. Top 1 Accuracy: 83.3
  170. Weights: null
  171. Config: configs/mae/benchmarks/vit-base-p16_8xb128-coslr-100e_in1k.py
  172. - Name: vit-base-p16_mae-1600e-pre_8xb128-coslr-100e_in1k
  173. Metadata:
  174. Epochs: 100
  175. Batch Size: 1024
  176. FLOPs: 17581215744
  177. Parameters: 86566120
  178. Training Data: ImageNet-1k
  179. In Collection: MAE
  180. Results:
  181. - Task: Image Classification
  182. Dataset: ImageNet-1k
  183. Metrics:
  184. Top 1 Accuracy: 83.5
  185. Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-base-p16_8xb512-fp16-coslr-1600e_in1k/vit-base-p16_ft-8xb128-coslr-100e_in1k/vit-base-p16_ft-8xb128-coslr-100e_in1k_20220825-cf70aa21.pth
  186. Config: configs/mae/benchmarks/vit-base-p16_8xb128-coslr-100e_in1k.py
  187. - Name: vit-base-p16_mae-300e-pre_8xb2048-linear-coslr-90e_in1k
  188. Metadata:
  189. Epochs: 90
  190. Batch Size: 16384
  191. FLOPs: 17581972992
  192. Parameters: 86567656
  193. Training Data: ImageNet-1k
  194. In Collection: MAE
  195. Results:
  196. - Task: Image Classification
  197. Dataset: ImageNet-1k
  198. Metrics:
  199. Top 1 Accuracy: 60.8
  200. Weights: null
  201. Config: configs/mae/benchmarks/vit-base-p16_8xb2048-linear-coslr-90e_in1k.py
  202. - Name: vit-base-p16_mae-400e-pre_8xb2048-linear-coslr-90e_in1k
  203. Metadata:
  204. Epochs: 90
  205. Batch Size: 16384
  206. FLOPs: 17581972992
  207. Parameters: 86567656
  208. Training Data: ImageNet-1k
  209. In Collection: MAE
  210. Results:
  211. - Task: Image Classification
  212. Dataset: ImageNet-1k
  213. Metrics:
  214. Top 1 Accuracy: 62.5
  215. Weights: null
  216. Config: configs/mae/benchmarks/vit-base-p16_8xb2048-linear-coslr-90e_in1k.py
  217. - Name: vit-base-p16_mae-800e-pre_8xb2048-linear-coslr-90e_in1k
  218. Metadata:
  219. Epochs: 90
  220. Batch Size: 16384
  221. FLOPs: 17581972992
  222. Parameters: 86567656
  223. Training Data: ImageNet-1k
  224. In Collection: MAE
  225. Results:
  226. - Task: Image Classification
  227. Dataset: ImageNet-1k
  228. Metrics:
  229. Top 1 Accuracy: 65.1
  230. Weights: null
  231. Config: configs/mae/benchmarks/vit-base-p16_8xb2048-linear-coslr-90e_in1k.py
  232. - Name: vit-base-p16_mae-1600e-pre_8xb2048-linear-coslr-90e_in1k
  233. Metadata:
  234. Epochs: 90
  235. Batch Size: 16384
  236. FLOPs: 17581972992
  237. Parameters: 86567656
  238. Training Data: ImageNet-1k
  239. In Collection: MAE
  240. Results:
  241. - Task: Image Classification
  242. Dataset: ImageNet-1k
  243. Metrics:
  244. Top 1 Accuracy: 67.1
  245. Weights: null
  246. Config: configs/mae/benchmarks/vit-base-p16_8xb2048-linear-coslr-90e_in1k.py
  247. - Name: vit-large-p16_mae-400e-pre_8xb128-coslr-50e_in1k
  248. Metadata:
  249. Epochs: 50
  250. Batch Size: 1024
  251. FLOPs: 61602103296
  252. Parameters: 304324584
  253. Training Data: ImageNet-1k
  254. In Collection: MAE
  255. Results:
  256. - Task: Image Classification
  257. Dataset: ImageNet-1k
  258. Metrics:
  259. Top 1 Accuracy: 85.2
  260. Weights: null
  261. Config: configs/mae/benchmarks/vit-large-p16_8xb128-coslr-50e_in1k.py
  262. - Name: vit-large-p16_mae-800e-pre_8xb128-coslr-50e_in1k
  263. Metadata:
  264. Epochs: 50
  265. Batch Size: 1024
  266. FLOPs: 61602103296
  267. Parameters: 304324584
  268. Training Data: ImageNet-1k
  269. In Collection: MAE
  270. Results:
  271. - Task: Image Classification
  272. Dataset: ImageNet-1k
  273. Metrics:
  274. Top 1 Accuracy: 85.4
  275. Weights: null
  276. Config: configs/mae/benchmarks/vit-large-p16_8xb128-coslr-50e_in1k.py
  277. - Name: vit-large-p16_mae-1600e-pre_8xb128-coslr-50e_in1k
  278. Metadata:
  279. Epochs: 50
  280. Batch Size: 1024
  281. FLOPs: 61602103296
  282. Parameters: 304324584
  283. Training Data: ImageNet-1k
  284. In Collection: MAE
  285. Results:
  286. - Task: Image Classification
  287. Dataset: ImageNet-1k
  288. Metrics:
  289. Top 1 Accuracy: 85.7
  290. Weights: null
  291. Config: configs/mae/benchmarks/vit-large-p16_8xb128-coslr-50e_in1k.py
  292. - Name: vit-large-p16_mae-400e-pre_8xb2048-linear-coslr-90e_in1k
  293. Metadata:
  294. Epochs: 90
  295. Batch Size: 16384
  296. FLOPs: 61603112960
  297. Parameters: 304326632
  298. Training Data: ImageNet-1k
  299. In Collection: MAE
  300. Results:
  301. - Task: Image Classification
  302. Dataset: ImageNet-1k
  303. Metrics:
  304. Top 1 Accuracy: 70.7
  305. Weights: null
  306. Config: configs/mae/benchmarks/vit-large-p16_8xb2048-linear-coslr-90e_in1k.py
  307. - Name: vit-large-p16_mae-800e-pre_8xb2048-linear-coslr-90e_in1k
  308. Metadata:
  309. Epochs: 90
  310. Batch Size: 16384
  311. FLOPs: 61603112960
  312. Parameters: 304326632
  313. Training Data: ImageNet-1k
  314. In Collection: MAE
  315. Results:
  316. - Task: Image Classification
  317. Dataset: ImageNet-1k
  318. Metrics:
  319. Top 1 Accuracy: 73.7
  320. Weights: null
  321. Config: configs/mae/benchmarks/vit-large-p16_8xb2048-linear-coslr-90e_in1k.py
  322. - Name: vit-large-p16_mae-1600e-pre_8xb2048-linear-coslr-90e_in1k
  323. Metadata:
  324. Epochs: 90
  325. Batch Size: 16384
  326. FLOPs: 61603112960
  327. Parameters: 304326632
  328. Training Data: ImageNet-1k
  329. In Collection: MAE
  330. Results:
  331. - Task: Image Classification
  332. Dataset: ImageNet-1k
  333. Metrics:
  334. Top 1 Accuracy: 75.5
  335. Weights: null
  336. Config: configs/mae/benchmarks/vit-large-p16_8xb2048-linear-coslr-90e_in1k.py
  337. - Name: vit-huge-p14_mae-1600e-pre_8xb128-coslr-50e_in1k
  338. Metadata:
  339. Epochs: 50
  340. Batch Size: 1024
  341. FLOPs: 167399096320
  342. Parameters: 632043240
  343. Training Data: ImageNet-1k
  344. In Collection: MAE
  345. Results:
  346. - Task: Image Classification
  347. Dataset: ImageNet-1k
  348. Metrics:
  349. Top 1 Accuracy: 86.9
  350. Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-huge-p16_8xb512-fp16-coslr-1600e_in1k/vit-huge-p16_ft-8xb128-coslr-50e_in1k/vit-huge-p16_ft-8xb128-coslr-50e_in1k_20220916-0bfc9bfd.pth
  351. Config: configs/mae/benchmarks/vit-huge-p14_8xb128-coslr-50e_in1k.py
  352. - Name: vit-huge-p14_mae-1600e-pre_32xb8-coslr-50e_in1k-448px
  353. Metadata:
  354. Epochs: 50
  355. Batch Size: 256
  356. FLOPs: 732131983360
  357. Parameters: 633026280
  358. Training Data: ImageNet-1k
  359. In Collection: MAE
  360. Results:
  361. - Task: Image Classification
  362. Dataset: ImageNet-1k
  363. Metrics:
  364. Top 1 Accuracy: 87.3
  365. Weights: https://download.openmmlab.com/mmselfsup/1.x/mae/mae_vit-huge-p16_8xb512-fp16-coslr-1600e_in1k/vit-huge-p16_ft-32xb8-coslr-50e_in1k-448/vit-huge-p16_ft-32xb8-coslr-50e_in1k-448_20220916-95b6a0ce.pth
  366. Config: configs/mae/benchmarks/vit-huge-p14_32xb8-coslr-50e_in1k-448px.py