metafile.yml 2.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869
  # Collection entry for BEiTv2. Model entries in this file point back to it
  # through their `In Collection: BEiTv2` field.
  Collections:
  - Name: BEiTv2
    Metadata:
      # Building blocks listed for this collection.
      Architecture:
      - Attention Dropout
      - Convolution
      - Dense Connections
      - Dropout
      - GELU
      - Layer Normalization
      - Multi-Head Attention
      - Scaled Dot-Product Attention
      - Tanh Activation
    Paper:
      # Quoted because the title contains ": ", which a plain scalar would
      # treat as the start of a nested mapping.
      Title: 'BEiT v2: Masked Image Modeling with Vector-Quantized Visual Tokenizers'
      URL: https://arxiv.org/abs/2208.06366
    README: configs/beitv2/README.md
    Code:
      URL: https://github.com/open-mmlab/mmpretrain/blob/main/mmpretrain/models/backbones/beit.py
      Version: v1.0.0rc4
  # One list entry per published checkpoint.
  Models:
  - Name: beitv2_beit-base-p16_8xb256-amp-coslr-300e_in1k
    Metadata:
      Epochs: 300
      # Presumably 8 x 256, matching `8xb256` in the name -- TODO confirm.
      Batch Size: 2048
      FLOPs: 17581223424
      Parameters: 192811376
      Training Data: ImageNet-1k
    In Collection: BEiTv2
    # Explicit null: no benchmark metrics are recorded for this checkpoint.
    Results: null
    Weights: https://download.openmmlab.com/mmselfsup/1.x/beitv2/beitv2_vit-base-p16_8xb256-amp-coslr-300e_in1k/beitv2_vit-base-p16_8xb256-amp-coslr-300e_in1k_20221212-a157be30.pth
    Config: configs/beitv2/beitv2_beit-base-p16_8xb256-amp-coslr-300e_in1k.py
    # Each item is the `Name` of another model entry in this file.
    Downstream:
    - beit-base-p16_beitv2-pre_8xb128-coslr-100e_in1k
  # This name is the one listed under `Downstream` of
  # beitv2_beit-base-p16_8xb256-amp-coslr-300e_in1k.
  - Name: beit-base-p16_beitv2-pre_8xb128-coslr-100e_in1k
    Metadata:
      Epochs: 100
      # Presumably 8 x 128, matching `8xb128` in the name -- TODO confirm.
      Batch Size: 1024
      FLOPs: 17581219584
      Parameters: 86530984
      Training Data: ImageNet-1k
    In Collection: BEiTv2
    Results:
    - Task: Image Classification
      Dataset: ImageNet-1k
      Metrics:
        Top 1 Accuracy: 85.0
    Weights: https://download.openmmlab.com/mmselfsup/1.x/beitv2/beitv2_vit-base-p16_8xb256-amp-coslr-300e_in1k/vit-base-p16_ft-8xb128-coslr-100e_in1k/vit-base-p16_ft-8xb128-coslr-100e_in1k_20221212-d1c0789e.pth
    Config: configs/beitv2/benchmarks/beit-base-p16_8xb128-coslr-100e_in1k.py
  # No Epochs or Batch Size are recorded for this entry; its weights are
  # converted from the external checkpoint given under `Converted From`.
  - Name: beit-base-p16_beitv2-in21k-pre_3rdparty_in1k
    Metadata:
      FLOPs: 17581219584
      Parameters: 86530984
      # A list here, because more than one dataset is named.
      Training Data:
      - ImageNet-21k
      - ImageNet-1k
    In Collection: BEiTv2
    Results:
    - Task: Image Classification
      Dataset: ImageNet-1k
      Metrics:
        Top 1 Accuracy: 86.47
        Top 5 Accuracy: 97.99
    Weights: https://download.openmmlab.com/mmclassification/v0/beit/beitv2-base_3rdparty_in1k_20221114-73e11905.pth
    Config: configs/beitv2/benchmarks/beit-base-p16_8xb64_in1k.py
    Converted From:
      Weights: https://conversationhub.blob.core.windows.net/beit-share-public/beitv2/beitv2_base_patch16_224_pt1k_ft21kto1k.pth
      Code: https://github.com/microsoft/unilm/tree/master/beit2