# metafile.yml
#
# Model-index style metadata for the MiniGPT-4 configs: one collection entry
# plus the model checkpoints that belong to it.
# NOTE(review): nesting was reconstructed from a flattened copy of this file;
# confirm against the consumer's schema before relying on it.

Collections:
  - Name: MiniGPT4
    Metadata:
      Architecture:
        - Transformer
        - Gated Cross-Attention Dense
    Paper:
      # Quoted because the title contains ": ", which would otherwise be
      # parsed as a nested mapping.
      Title: 'MiniGPT-4: Enhancing Vision-language Understanding with Advanced Large Language Models'
      URL: https://arxiv.org/abs/2304.10592
    README: configs/minigpt4/README.md

Models:
  # Each model refers back to the collection above through "In Collection".
  - Name: minigpt-4_vicuna-7b_caption
    Metadata:
      FLOPs: null  # no FLOPs value recorded
      Parameters: 8121315072
    In Collection: MiniGPT4
    Results:
      - Task: Image Caption
        Dataset: COCO
        Metrics: null  # no metric values recorded for this result
    Weights: https://download.openmmlab.com/mmclassification/v1/minigpt4/minigpt-4_linear_vicuna7b_20230615-714b5f52.pth
    Config: configs/minigpt4/minigpt-4_vicuna-7b_caption.py
    Converted From:
      Weights: https://github.com/Vision-CAIR/MiniGPT-4/tree/main
      Code: https://github.com/Vision-CAIR/MiniGPT-4/tree/main
  # This entry lists no "Converted From" section.
  - Name: minigpt-4_baichuan-7b_caption
    Metadata:
      FLOPs: null  # no FLOPs value recorded
      Parameters: 8094769024
    In Collection: MiniGPT4
    Results:
      - Task: Image Caption
        Dataset: COCO
        Metrics: null  # no metric values recorded for this result
    Weights: https://download.openmmlab.com/mmclassification/v1/minigpt4/minigpt-4_linear_baichuan7b_20231011-5dca7ed6.pth
    Config: configs/minigpt4/minigpt-4_baichuan-7b_caption.py