license: mit
datasets:
- TIGER-Lab/MMEB-train
language:
- en
base_model:
- microsoft/Phi-3.5-vision-instruct
library_name: transformers
tags:
- Retrieval
- Multimodal
- Embedding
pipeline_tag: image-text-to-text