Zero-Shot Image Classification
OpenCLIP
ONNX
Safetensors
Transformers
Transformers.js
English
siglip
clip
e-commerce
fashion
multimodal retrieval
custom_code
Instructions to use Marqo/marqo-fashionSigLIP with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- OpenCLIP
How to use Marqo/marqo-fashionSigLIP with OpenCLIP:
```python
import open_clip

model, preprocess_train, preprocess_val = open_clip.create_model_and_transforms('hf-hub:Marqo/marqo-fashionSigLIP')
tokenizer = open_clip.get_tokenizer('hf-hub:Marqo/marqo-fashionSigLIP')
```
- Transformers
How to use Marqo/marqo-fashionSigLIP with Transformers:
```python
# Use a pipeline as a high-level helper
from transformers import pipeline

pipe = pipeline("zero-shot-image-classification", model="Marqo/marqo-fashionSigLIP", trust_remote_code=True)
pipe(
    "https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/hub/parrots.png",
    candidate_labels=["animals", "humans", "landscape"],
)
```
```python
# Load model directly
from transformers import AutoModel

model = AutoModel.from_pretrained("Marqo/marqo-fashionSigLIP", trust_remote_code=True, dtype="auto")
```
- Transformers.js
How to use Marqo/marqo-fashionSigLIP with Transformers.js:
```js
// npm i @huggingface/transformers
import { pipeline } from '@huggingface/transformers';

// Allocate pipeline
const pipe = await pipeline('zero-shot-image-classification', 'Marqo/marqo-fashionSigLIP');
```
- Notebooks
- Google Colab
- Kaggle
```json
{
  "model_cfg": {
    "embed_dim": 768,
    "init_logit_bias": -10,
    "custom_text": true,
    "vision_cfg": {
      "image_size": 224,
      "timm_model_name": "vit_base_patch16_siglip_224",
      "timm_model_pretrained": false,
      "timm_pool": "map",
      "timm_proj": "none"
    },
    "text_cfg": {
      "context_length": 64,
      "vocab_size": 32000,
      "hf_tokenizer_name": "timm/ViT-B-16-SigLIP",
      "tokenizer_kwargs": {
        "clean": "canonicalize"
      },
      "width": 768,
      "heads": 12,
      "layers": 12,
      "no_causal_mask": true,
      "proj_bias": true,
      "pool_type": "last",
      "norm_kwargs": {
        "eps": 1e-06
      }
    }
  },
  "preprocess_cfg": {
    "mean": [
      0.5,
      0.5,
      0.5
    ],
    "std": [
      0.5,
      0.5,
      0.5
    ],
    "interpolation": "bicubic",
    "resize_mode": "squash"
  }
}
```