mixvideo-v2/cargos/tvai-v2/models/ViT-gopt-16-SigLIP2-384.json

33 lines
823 B
JSON

{
"embed_dim": 1536,
"init_logit_bias": -10,
"custom_text": true,
"vision_cfg": {
"image_size": 384,
"timm_model_name": "vit_giantopt_patch16_siglip_384",
"timm_model_pretrained": false,
"timm_pool": "map",
"timm_proj": "none"
},
"text_cfg": {
"context_length": 64,
"vocab_size": 256000,
"hf_tokenizer_name": "timm/ViT-gopt-16-SigLIP2-384",
"tokenizer_kwargs": {
"clean": "canonicalize"
},
"width": 1152,
"heads": 16,
"layers": 27,
"mlp_ratio": 3.7362,
"no_causal_mask": true,
"proj_bias": true,
"pool_type": "last",
"norm_kwargs":{
"eps": 1e-6
},
"act_kwargs": {
"approximate": "tanh"
}
}
}