Talk2DINO-ViTL / config.json
lorebianchi98's picture
Push model using huggingface_hub.
4313f8a verified
raw
history blame
529 Bytes
{
"avg_self_attn_token": false,
"clip_model_name": "ViT-B/16",
"disentangled_self_attn_token": true,
"is_eval": true,
"keep_cls": false,
"keep_end_seq": false,
"loss": null,
"model_name": "dinov2_vitl14_reg",
"pre_trained": true,
"proj_class": "vitl_mlp_infonce",
"proj_model": "ProjectionLayer",
"proj_name": "vitl_mlp_infonce",
"resize_dim": 518,
"type": "DINOText",
"unfreeze_last_image_layer": false,
"unfreeze_last_text_layer": false,
"use_avg_text_token": false,
"with_bg_clean": false
}