Files
DiffSynth-Studio/diffsynth/extensions/QualityMetric/open_clip/model_configs/coca_roberta-ViT-B-32.json
2025-02-14 12:39:06 +08:00

25 lines
517 B
JSON

{
"embed_dim": 512,
"vision_cfg": {
"image_size": 224,
"layers": 12,
"width": 768,
"patch_size": 32,
"output_tokens": true
},
"text_cfg": {
"hf_model_name": "roberta-base",
"hf_tokenizer_name": "roberta-base",
"proj": "linear",
"width": 768,
"output_tokens": true
},
"multimodal_cfg": {
"context_length": 76,
"width": 768,
"heads": 8,
"layers": 12
},
"custom_text": true
}