{
  "model_config_dict": {
    "agg_arch": "QAA",
    "agg_config": {
      "attn_arch": "conv",
      "cluster_dim": 128,
      "divide": 1,
      "divide_ratio": [
        1,
        1,
        1,
        0
      ],
      "dropout": 0.3,
      "feature_nheads": 16,
      "freeze": "none",
      "num_channels": 768,
      "num_clusters": 16,
      "num_queries": 256,
      "out_norm": false,
      "score_nheads": 16,
      "score_norm": "none",
      "self_attn_out_norm": true,
      "skip_connection": "none",
      "token_dim": 0
    },
    "backbone_arch": "dinov2_vitb14",
    "backbone_config": {
      "cluster_dim": 16,
      "divide": 1,
      "divide_ratio": [
        1,
        1,
        1,
        0
      ],
      "domain_prompt": "none",
      "dropout": 0.3,
      "multi_scale": "1",
      "norm_layer": true,
      "num_clusters": 16,
      "num_trainable_blocks": 2,
      "return_token": true,
      "token_dim": 256
    }
  }
}