gated-david / MODELS_INDEX.json
AbstractPhil's picture
Update models index - David-decoupled-cantor_scale @ 78.90%
6a31c3e verified
{
"repository": "AbstractPhil/gated-david",
"updated": "2025-11-04T15:57:32.580623",
"models": [
{
"model_name": "David-decoupled-cantor_scale",
"run_id": "20251104_144102",
"timestamp": "2025-11-04T15:01:54.717226",
"best_val_acc": 85.25,
"best_epoch": 4,
"num_scales": 8,
"scales": [
384,
512,
768,
1024,
1280,
1536,
1792,
2048
],
"parameters": 70207625,
"sharing_mode": "decoupled",
"fusion_mode": "cantor_scale",
"preset": "clip_vit_bigg14_cantor_decoupled",
"weights_path": "weights/David-decoupled-cantor_scale/20251104_144102/best_model_acc85.25.safetensors",
"config_path": "weights/David-decoupled-cantor_scale/20251104_144102/david_config.json",
"history_path": "weights/David-decoupled-cantor_scale/20251104_144102/training_history.json"
},
{
"model_name": "David-partial_shared-cantor_scale",
"run_id": "20251104_140742",
"timestamp": "2025-11-04T14:34:12.310619",
"best_val_acc": 84.916,
"best_epoch": 4,
"num_scales": 8,
"scales": [
384,
512,
768,
1024,
1280,
1536,
1792,
2048
],
"parameters": 82601993,
"sharing_mode": "partial_shared",
"fusion_mode": "cantor_scale",
"preset": "clip_vit_bigg14_cantor",
"weights_path": "weights/David-partial_shared-cantor_scale/20251104_140742/best_model_acc84.92.safetensors",
"config_path": "weights/David-partial_shared-cantor_scale/20251104_140742/david_config.json",
"history_path": "weights/David-partial_shared-cantor_scale/20251104_140742/training_history.json"
},
{
"model_name": "David-partial_shared-deep_efficiency",
"run_id": "20251012_181608",
"timestamp": "2025-10-12T18:49:28.035826",
"best_val_acc": 84.726,
"best_epoch": 2,
"num_scales": 8,
"scales": [
384,
512,
768,
1024,
1280,
1536,
1792,
2048
],
"parameters": 60814373,
"sharing_mode": "partial_shared",
"fusion_mode": "deep_efficiency",
"preset": "clip_vit_bigg14",
"weights_path": "weights/David-partial_shared-deep_efficiency/20251012_181608/best_model_acc84.73.safetensors",
"config_path": "weights/David-partial_shared-deep_efficiency/20251012_181608/david_config.json",
"history_path": "weights/David-partial_shared-deep_efficiency/20251012_181608/training_history.json"
},
{
"model_name": "David-partial_shared-deep_efficiency",
"run_id": "20251012_161107",
"timestamp": "2025-10-12T16:46:37.288111",
"best_val_acc": 84.66,
"best_epoch": 9,
"num_scales": 8,
"scales": [
384,
512,
768,
1024,
1280,
1536,
1792,
2048
],
"parameters": 60814373,
"sharing_mode": "partial_shared",
"fusion_mode": "deep_efficiency",
"preset": "clip_vit_bigg14",
"weights_path": "weights/David-partial_shared-deep_efficiency/20251012_161107/best_model_acc84.66.safetensors",
"config_path": "weights/David-partial_shared-deep_efficiency/20251012_161107/david_config.json",
"history_path": "weights/David-partial_shared-deep_efficiency/20251012_161107/training_history.json"
},
{
"model_name": "David-partial_shared-cantor_scale",
"run_id": "20251104_133602",
"timestamp": "2025-11-04T13:51:53.224432",
"best_val_acc": 82.862,
"best_epoch": 3,
"num_scales": 5,
"scales": [
384,
768,
1024,
1280,
1536
],
"parameters": 32436998,
"sharing_mode": "partial_shared",
"fusion_mode": "cantor_scale",
"preset": "clip_vit_l14_cantor",
"weights_path": "weights/David-partial_shared-cantor_scale/20251104_133602/best_model_acc82.86.safetensors",
"config_path": "weights/David-partial_shared-cantor_scale/20251104_133602/david_config.json",
"history_path": "weights/David-partial_shared-cantor_scale/20251104_133602/training_history.json"
},
{
"model_name": "David-decoupled-cantor_scale",
"run_id": "20251104_154540",
"timestamp": "2025-11-04T15:57:32.580584",
"best_val_acc": 78.904,
"best_epoch": 4,
"num_scales": 6,
"scales": [
256,
512,
768,
1024,
2048,
4096
],
"parameters": 60452103,
"sharing_mode": "decoupled",
"fusion_mode": "cantor_scale",
"preset": "clip_vit_b16_cantor_big_window",
"weights_path": "weights/David-decoupled-cantor_scale/20251104_154540/best_model_acc78.90.safetensors",
"config_path": "weights/David-decoupled-cantor_scale/20251104_154540/david_config.json",
"history_path": "weights/David-decoupled-cantor_scale/20251104_154540/training_history.json"
},
{
"model_name": "David-decoupled-cantor_scale",
"run_id": "20251104_125328",
"timestamp": "2025-11-04T13:32:58.081861",
"best_val_acc": 78.866,
"best_epoch": 4,
"num_scales": 4,
"scales": [
512,
4096,
8192,
16384
],
"parameters": 751239941,
"sharing_mode": "decoupled",
"fusion_mode": "cantor_scale",
"preset": "clip_vit_b16_cantor_decoupled_massive",
"weights_path": "weights/David-decoupled-cantor_scale/20251104_125328/best_model_acc78.87.safetensors",
"config_path": "weights/David-decoupled-cantor_scale/20251104_125328/david_config.json",
"history_path": "weights/David-decoupled-cantor_scale/20251104_125328/training_history.json"
},
{
"model_name": "David-partial_shared-cantor_scale",
"run_id": "20251104_124032",
"timestamp": "2025-11-04T12:50:54.398340",
"best_val_acc": 78.182,
"best_epoch": 4,
"num_scales": 4,
"scales": [
256,
512,
768,
1024
],
"parameters": 12895621,
"sharing_mode": "partial_shared",
"fusion_mode": "cantor_scale",
"preset": "clip_vit_b16_cantor",
"weights_path": "weights/David-partial_shared-cantor_scale/20251104_124032/best_model_acc78.18.safetensors",
"config_path": "weights/David-partial_shared-cantor_scale/20251104_124032/david_config.json",
"history_path": "weights/David-partial_shared-cantor_scale/20251104_124032/training_history.json"
},
{
"model_name": "David-partial_shared-geometric_attention",
"run_id": "20251104_122236",
"timestamp": "2025-11-04T12:32:30.016304",
"best_val_acc": 78.06,
"best_epoch": 4,
"num_scales": 4,
"scales": [
256,
512,
768,
1024
],
"parameters": 12599556,
"sharing_mode": "partial_shared",
"fusion_mode": "geometric_attention",
"preset": "clip_vit_b16_geometric",
"weights_path": "weights/David-partial_shared-geometric_attention/20251104_122236/best_model_acc78.06.safetensors",
"config_path": "weights/David-partial_shared-geometric_attention/20251104_122236/david_config.json",
"history_path": "weights/David-partial_shared-geometric_attention/20251104_122236/training_history.json"
},
{
"model_name": "David-hierarchical-progressive",
"run_id": "20251012_145649",
"timestamp": "2025-10-12T15:15:00.402465",
"best_val_acc": 76.864,
"best_epoch": 9,
"num_scales": 4,
"scales": [
256,
512,
768,
1024
],
"parameters": 10493184,
"sharing_mode": "hierarchical",
"fusion_mode": "progressive",
"preset": "hierarchical_refinement",
"weights_path": "weights/David-hierarchical-progressive/20251012_145649/best_model_acc76.86.safetensors",
"config_path": "weights/David-hierarchical-progressive/20251012_145649/david_config.json",
"history_path": "weights/David-hierarchical-progressive/20251012_145649/training_history.json"
},
{
"model_name": "David-decoupled-cantor_scale",
"run_id": "20251104_152832",
"timestamp": "2025-11-04T15:39:27.530053",
"best_val_acc": 76.498,
"best_epoch": 4,
"num_scales": 4,
"scales": [
256,
512,
768,
1024
],
"parameters": 9057029,
"sharing_mode": "decoupled",
"fusion_mode": "cantor_scale",
"preset": "clip_vit_b16_cantor",
"weights_path": "weights/David-decoupled-cantor_scale/20251104_152832/best_model_acc76.50.safetensors",
"config_path": "weights/David-decoupled-cantor_scale/20251104_152832/david_config.json",
"history_path": "weights/David-decoupled-cantor_scale/20251104_152832/training_history.json"
},
{
"model_name": "David-decoupled-deep_efficiency",
"run_id": "20251104_151233",
"timestamp": "2025-11-04T15:26:18.612383",
"best_val_acc": 75.774,
"best_epoch": 4,
"num_scales": 5,
"scales": [
256,
512,
768,
1024,
1280
],
"parameters": 14877593,
"sharing_mode": "decoupled",
"fusion_mode": "deep_efficiency",
"preset": "high_accuracy",
"weights_path": "weights/David-decoupled-deep_efficiency/20251104_151233/best_model_acc75.77.safetensors",
"config_path": "weights/David-decoupled-deep_efficiency/20251104_151233/david_config.json",
"history_path": "weights/David-decoupled-deep_efficiency/20251104_151233/training_history.json"
},
{
"model_name": "David-partial_shared-hierarchical_tree",
"run_id": "20251012_152245",
"timestamp": "2025-10-12T15:40:37.893214",
"best_val_acc": 75.532,
"best_epoch": 8,
"num_scales": 4,
"scales": [
256,
512,
768,
1024
],
"parameters": 8758271,
"sharing_mode": "partial_shared",
"fusion_mode": "hierarchical_tree",
"preset": "balanced",
"weights_path": "weights/David-partial_shared-hierarchical_tree/20251012_152245/best_model_acc75.53.safetensors",
"config_path": "weights/David-partial_shared-hierarchical_tree/20251012_152245/david_config.json",
"history_path": "weights/David-partial_shared-hierarchical_tree/20251012_152245/training_history.json"
},
{
"model_name": "David-hierarchical-progressive",
"run_id": "20251012_151647",
"timestamp": "2025-10-12T15:18:31.111538",
"best_val_acc": 72.232,
"best_epoch": 0,
"num_scales": 4,
"scales": [
256,
512,
768,
1024
],
"parameters": 10493184,
"sharing_mode": "hierarchical",
"fusion_mode": "progressive",
"preset": "hierarchical_refinement",
"weights_path": "weights/David-hierarchical-progressive/20251012_151647/best_model_acc72.23.safetensors",
"config_path": "weights/David-hierarchical-progressive/20251012_151647/david_config.json",
"history_path": "weights/David-hierarchical-progressive/20251012_151647/training_history.json"
},
{
"model_name": "David-fully_shared-weighted_sum",
"run_id": "20251012_135249",
"timestamp": "2025-10-12T14:09:57.535871",
"best_val_acc": 71.994,
"best_epoch": 9,
"num_scales": 2,
"scales": [
256,
512
],
"parameters": 656898,
"sharing_mode": "fully_shared",
"fusion_mode": "weighted_sum",
"preset": "small_fast",
"weights_path": "weights/David-fully_shared-weighted_sum/20251012_135249/best_model_acc71.99.safetensors",
"config_path": "weights/David-fully_shared-weighted_sum/20251012_135249/david_config.json",
"history_path": "weights/David-fully_shared-weighted_sum/20251012_135249/training_history.json"
},
{
"model_name": "David-fully_shared-weighted_sum",
"run_id": "20251012_141246",
"timestamp": "2025-10-12T14:29:34.375797",
"best_val_acc": 71.726,
"best_epoch": 9,
"num_scales": 2,
"scales": [
256,
512
],
"parameters": 656898,
"sharing_mode": "fully_shared",
"fusion_mode": "weighted_sum",
"preset": "small_fast",
"weights_path": "weights/David-fully_shared-weighted_sum/20251012_141246/best_model_acc71.73.safetensors",
"config_path": "weights/David-fully_shared-weighted_sum/20251012_141246/david_config.json",
"history_path": "weights/David-fully_shared-weighted_sum/20251012_141246/training_history.json"
}
],
"total_models": 16
}