{ "repository": "AbstractPhil/gated-david", "updated": "2025-11-04T15:57:32.580623", "models": [ { "model_name": "David-decoupled-cantor_scale", "run_id": "20251104_144102", "timestamp": "2025-11-04T15:01:54.717226", "best_val_acc": 85.25, "best_epoch": 4, "num_scales": 8, "scales": [ 384, 512, 768, 1024, 1280, 1536, 1792, 2048 ], "parameters": 70207625, "sharing_mode": "decoupled", "fusion_mode": "cantor_scale", "preset": "clip_vit_bigg14_cantor_decoupled", "weights_path": "weights/David-decoupled-cantor_scale/20251104_144102/best_model_acc85.25.safetensors", "config_path": "weights/David-decoupled-cantor_scale/20251104_144102/david_config.json", "history_path": "weights/David-decoupled-cantor_scale/20251104_144102/training_history.json" }, { "model_name": "David-partial_shared-cantor_scale", "run_id": "20251104_140742", "timestamp": "2025-11-04T14:34:12.310619", "best_val_acc": 84.916, "best_epoch": 4, "num_scales": 8, "scales": [ 384, 512, 768, 1024, 1280, 1536, 1792, 2048 ], "parameters": 82601993, "sharing_mode": "partial_shared", "fusion_mode": "cantor_scale", "preset": "clip_vit_bigg14_cantor", "weights_path": "weights/David-partial_shared-cantor_scale/20251104_140742/best_model_acc84.92.safetensors", "config_path": "weights/David-partial_shared-cantor_scale/20251104_140742/david_config.json", "history_path": "weights/David-partial_shared-cantor_scale/20251104_140742/training_history.json" }, { "model_name": "David-partial_shared-deep_efficiency", "run_id": "20251012_181608", "timestamp": "2025-10-12T18:49:28.035826", "best_val_acc": 84.726, "best_epoch": 2, "num_scales": 8, "scales": [ 384, 512, 768, 1024, 1280, 1536, 1792, 2048 ], "parameters": 60814373, "sharing_mode": "partial_shared", "fusion_mode": "deep_efficiency", "preset": "clip_vit_bigg14", "weights_path": "weights/David-partial_shared-deep_efficiency/20251012_181608/best_model_acc84.73.safetensors", "config_path": "weights/David-partial_shared-deep_efficiency/20251012_181608/david_config.json", "history_path": "weights/David-partial_shared-deep_efficiency/20251012_181608/training_history.json" }, { "model_name": "David-partial_shared-deep_efficiency", "run_id": "20251012_161107", "timestamp": "2025-10-12T16:46:37.288111", "best_val_acc": 84.66, "best_epoch": 9, "num_scales": 8, "scales": [ 384, 512, 768, 1024, 1280, 1536, 1792, 2048 ], "parameters": 60814373, "sharing_mode": "partial_shared", "fusion_mode": "deep_efficiency", "preset": "clip_vit_bigg14", "weights_path": "weights/David-partial_shared-deep_efficiency/20251012_161107/best_model_acc84.66.safetensors", "config_path": "weights/David-partial_shared-deep_efficiency/20251012_161107/david_config.json", "history_path": "weights/David-partial_shared-deep_efficiency/20251012_161107/training_history.json" }, { "model_name": "David-partial_shared-cantor_scale", "run_id": "20251104_133602", "timestamp": "2025-11-04T13:51:53.224432", "best_val_acc": 82.862, "best_epoch": 3, "num_scales": 5, "scales": [ 384, 768, 1024, 1280, 1536 ], "parameters": 32436998, "sharing_mode": "partial_shared", "fusion_mode": "cantor_scale", "preset": "clip_vit_l14_cantor", "weights_path": "weights/David-partial_shared-cantor_scale/20251104_133602/best_model_acc82.86.safetensors", "config_path": "weights/David-partial_shared-cantor_scale/20251104_133602/david_config.json", "history_path": "weights/David-partial_shared-cantor_scale/20251104_133602/training_history.json" }, { "model_name": "David-decoupled-cantor_scale", "run_id": "20251104_154540", "timestamp": "2025-11-04T15:57:32.580584", "best_val_acc": 78.904, "best_epoch": 4, "num_scales": 6, "scales": [ 256, 512, 768, 1024, 2048, 4096 ], "parameters": 60452103, "sharing_mode": "decoupled", "fusion_mode": "cantor_scale", "preset": "clip_vit_b16_cantor_big_window", "weights_path": "weights/David-decoupled-cantor_scale/20251104_154540/best_model_acc78.90.safetensors", "config_path": "weights/David-decoupled-cantor_scale/20251104_154540/david_config.json", "history_path": "weights/David-decoupled-cantor_scale/20251104_154540/training_history.json" }, { "model_name": "David-decoupled-cantor_scale", "run_id": "20251104_125328", "timestamp": "2025-11-04T13:32:58.081861", "best_val_acc": 78.866, "best_epoch": 4, "num_scales": 4, "scales": [ 512, 4096, 8192, 16384 ], "parameters": 751239941, "sharing_mode": "decoupled", "fusion_mode": "cantor_scale", "preset": "clip_vit_b16_cantor_decoupled_massive", "weights_path": "weights/David-decoupled-cantor_scale/20251104_125328/best_model_acc78.87.safetensors", "config_path": "weights/David-decoupled-cantor_scale/20251104_125328/david_config.json", "history_path": "weights/David-decoupled-cantor_scale/20251104_125328/training_history.json" }, { "model_name": "David-partial_shared-cantor_scale", "run_id": "20251104_124032", "timestamp": "2025-11-04T12:50:54.398340", "best_val_acc": 78.182, "best_epoch": 4, "num_scales": 4, "scales": [ 256, 512, 768, 1024 ], "parameters": 12895621, "sharing_mode": "partial_shared", "fusion_mode": "cantor_scale", "preset": "clip_vit_b16_cantor", "weights_path": "weights/David-partial_shared-cantor_scale/20251104_124032/best_model_acc78.18.safetensors", "config_path": "weights/David-partial_shared-cantor_scale/20251104_124032/david_config.json", "history_path": "weights/David-partial_shared-cantor_scale/20251104_124032/training_history.json" }, { "model_name": "David-partial_shared-geometric_attention", "run_id": "20251104_122236", "timestamp": "2025-11-04T12:32:30.016304", "best_val_acc": 78.06, "best_epoch": 4, "num_scales": 4, "scales": [ 256, 512, 768, 1024 ], "parameters": 12599556, "sharing_mode": "partial_shared", "fusion_mode": "geometric_attention", "preset": "clip_vit_b16_geometric", "weights_path": "weights/David-partial_shared-geometric_attention/20251104_122236/best_model_acc78.06.safetensors", "config_path": "weights/David-partial_shared-geometric_attention/20251104_122236/david_config.json", "history_path": "weights/David-partial_shared-geometric_attention/20251104_122236/training_history.json" }, { "model_name": "David-hierarchical-progressive", "run_id": "20251012_145649", "timestamp": "2025-10-12T15:15:00.402465", "best_val_acc": 76.864, "best_epoch": 9, "num_scales": 4, "scales": [ 256, 512, 768, 1024 ], "parameters": 10493184, "sharing_mode": "hierarchical", "fusion_mode": "progressive", "preset": "hierarchical_refinement", "weights_path": "weights/David-hierarchical-progressive/20251012_145649/best_model_acc76.86.safetensors", "config_path": "weights/David-hierarchical-progressive/20251012_145649/david_config.json", "history_path": "weights/David-hierarchical-progressive/20251012_145649/training_history.json" }, { "model_name": "David-decoupled-cantor_scale", "run_id": "20251104_152832", "timestamp": "2025-11-04T15:39:27.530053", "best_val_acc": 76.498, "best_epoch": 4, "num_scales": 4, "scales": [ 256, 512, 768, 1024 ], "parameters": 9057029, "sharing_mode": "decoupled", "fusion_mode": "cantor_scale", "preset": "clip_vit_b16_cantor", "weights_path": "weights/David-decoupled-cantor_scale/20251104_152832/best_model_acc76.50.safetensors", "config_path": "weights/David-decoupled-cantor_scale/20251104_152832/david_config.json", "history_path": "weights/David-decoupled-cantor_scale/20251104_152832/training_history.json" }, { "model_name": "David-decoupled-deep_efficiency", "run_id": "20251104_151233", "timestamp": "2025-11-04T15:26:18.612383", "best_val_acc": 75.774, "best_epoch": 4, "num_scales": 5, "scales": [ 256, 512, 768, 1024, 1280 ], "parameters": 14877593, "sharing_mode": "decoupled", "fusion_mode": "deep_efficiency", "preset": "high_accuracy", "weights_path": "weights/David-decoupled-deep_efficiency/20251104_151233/best_model_acc75.77.safetensors", "config_path": "weights/David-decoupled-deep_efficiency/20251104_151233/david_config.json", "history_path": "weights/David-decoupled-deep_efficiency/20251104_151233/training_history.json" }, { "model_name": "David-partial_shared-hierarchical_tree", "run_id": "20251012_152245", "timestamp": "2025-10-12T15:40:37.893214", "best_val_acc": 75.532, "best_epoch": 8, "num_scales": 4, "scales": [ 256, 512, 768, 1024 ], "parameters": 8758271, "sharing_mode": "partial_shared", "fusion_mode": "hierarchical_tree", "preset": "balanced", "weights_path": "weights/David-partial_shared-hierarchical_tree/20251012_152245/best_model_acc75.53.safetensors", "config_path": "weights/David-partial_shared-hierarchical_tree/20251012_152245/david_config.json", "history_path": "weights/David-partial_shared-hierarchical_tree/20251012_152245/training_history.json" }, { "model_name": "David-hierarchical-progressive", "run_id": "20251012_151647", "timestamp": "2025-10-12T15:18:31.111538", "best_val_acc": 72.232, "best_epoch": 0, "num_scales": 4, "scales": [ 256, 512, 768, 1024 ], "parameters": 10493184, "sharing_mode": "hierarchical", "fusion_mode": "progressive", "preset": "hierarchical_refinement", "weights_path": "weights/David-hierarchical-progressive/20251012_151647/best_model_acc72.23.safetensors", "config_path": "weights/David-hierarchical-progressive/20251012_151647/david_config.json", "history_path": "weights/David-hierarchical-progressive/20251012_151647/training_history.json" }, { "model_name": "David-fully_shared-weighted_sum", "run_id": "20251012_135249", "timestamp": "2025-10-12T14:09:57.535871", "best_val_acc": 71.994, "best_epoch": 9, "num_scales": 2, "scales": [ 256, 512 ], "parameters": 656898, "sharing_mode": "fully_shared", "fusion_mode": "weighted_sum", "preset": "small_fast", "weights_path": "weights/David-fully_shared-weighted_sum/20251012_135249/best_model_acc71.99.safetensors", "config_path": "weights/David-fully_shared-weighted_sum/20251012_135249/david_config.json", "history_path": "weights/David-fully_shared-weighted_sum/20251012_135249/training_history.json" }, { "model_name": "David-fully_shared-weighted_sum", "run_id": "20251012_141246", "timestamp": "2025-10-12T14:29:34.375797", "best_val_acc": 71.726, "best_epoch": 9, "num_scales": 2, "scales": [ 256, 512 ], "parameters": 656898, "sharing_mode": "fully_shared", "fusion_mode": "weighted_sum", "preset": "small_fast", "weights_path": "weights/David-fully_shared-weighted_sum/20251012_141246/best_model_acc71.73.safetensors", "config_path": "weights/David-fully_shared-weighted_sum/20251012_141246/david_config.json", "history_path": "weights/David-fully_shared-weighted_sum/20251012_141246/training_history.json" } ], "total_models": 16 }