| { | |
| "repository": "AbstractPhil/david-shared-space", | |
| "updated": "2025-10-13T01:33:24.619384", | |
| "models": [ | |
| { | |
| "model_name": "David-partial_shared-hierarchical_tree", | |
| "run_id": "20251012_194945", | |
| "timestamp": "2025-10-12T20:21:46.311771", | |
| "best_val_acc": 75.74, | |
| "best_epoch": 9, | |
| "num_scales": 4, | |
| "scales": [ | |
| 256, | |
| 512, | |
| 768, | |
| 1024 | |
| ], | |
| "parameters": 8758271, | |
| "sharing_mode": "partial_shared", | |
| "fusion_mode": "hierarchical_tree", | |
| "preset": "balanced", | |
| "weights_path": "weights/David-partial_shared-hierarchical_tree/20251012_194945/best_model_acc75.74.safetensors", | |
| "config_path": "weights/David-partial_shared-hierarchical_tree/20251012_194945/david_config.json", | |
| "history_path": "weights/David-partial_shared-hierarchical_tree/20251012_194945/training_history.json" | |
| }, | |
| { | |
| "model_name": "David-partial_shared-hierarchical_tree", | |
| "run_id": "20251012_210041", | |
| "timestamp": "2025-10-12T21:45:34.243260", | |
| "best_val_acc": 74.22733333333333, | |
| "best_epoch": 7, | |
| "num_scales": 4, | |
| "scales": [ | |
| 256, | |
| 512, | |
| 768, | |
| 1024 | |
| ], | |
| "parameters": 8758271, | |
| "sharing_mode": "partial_shared", | |
| "fusion_mode": "hierarchical_tree", | |
| "preset": "balanced", | |
| "weights_path": "weights/David-partial_shared-hierarchical_tree/20251012_210041/best_model_acc74.23.safetensors", | |
| "config_path": "weights/David-partial_shared-hierarchical_tree/20251012_210041/david_config.json", | |
| "history_path": "weights/David-partial_shared-hierarchical_tree/20251012_210041/training_history.json" | |
| }, | |
| { | |
| "model_name": "David-partial_shared-hierarchical_tree", | |
| "run_id": "20251012_191456", | |
| "timestamp": "2025-10-12T19:48:30.099231", | |
| "best_val_acc": 73.695, | |
| "best_epoch": 9, | |
| "num_scales": 4, | |
| "scales": [ | |
| 256, | |
| 512, | |
| 768, | |
| 1024 | |
| ], | |
| "parameters": 8758271, | |
| "sharing_mode": "partial_shared", | |
| "fusion_mode": "hierarchical_tree", | |
| "preset": "balanced", | |
| "weights_path": "weights/David-partial_shared-hierarchical_tree/20251012_191456/best_model_acc73.69.safetensors", | |
| "config_path": "weights/David-partial_shared-hierarchical_tree/20251012_191456/david_config.json", | |
| "history_path": "weights/David-partial_shared-hierarchical_tree/20251012_191456/training_history.json" | |
| }, | |
| { | |
| "model_name": "David-decoupled-deep_efficiency", | |
| "run_id": "20251012_221046", | |
| "timestamp": "2025-10-12T22:58:06.100595", | |
| "best_val_acc": 66.84133333333334, | |
| "best_epoch": 9, | |
| "num_scales": 5, | |
| "scales": [ | |
| 256, | |
| 512, | |
| 768, | |
| 1024, | |
| 1280 | |
| ], | |
| "parameters": 14877593, | |
| "sharing_mode": "decoupled", | |
| "fusion_mode": "deep_efficiency", | |
| "preset": "high_accuracy", | |
| "weights_path": "weights/David-decoupled-deep_efficiency/20251012_221046/best_model_acc66.84.safetensors", | |
| "config_path": "weights/David-decoupled-deep_efficiency/20251012_221046/david_config.json", | |
| "history_path": "weights/David-decoupled-deep_efficiency/20251012_221046/training_history.json" | |
| }, | |
| { | |
| "model_name": "David-fully_shared-weighted_sum", | |
| "run_id": "20251012_235237", | |
| "timestamp": "2025-10-13T00:38:45.818425", | |
| "best_val_acc": 66.52333333333333, | |
| "best_epoch": 9, | |
| "num_scales": 2, | |
| "scales": [ | |
| 256, | |
| 512 | |
| ], | |
| "parameters": 656898, | |
| "sharing_mode": "fully_shared", | |
| "fusion_mode": "weighted_sum", | |
| "preset": "small_fast", | |
| "weights_path": "weights/David-fully_shared-weighted_sum/20251012_235237/best_model_acc66.52.safetensors", | |
| "config_path": "weights/David-fully_shared-weighted_sum/20251012_235237/david_config.json", | |
| "history_path": "weights/David-fully_shared-weighted_sum/20251012_235237/training_history.json" | |
| }, | |
| { | |
| "model_name": "David-fully_shared-weighted_sum", | |
| "run_id": "20251012_231445", | |
| "timestamp": "2025-10-12T23:51:38.341849", | |
| "best_val_acc": 66.5, | |
| "best_epoch": 7, | |
| "num_scales": 2, | |
| "scales": [ | |
| 256, | |
| 512 | |
| ], | |
| "parameters": 656898, | |
| "sharing_mode": "fully_shared", | |
| "fusion_mode": "weighted_sum", | |
| "preset": "small_fast", | |
| "weights_path": "weights/David-fully_shared-weighted_sum/20251012_231445/best_model_acc66.50.safetensors", | |
| "config_path": "weights/David-fully_shared-weighted_sum/20251012_231445/david_config.json", | |
| "history_path": "weights/David-fully_shared-weighted_sum/20251012_231445/training_history.json" | |
| }, | |
| { | |
| "model_name": "David-decoupled-deep_efficiency", | |
| "run_id": "20251013_004438", | |
| "timestamp": "2025-10-13T01:33:24.619350", | |
| "best_val_acc": 62.938, | |
| "best_epoch": 9, | |
| "num_scales": 9, | |
| "scales": [ | |
| 128, | |
| 256, | |
| 384, | |
| 448, | |
| 512, | |
| 576, | |
| 640, | |
| 768, | |
| 896 | |
| ], | |
| "parameters": 22133801, | |
| "sharing_mode": "decoupled", | |
| "fusion_mode": "deep_efficiency", | |
| "preset": "gated_expert_team", | |
| "weights_path": "weights/David-decoupled-deep_efficiency/20251013_004438/best_model_acc62.94.safetensors", | |
| "config_path": "weights/David-decoupled-deep_efficiency/20251013_004438/david_config.json", | |
| "history_path": "weights/David-decoupled-deep_efficiency/20251013_004438/training_history.json" | |
| } | |
| ], | |
| "total_models": 7 | |
| } |