david-shared-space / MODELS_INDEX.json
AbstractPhil's picture
Update models index - David-decoupled-deep_efficiency @ 62.94%
85649e3 verified
raw
history blame
5.58 kB
{
"repository": "AbstractPhil/david-shared-space",
"updated": "2025-10-13T01:33:24.619384",
"models": [
{
"model_name": "David-partial_shared-hierarchical_tree",
"run_id": "20251012_194945",
"timestamp": "2025-10-12T20:21:46.311771",
"best_val_acc": 75.74,
"best_epoch": 9,
"num_scales": 4,
"scales": [
256,
512,
768,
1024
],
"parameters": 8758271,
"sharing_mode": "partial_shared",
"fusion_mode": "hierarchical_tree",
"preset": "balanced",
"weights_path": "weights/David-partial_shared-hierarchical_tree/20251012_194945/best_model_acc75.74.safetensors",
"config_path": "weights/David-partial_shared-hierarchical_tree/20251012_194945/david_config.json",
"history_path": "weights/David-partial_shared-hierarchical_tree/20251012_194945/training_history.json"
},
{
"model_name": "David-partial_shared-hierarchical_tree",
"run_id": "20251012_210041",
"timestamp": "2025-10-12T21:45:34.243260",
"best_val_acc": 74.22733333333333,
"best_epoch": 7,
"num_scales": 4,
"scales": [
256,
512,
768,
1024
],
"parameters": 8758271,
"sharing_mode": "partial_shared",
"fusion_mode": "hierarchical_tree",
"preset": "balanced",
"weights_path": "weights/David-partial_shared-hierarchical_tree/20251012_210041/best_model_acc74.23.safetensors",
"config_path": "weights/David-partial_shared-hierarchical_tree/20251012_210041/david_config.json",
"history_path": "weights/David-partial_shared-hierarchical_tree/20251012_210041/training_history.json"
},
{
"model_name": "David-partial_shared-hierarchical_tree",
"run_id": "20251012_191456",
"timestamp": "2025-10-12T19:48:30.099231",
"best_val_acc": 73.695,
"best_epoch": 9,
"num_scales": 4,
"scales": [
256,
512,
768,
1024
],
"parameters": 8758271,
"sharing_mode": "partial_shared",
"fusion_mode": "hierarchical_tree",
"preset": "balanced",
"weights_path": "weights/David-partial_shared-hierarchical_tree/20251012_191456/best_model_acc73.69.safetensors",
"config_path": "weights/David-partial_shared-hierarchical_tree/20251012_191456/david_config.json",
"history_path": "weights/David-partial_shared-hierarchical_tree/20251012_191456/training_history.json"
},
{
"model_name": "David-decoupled-deep_efficiency",
"run_id": "20251012_221046",
"timestamp": "2025-10-12T22:58:06.100595",
"best_val_acc": 66.84133333333334,
"best_epoch": 9,
"num_scales": 5,
"scales": [
256,
512,
768,
1024,
1280
],
"parameters": 14877593,
"sharing_mode": "decoupled",
"fusion_mode": "deep_efficiency",
"preset": "high_accuracy",
"weights_path": "weights/David-decoupled-deep_efficiency/20251012_221046/best_model_acc66.84.safetensors",
"config_path": "weights/David-decoupled-deep_efficiency/20251012_221046/david_config.json",
"history_path": "weights/David-decoupled-deep_efficiency/20251012_221046/training_history.json"
},
{
"model_name": "David-fully_shared-weighted_sum",
"run_id": "20251012_235237",
"timestamp": "2025-10-13T00:38:45.818425",
"best_val_acc": 66.52333333333333,
"best_epoch": 9,
"num_scales": 2,
"scales": [
256,
512
],
"parameters": 656898,
"sharing_mode": "fully_shared",
"fusion_mode": "weighted_sum",
"preset": "small_fast",
"weights_path": "weights/David-fully_shared-weighted_sum/20251012_235237/best_model_acc66.52.safetensors",
"config_path": "weights/David-fully_shared-weighted_sum/20251012_235237/david_config.json",
"history_path": "weights/David-fully_shared-weighted_sum/20251012_235237/training_history.json"
},
{
"model_name": "David-fully_shared-weighted_sum",
"run_id": "20251012_231445",
"timestamp": "2025-10-12T23:51:38.341849",
"best_val_acc": 66.5,
"best_epoch": 7,
"num_scales": 2,
"scales": [
256,
512
],
"parameters": 656898,
"sharing_mode": "fully_shared",
"fusion_mode": "weighted_sum",
"preset": "small_fast",
"weights_path": "weights/David-fully_shared-weighted_sum/20251012_231445/best_model_acc66.50.safetensors",
"config_path": "weights/David-fully_shared-weighted_sum/20251012_231445/david_config.json",
"history_path": "weights/David-fully_shared-weighted_sum/20251012_231445/training_history.json"
},
{
"model_name": "David-decoupled-deep_efficiency",
"run_id": "20251013_004438",
"timestamp": "2025-10-13T01:33:24.619350",
"best_val_acc": 62.938,
"best_epoch": 9,
"num_scales": 9,
"scales": [
128,
256,
384,
448,
512,
576,
640,
768,
896
],
"parameters": 22133801,
"sharing_mode": "decoupled",
"fusion_mode": "deep_efficiency",
"preset": "gated_expert_team",
"weights_path": "weights/David-decoupled-deep_efficiency/20251013_004438/best_model_acc62.94.safetensors",
"config_path": "weights/David-decoupled-deep_efficiency/20251013_004438/david_config.json",
"history_path": "weights/David-decoupled-deep_efficiency/20251013_004438/training_history.json"
}
],
"total_models": 7
}