geoclip-vit-base-unicode-32x1000d / symbolic_vitb32_encoder_snapshot.meta.json
AbstractPhil's picture
Upload symbolic_vitb32_encoder_snapshot.meta.json
3f6ec28 verified
{
"epoch": 1,
"global_step": 196,
"avg_loss": 3.920882177810669,
"best_metric": 0.4896,
"timestamp": "2025-08-28T11:37:07.258947",
"run_name": "symbolic_vitb32",
"group": "encoder",
"metrics": {
"epoch": 1,
"train_loss": 3.920882177810669,
"val_loss": 2.4135699951171876,
"top1": 0.4896,
"top3": 0.6524
},
"config_snapshot": {
"device": "cuda",
"seed": 42,
"precision": "fp32",
"hf_clip_id": "openai/clip-vit-base-patch32",
"freeze_encoder": true,
"normalize_output": true,
"dataset": "cifar100",
"data_root": "./data",
"image_size": 224,
"clip_mean": [
0.48145466,
0.4578275,
0.40821073
],
"clip_std": [
0.26862954,
0.26130258,
0.27577711
],
"train_aug": true,
"train_crop_scale": [
0.9,
1.0
],
"hflip_p": 0.5,
"vocab_repo": "AbstractPhil/geometric-vocab-32d",
"vocab_split": "unicode",
"vocab_dim_override": 32,
"crystal_dims": 1000,
"role_index": {
"anchor": 0,
"support": 1,
"contrast": 2,
"purpose": 3,
"observer": 4
},
"classes": 100,
"classes_per_penta": 2,
"penta_branches": 50,
"pentachora_blocks": 4,
"temperature": 0.07,
"batch_size": 256,
"epochs": 20,
"lr": 0.0003,
"weight_decay": 0.0001,
"label_smoothing": 0.0,
"use_cosine_sched": true,
"warmup_steps": 250,
"max_steps": null,
"amp": true,
"grad_clip_norm": null,
"log_every": 25,
"auto_train": false,
"num_workers": 2,
"pin_memory": false,
"persistent_workers": false,
"ckpt_dir": "./checkpoints",
"run_name": "symbolic_vitb32",
"save_latest": true,
"save_best": true,
"resume": true,
"resume_which": "best",
"resume_source": "auto",
"hf_enable": true,
"hf_repo_id": "AbstractPhil/geoclip-vit-base-unicode-32x1000d",
"hf_branch": "main",
"hf_private": false,
"hf_push_latest": false,
"hf_push_best": true,
"hf_create": true,
"hf_token_env": [
"HF_TOKEN",
"HUGGINGFACE_HUB_TOKEN"
]
}
}