lumi-classifier / AnatomyFlaws-v15.5_dinov3_7b_bnb_fl.config.json
Enferlain's picture
Upload 2 files
d444abd verified
{
"data_root": "data",
"wandb_project": "lumi-classifiers",
"resume": null,
"base": "AnatomyFlaws",
"rev": "v15.5_dinov3_7b_bnb_fl",
"arch": "class",
"name": "AnatomyFlaws-v15.5_dinov3_7b_bnb_fl",
"base_vision_model": "dinov3-vit7b16-pretrain-lvd1689m-8bit",
"embed_ver": "fb_dinov3_vit7b16_pretrain_lvd1689m_8bit_DINOv3_8bit_BnB",
"data_mode": "embeddings",
"is_end_to_end": false,
"features": 4096,
"preload_data": true,
"hidden_dim": 1536,
"use_attention": true,
"num_attn_heads": 32,
"attn_dropout": 0.218,
"num_res_blocks": 4,
"dropout_rate": 0.218,
"output_mode": "linear",
"lr": "1e-4",
"batch": 64,
"loss_function": "focal",
"optimizer": "adabelief",
"betas": [
0.9,
0.999
],
"eps": "1e-8",
"weight_decay": "1e-3",
"max_train_epochs": null,
"max_train_steps": 3500,
"precision": "bf16",
"nsave": 100,
"val_split_count": 241,
"seed": 218,
"num_workers": 0,
"save_full_model": false,
"log_every_n": 10,
"validate_every_n": 34,
"focal_loss_gamma": 2.0,
"rectify": true,
"weight_decouple": true,
"gamma": 0.005,
"r_sf": 0.0,
"wlpow_sf": 2.0,
"state_precision": "parameter",
"adaptive_clip": 1.0,
"adaptive_clip_eps": "1e-3",
"scheduler_name": "RexAnnealingWarmRestarts",
"scheduler_gamma": 0.95,
"scheduler_cycle_multiplier": 1.0,
"scheduler_first_cycle_max_steps": 350,
"scheduler_min_lr": "1e-7",
"scheduler_warmup_steps": 50,
"labels": {
"0": "Bad Anatomy",
"1": "Good Anatomy"
},
"weights": [
1.0,
1.0
],
"num_labels": 2,
"steps_per_epoch": 67,
"num_train_epochs": 53,
"num_classes": 2
}