vit-beatrix / config.json
AbstractPhil's picture
Update best model - Epoch 0 - Acc: 0.0892
0a86595 verified
{
"num_classes": 100,
"img_size": 32,
"patch_size": 4,
"embed_dim": 256,
"k_simplex": 5,
"depth": 12,
"num_heads": 8,
"mlp_ratio": 4.0,
"dropout": 0.0,
"pe_levels": 12,
"pe_features_per_level": 2,
"pe_smooth_tau": 0.25,
"simplex_feature_weight": 0.2,
"batch_size": 512,
"num_epochs": 10,
"learning_rate": 0.001,
"weight_decay": 0.005,
"warmup_epochs": 2,
"task_loss_weight": 1.0,
"flow_loss_weight": 0.5,
"coherence_loss_weight": 0.3,
"multiscale_loss_weight": 0.2,
"volume_reg_weight": 0.1,
"use_augmentation": true,
"mixup_alpha": 0.2,
"cutmix_alpha": 1.0,
"device": "cuda",
"num_workers": 2,
"pin_memory": true,
"save_dir": "./checkpoints",
"save_every": 10,
"use_safetensors": true,
"timestamp_dirs": true,
"push_to_hub": true,
"hub_model_id": "AbstractPhil/vit-beatrix",
"hub_model_name": "beatrix-cifar100",
"hub_upload_best_only": true,
"use_tensorboard": true,
"log_dir": "./logs",
"log_every": 50,
"train_baseline": false
}