AbstractPhil
/

vit-beatrix

@@ -18,8 +18,8 @@ for vision tasks. Trained on CIFAR-100.
 - **Architecture**: Vision Transformer with fractal positional encoding
 - **Dataset**: CIFAR-100 (100 classes)
-- **Embedding Dimension**: 512
-- **Depth**: 4 layers
 - **Patch Size**: 4x4
 - **PE Levels**: 12
 - **Simplex Dimension**: 5-simplex
@@ -27,8 +27,8 @@ for vision tasks. Trained on CIFAR-100.
 ## Training
 - **Dataset**: CIFAR-100
-- **Epochs**: 8
-- **Best Accuracy**: 0.2937
 - **Batch Size**: 512
 - **Learning Rate**: 0.001
@@ -44,17 +44,24 @@ for vision tasks. Trained on CIFAR-100.
 ```python
 from geovocab2.train.model.vit_beatrix import SimplifiedGeometricClassifier
 from safetensors.torch import load_file
 # Load model
 model = SimplifiedGeometricClassifier(
     num_classes=100,  # CIFAR-100
     img_size=32,
-    embed_dim=512,
-    depth=4
 )
-# Load weights (renamed from model_best.safetensors to model.safetensors in Hub)
-state_dict = load_file("model.safetensors")
 model.load_state_dict(state_dict)
 model.eval()

 - **Architecture**: Vision Transformer with fractal positional encoding
 - **Dataset**: CIFAR-100 (100 classes)
+- **Embedding Dimension**: 256
+- **Depth**: 12 layers
 - **Patch Size**: 4x4
 - **PE Levels**: 12
 - **Simplex Dimension**: 5-simplex
 ## Training
 - **Dataset**: CIFAR-100
+- **Epochs**: 0
+- **Best Accuracy**: 0.0892
 - **Batch Size**: 512
 - **Learning Rate**: 0.001
 ```python
 from geovocab2.train.model.vit_beatrix import SimplifiedGeometricClassifier
 from safetensors.torch import load_file
+from huggingface_hub import hf_hub_download
+# Download weights from Hub
+weights_path = hf_hub_download(
+    repo_id="AbstractPhil/vit-beatrix",
+    filename="weights/beatrix-cifar100/20251007_181653/model.safetensors"
+)
 # Load model
 model = SimplifiedGeometricClassifier(
     num_classes=100,  # CIFAR-100
     img_size=32,
+    embed_dim=256,
+    depth=12
 )
+# Load weights
+state_dict = load_file(weights_path)
 model.load_state_dict(state_dict)
 model.eval()

config.json CHANGED Viewed

@@ -2,9 +2,9 @@
   "num_classes": 100,
   "img_size": 32,
   "patch_size": 4,
-  "embed_dim": 512,
   "k_simplex": 5,
-  "depth": 4,
   "num_heads": 8,
   "mlp_ratio": 4.0,
   "dropout": 0.0,
@@ -13,10 +13,10 @@
   "pe_smooth_tau": 0.25,
   "simplex_feature_weight": 0.2,
   "batch_size": 512,
-  "num_epochs": 50,
   "learning_rate": 0.001,
   "weight_decay": 0.005,
-  "warmup_epochs": 10,
   "task_loss_weight": 1.0,
   "flow_loss_weight": 0.5,
   "coherence_loss_weight": 0.3,
@@ -34,10 +34,10 @@
   "timestamp_dirs": true,
   "push_to_hub": true,
   "hub_model_id": "AbstractPhil/vit-beatrix",
   "hub_upload_best_only": true,
   "use_tensorboard": true,
   "log_dir": "./logs",
   "log_every": 50,
-  "train_baseline": false,
-  "hub_token": null
 }

   "num_classes": 100,
   "img_size": 32,
   "patch_size": 4,
+  "embed_dim": 256,
   "k_simplex": 5,
+  "depth": 12,
   "num_heads": 8,
   "mlp_ratio": 4.0,
   "dropout": 0.0,
   "pe_smooth_tau": 0.25,
   "simplex_feature_weight": 0.2,
   "batch_size": 512,
+  "num_epochs": 10,
   "learning_rate": 0.001,
   "weight_decay": 0.005,
+  "warmup_epochs": 2,
   "task_loss_weight": 1.0,
   "flow_loss_weight": 0.5,
   "coherence_loss_weight": 0.3,
   "timestamp_dirs": true,
   "push_to_hub": true,
   "hub_model_id": "AbstractPhil/vit-beatrix",
+  "hub_model_name": "beatrix-cifar100",
   "hub_upload_best_only": true,
   "use_tensorboard": true,
   "log_dir": "./logs",
   "log_every": 50,
+  "train_baseline": false
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d014abe00fd634e8607d5421a9834b4dc7aae0b905e55e4491cd5612a052284b
-size 50831604

 version https://git-lfs.github.com/spec/v1
+oid sha256:1f25f11e2851e52c4ee631b191044282ff7e23236f4b6a7fed2388d32f045a29
+size 38117196