maximuspowers
/

weight-autoencoder-mlp-v1

@@ -27,15 +27,15 @@ It includes both an encoder (compresses weights into latent representations) and
 ## Training Config
-- **Loss Functions**: reconstruction, contrastive, functional
 - **Optimizer**: adamw
 - **Learning Rate**: 0.0001
 - **Batch Size**: 32
 ## Performance Metrics (Test Set)
-- **MSE**: 0.125011
-- **MAE**: 0.259796
-- **RMSE**: 0.353570
-- **Cosine Similarity**: 0.0348
-- **R² Score**: -0.0097

 ## Training Config
+- **Loss Functions**: reconstruction, functional
 - **Optimizer**: adamw
 - **Learning Rate**: 0.0001
 - **Batch Size**: 32
 ## Performance Metrics (Test Set)
+- **MSE**: 0.122959
+- **MAE**: 0.256139
+- **RMSE**: 0.350655
+- **Cosine Similarity**: 0.0575
+- **R² Score**: 0.0069

config.yaml CHANGED Viewed

@@ -12,6 +12,7 @@ architecture:
       dropout: 0.025
       num_heads: 8
       num_layers: 6
     encoder:
       activation: gelu
       d_model: 512
@@ -78,7 +79,7 @@ logging:
   verbose: true
 loss:
   contrastive:
-    enabled: true
     projection_head:
       hidden_dim: 128
       input_dim: 256
@@ -89,12 +90,16 @@ loss:
     benchmark_path: /Users/max/Desktop/muat/model_zoo/configs/autoencoder/benchmark_dataset.json
     enabled: true
     test_samples: null
-    weight: 0.5
   reconstruction:
     enabled: true
     type: mse
     weight: 0.6
-run_dir: /Users/max/Desktop/muat/model_zoo/runs/train-encoder-decoder_config_2025-12-18_22-23-46
 run_log_cleanup: false
 tokenization:
   chunk_size: 1

       dropout: 0.025
       num_heads: 8
       num_layers: 6
+      num_memory_tokens: 8
     encoder:
       activation: gelu
       d_model: 512
   verbose: true
 loss:
   contrastive:
+    enabled: false
     projection_head:
       hidden_dim: 128
       input_dim: 256
     benchmark_path: /Users/max/Desktop/muat/model_zoo/configs/autoencoder/benchmark_dataset.json
     enabled: true
     test_samples: null
+    weight: 0.05
   reconstruction:
     enabled: true
     type: mse
     weight: 0.6
+  variance:
+    enabled: false
+    target_variance: 0.01
+    weight: 0.1
+run_dir: /Users/max/Desktop/muat/model_zoo/runs/train-encoder-decoder_config_2025-12-20_12-55-25
 run_log_cleanup: false
 tokenization:
   chunk_size: 1

decoder.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0c8bdb28e21e756364067eaee646097f7e24a78aa907a48d4c34a08c1c7df45f
-size 103255652

 version https://git-lfs.github.com/spec/v1
+oid sha256:2e8076647a75544334db431a6665fce841f654289b2b7d28f838389b84177a6c
+size 82225188

encoder.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:394e0021fc9d3862b3307c018dbce6118ea0c2b6664766d1729081a3904ca1d8
-size 126816306

 version https://git-lfs.github.com/spec/v1
+oid sha256:a92e43fd2ef0647bed913fcabcf216fa2a8333b8044f8aa9611f62a0dc003fc9
+size 126816434