diff --git a/mlp_map_test/M0_S-2_R16_P2.pt b/mlp_map_test/M0_S-2_R16_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..714ab0f4c619bfe9301eaff9778a2d91d39a9920 --- /dev/null +++ b/mlp_map_test/M0_S-2_R16_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9359d6761c0678872c24614fdc2e33a95859ed8893721a009e4efb7312c1a6ab +size 153705088 diff --git a/mlp_map_test/M0_S-2_R16_P2_config.json b/mlp_map_test/M0_S-2_R16_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..90a16baea10f96388a5ea8a48c4a92bf4f39b978 --- /dev/null +++ b/mlp_map_test/M0_S-2_R16_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-2_R16_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-2_R8_P2.pt b/mlp_map_test/M0_S-2_R8_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d8515155833066720763ddb9615bb53d797bdf2 --- /dev/null +++ b/mlp_map_test/M0_S-2_R8_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72fe4a438c7cb4fd200d69aec08f833f29172203aa7422efcd88ff57df0b9249 +size 153705080 diff --git a/mlp_map_test/M0_S-2_R8_P2_config.json b/mlp_map_test/M0_S-2_R8_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..22434e16dc342916e89995211702ad59ab8787df --- /dev/null +++ b/mlp_map_test/M0_S-2_R8_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-2_R8_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-2_R8_P4.pt b/mlp_map_test/M0_S-2_R8_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe98df13ebccaed9e869562aac523f001e90eab4 --- /dev/null +++ b/mlp_map_test/M0_S-2_R8_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1006aa4821d67c80e35c63ada50d443ae7e342f4f8afda3490b91d734e26125a +size 153705080 diff --git a/mlp_map_test/M0_S-2_R8_P4_config.json b/mlp_map_test/M0_S-2_R8_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..db7fed1ff8f315766f1691d652598d79a94743de --- /dev/null +++ b/mlp_map_test/M0_S-2_R8_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-2_R8_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-4_R16_P6.pt b/mlp_map_test/M0_S-4_R16_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..16e6d633d67cb57ab26e4bb15aa3cea8598f7843 --- /dev/null +++ b/mlp_map_test/M0_S-4_R16_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c15de0bd8db6ce5aac80986803982acbdb2eaefcce9cd64978ced7511fa26595 +size 153705088 diff --git a/mlp_map_test/M0_S-4_R16_P6_config.json b/mlp_map_test/M0_S-4_R16_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9e40198f810d16b37146b268eca7e334403f10ea --- /dev/null +++ b/mlp_map_test/M0_S-4_R16_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-4_R16_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-4_R4_P2.pt b/mlp_map_test/M0_S-4_R4_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..48e667dfaecf820e5a74a9379e9d14928ef9293c --- /dev/null +++ b/mlp_map_test/M0_S-4_R4_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f48785465f336071949bcff0e1d1f4b3ca656ea66f6270a4d64c5075d0db263c +size 153705080 diff --git a/mlp_map_test/M0_S-4_R4_P2_config.json b/mlp_map_test/M0_S-4_R4_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..f994476e2e8bdf73b5f8eb58e4c02fa91ecffca3 --- /dev/null +++ b/mlp_map_test/M0_S-4_R4_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-4_R4_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-4_R8_P2.pt b/mlp_map_test/M0_S-4_R8_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9d8c8dfd63ec47ab1bea73e0067eba21d2c8388 --- /dev/null +++ b/mlp_map_test/M0_S-4_R8_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49b5ebb8036e34338f3433ff2c2c7d6032ff76c4bb87b9b8dc17ed7203b6eba1 +size 153705080 diff --git a/mlp_map_test/M0_S-4_R8_P2_config.json b/mlp_map_test/M0_S-4_R8_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..59febf315d53f23fb3ffddd0bc265b68b42723ca --- /dev/null +++ b/mlp_map_test/M0_S-4_R8_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-4_R8_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-6_R16_P6.pt b/mlp_map_test/M0_S-6_R16_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..17b04c46ae664490293738d993d1ed2148341abb --- /dev/null +++ b/mlp_map_test/M0_S-6_R16_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81e71c6a3ed2625c96875a73a66234e685f89b140852e496bf28a17d1f412a6a +size 153705088 diff --git a/mlp_map_test/M0_S-6_R16_P6_config.json b/mlp_map_test/M0_S-6_R16_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..53a31292e0730ee2b3568719beed58c7b0ae3d1f --- /dev/null +++ b/mlp_map_test/M0_S-6_R16_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-6_R16_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-6_R2_P2.pt b/mlp_map_test/M0_S-6_R2_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..de4ede32cb542bdfb8a67fdb9970f762ec482fd2 --- /dev/null +++ b/mlp_map_test/M0_S-6_R2_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac77f117cfc79c30cb2f10b415fee609eb8513a8b4fe301f4249743b7fb0cc5b +size 153705080 diff --git a/mlp_map_test/M0_S-6_R2_P2_config.json b/mlp_map_test/M0_S-6_R2_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..44a8cd4fe4146ccdb60b16044c74f7ff4d40c98b --- /dev/null +++ b/mlp_map_test/M0_S-6_R2_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-6_R2_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-6_R4_P2.pt b/mlp_map_test/M0_S-6_R4_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d14f720c5d2440280d3babe433589520278839c --- /dev/null +++ b/mlp_map_test/M0_S-6_R4_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64d41efbd610f4e13f9131487d9125f2aeaf128541d04b2e8e4fc4daa71f0388 +size 153705080 diff --git a/mlp_map_test/M0_S-6_R4_P2_config.json b/mlp_map_test/M0_S-6_R4_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..19fa4c5320112ff0b34d0ea9309df114986b0ee8 --- /dev/null +++ b/mlp_map_test/M0_S-6_R4_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-6_R4_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-6_R4_P5.pt b/mlp_map_test/M0_S-6_R4_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ee42e4a76eabe8b2604564e814e0535fd804131 --- /dev/null +++ b/mlp_map_test/M0_S-6_R4_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d887b70c10c59158d64b4a325077f3da2ff37b6f859823460862440c6f543f53 +size 153705080 diff --git a/mlp_map_test/M0_S-6_R4_P5_config.json b/mlp_map_test/M0_S-6_R4_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..04f864bf00723147ea690de1a33f8168f934d428 --- /dev/null +++ b/mlp_map_test/M0_S-6_R4_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-6_R4_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-6_R8_P3.pt b/mlp_map_test/M0_S-6_R8_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..776bcd3c0a9f8af6529e55533becb7762717fc66 --- /dev/null +++ b/mlp_map_test/M0_S-6_R8_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a27cd0f5f150680d8dadcedb6f7ae34d350f24c9ac5be09c109e01ef7a56e4c +size 153705080 diff --git a/mlp_map_test/M0_S-6_R8_P3_config.json b/mlp_map_test/M0_S-6_R8_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..bc3a674acd78e9c1565e041eb7eb5b6bfde728ff --- /dev/null +++ b/mlp_map_test/M0_S-6_R8_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-6_R8_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-6_R8_P4.pt b/mlp_map_test/M0_S-6_R8_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea331176ac28de2c140b0da500afd54dd92fb9ff --- /dev/null +++ b/mlp_map_test/M0_S-6_R8_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5599d0290d3bf8b4260f38e3ec921e462755391b1078fc56c0b0136bb5f43c24 +size 153705080 diff --git a/mlp_map_test/M0_S-6_R8_P4_config.json b/mlp_map_test/M0_S-6_R8_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..78811fa3233dfd62642677ec7cc074dea03e5e2f --- /dev/null +++ b/mlp_map_test/M0_S-6_R8_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-6_R8_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-8_R4_P1.pt b/mlp_map_test/M0_S-8_R4_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..be290ac5d3f24c7cbb3cb3bb241f328bbaf63496 --- /dev/null +++ b/mlp_map_test/M0_S-8_R4_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b00c6230ca71c87b2d192db96dc3d211db347d242016d760f8f55f06b38ddb34 +size 153705080 diff --git a/mlp_map_test/M0_S-8_R4_P1_config.json b/mlp_map_test/M0_S-8_R4_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..81e9f0b0da61de74a53f36a7f72a1abab6e68a64 --- /dev/null +++ b/mlp_map_test/M0_S-8_R4_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-8_R4_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-8_R4_P2.pt b/mlp_map_test/M0_S-8_R4_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0f06c41ffda6cfa6b2af3545ff522b9e0274877 --- /dev/null +++ b/mlp_map_test/M0_S-8_R4_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e396ed9e61013a12663e2e9a389ce34d902d049b5ff7fa82454a354b5e42ae99 +size 153705080 diff --git a/mlp_map_test/M0_S-8_R4_P2_config.json b/mlp_map_test/M0_S-8_R4_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..efe935a482ca727b7130db6da766df2c2b9f9bf9 --- /dev/null +++ b/mlp_map_test/M0_S-8_R4_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-8_R4_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-8_R8_P1.pt b/mlp_map_test/M0_S-8_R8_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d008c4547c209659acb098faa54457957a40d83 --- /dev/null +++ b/mlp_map_test/M0_S-8_R8_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4817e4afa0c953637942fb2b90a6e6cf9ea6963f37b8bcd9f603eb7920e560c +size 153705080 diff --git a/mlp_map_test/M0_S-8_R8_P1_config.json b/mlp_map_test/M0_S-8_R8_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a07b93ed4fdc82742c9f8ac514951ba7d5f1ae26 --- /dev/null +++ b/mlp_map_test/M0_S-8_R8_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-8_R8_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S0_R16_P5.pt b/mlp_map_test/M0_S0_R16_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8244610c8665507bbaf0c11454286607e82ff28 --- /dev/null +++ b/mlp_map_test/M0_S0_R16_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45672861bca72a3dede8880454bfeb06b2d633bf93961ea9f8a0f59625493b27 +size 153705080 diff --git a/mlp_map_test/M0_S0_R16_P5_config.json b/mlp_map_test/M0_S0_R16_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2696e9602270feb299ee06bdc0dc4df6800feb72 --- /dev/null +++ b/mlp_map_test/M0_S0_R16_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S0_R16_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S0_R4_P2.pt b/mlp_map_test/M0_S0_R4_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..b58474b20a8056d0ac06eda3ff90a9e906dd41f1 --- /dev/null +++ b/mlp_map_test/M0_S0_R4_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a000f854a07edbaffba6e09296d3996f2d4f7e1368497b7cbe3b06debc21892 +size 153705072 diff --git a/mlp_map_test/M0_S0_R4_P2_config.json b/mlp_map_test/M0_S0_R4_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..922ff1e74ecad09460ea3c89092e2e58927cc3a4 --- /dev/null +++ b/mlp_map_test/M0_S0_R4_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S0_R4_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S0_R4_P6.pt b/mlp_map_test/M0_S0_R4_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..fef0bcdb1b55bdaf5a651ea8c30e97117ff556fb --- /dev/null +++ b/mlp_map_test/M0_S0_R4_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb98206eace11c3c691ef6773637c1a21f7d2b9e99907223b630dd4fdb06e142 +size 153705072 diff --git a/mlp_map_test/M0_S0_R4_P6_config.json b/mlp_map_test/M0_S0_R4_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..b16bf6308f4d294753902013bdbe868a45f0204c --- /dev/null +++ b/mlp_map_test/M0_S0_R4_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S0_R4_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S0_R8_P4.pt b/mlp_map_test/M0_S0_R8_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..3720918d2b8b720a218d359436705007faad8b29 --- /dev/null +++ b/mlp_map_test/M0_S0_R8_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfd70e40905225d54508805bec0bf51bd96dc77812a19df653ed398cf10c9731 +size 153705072 diff --git a/mlp_map_test/M0_S0_R8_P4_config.json b/mlp_map_test/M0_S0_R8_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e8484d925459814a1fb435465f0b52e2dfdad7e5 --- /dev/null +++ b/mlp_map_test/M0_S0_R8_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S0_R8_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-2_R16_P2.pt b/mlp_map_test/M1_S-2_R16_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a009efba3f6c1d0375d8518ef21dc73c57c9f4b --- /dev/null +++ b/mlp_map_test/M1_S-2_R16_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37b722f62ac9871daec727c03512026863cf1b8a896c7112ea7678163b4da5f1 +size 153705088 diff --git a/mlp_map_test/M1_S-2_R16_P2_config.json b/mlp_map_test/M1_S-2_R16_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..06a81c9f6bac1eec7ee5959fefb8acb2574b8744 --- /dev/null +++ b/mlp_map_test/M1_S-2_R16_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-2_R16_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-2_R2_P3.pt b/mlp_map_test/M1_S-2_R2_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..79c6e35a1b359574bc6f3fb01dbe1d21552f4ee0 --- /dev/null +++ b/mlp_map_test/M1_S-2_R2_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba4c4a14c610deb1cd5583f68e1ec84b5aa63a89b3dd36fd49e49f5a775467b3 +size 153705080 diff --git a/mlp_map_test/M1_S-2_R2_P3_config.json b/mlp_map_test/M1_S-2_R2_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..26591ddcdf379b0d2703b6e66e0e7b479b11b1fe --- /dev/null +++ b/mlp_map_test/M1_S-2_R2_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-2_R2_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-4_R16_P1.pt b/mlp_map_test/M1_S-4_R16_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..69a70020068e6b616eff0123b80b7096dc76e52c --- /dev/null +++ b/mlp_map_test/M1_S-4_R16_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42beb86f03a41ac4830dd421a5ce373d75b39188bd2712cbefaa003fab9e6279 +size 153705088 diff --git a/mlp_map_test/M1_S-4_R16_P1_config.json b/mlp_map_test/M1_S-4_R16_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..cec054db4ca902f12b1b5679bb2293b8dc70285a --- /dev/null +++ b/mlp_map_test/M1_S-4_R16_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-4_R16_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-4_R2_P6.pt b/mlp_map_test/M1_S-4_R2_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4145338484521809c0a49e19bcd3fd263b2bd4a --- /dev/null +++ b/mlp_map_test/M1_S-4_R2_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f729f2319c7d471c0029acb1022a93276bb159bb8815cda5bc66f2cb529da19e +size 153705080 diff --git a/mlp_map_test/M1_S-4_R2_P6_config.json b/mlp_map_test/M1_S-4_R2_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..8efdf266b378dea96862b9d84eceff08f9d7c516 --- /dev/null +++ b/mlp_map_test/M1_S-4_R2_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-4_R2_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-4_R4_P3.pt b/mlp_map_test/M1_S-4_R4_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..424fb47203ea4a795eff33e841f10107355c030c --- /dev/null +++ b/mlp_map_test/M1_S-4_R4_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf90a29a6f0befb83974f530c3c2497ca54df69e4da67e8f285b83ddacea492f +size 153705080 diff --git a/mlp_map_test/M1_S-4_R4_P3_config.json b/mlp_map_test/M1_S-4_R4_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6a571c592005945e39b38f870f12ba9c066e64b3 --- /dev/null +++ b/mlp_map_test/M1_S-4_R4_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-4_R4_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-4_R8_P2.pt b/mlp_map_test/M1_S-4_R8_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..e225ac242557e2775ec8c54a2d864f6a5c02f925 --- /dev/null +++ b/mlp_map_test/M1_S-4_R8_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ccbd7776c7e2f458d1dda3932307757741dd39f221daa7b0bf8ff94284f296d +size 153705080 diff --git a/mlp_map_test/M1_S-4_R8_P2_config.json b/mlp_map_test/M1_S-4_R8_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..caf585bf362d2a3cfa19dc2c74def5eb7fd421b4 --- /dev/null +++ b/mlp_map_test/M1_S-4_R8_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-4_R8_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-4_R8_P4.pt b/mlp_map_test/M1_S-4_R8_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..8171c393f6c9b96651d942d16fc8b0dfeb06a888 --- /dev/null +++ b/mlp_map_test/M1_S-4_R8_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ef5571c02ab237013104b7308ee886292bf4e8542c29b7a3c946d6d85eb2d4a +size 153705080 diff --git a/mlp_map_test/M1_S-4_R8_P4_config.json b/mlp_map_test/M1_S-4_R8_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..415d0fcbefaa59725e6e5edaa63d5331d1aac079 --- /dev/null +++ b/mlp_map_test/M1_S-4_R8_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-4_R8_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-6_R16_P6.pt b/mlp_map_test/M1_S-6_R16_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..1810657fb48a5967db75ca76216b0c4b52ac03ff --- /dev/null +++ b/mlp_map_test/M1_S-6_R16_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5133c58905286f8300769a1b44dc656a52fcbf7381af60e20e8fb80a39cf87a6 +size 153705088 diff --git a/mlp_map_test/M1_S-6_R16_P6_config.json b/mlp_map_test/M1_S-6_R16_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..8dedd9f87889c044c27e0c8349e0165287eb969c --- /dev/null +++ b/mlp_map_test/M1_S-6_R16_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-6_R16_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-6_R2_P4.pt b/mlp_map_test/M1_S-6_R2_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fd7ef51091e04e22724a0a2b7bdd8bd744d9d8c --- /dev/null +++ b/mlp_map_test/M1_S-6_R2_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2e31304053fd85af1e4439c91c94b2c76a12b9b9dd9d69c1f92b18a3f0aab42 +size 153705080 diff --git a/mlp_map_test/M1_S-6_R2_P4_config.json b/mlp_map_test/M1_S-6_R2_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..93d9a4e40fe92f2850f117688f8860b189da9f1f --- /dev/null +++ b/mlp_map_test/M1_S-6_R2_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-6_R2_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-6_R2_P5.pt b/mlp_map_test/M1_S-6_R2_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..06023cead88404e10423ffbeb9f7735b69dffe1a --- /dev/null +++ b/mlp_map_test/M1_S-6_R2_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ced235e82fa3b320ef3839e12e34a33880d77ab5757c59dbe3f62b8852c7938 +size 153705080 diff --git a/mlp_map_test/M1_S-6_R2_P5_config.json b/mlp_map_test/M1_S-6_R2_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0dfcbd0f1cd52c3e079b00ef9e0c67b0062f03fb --- /dev/null +++ b/mlp_map_test/M1_S-6_R2_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-6_R2_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-6_R4_P2.pt b/mlp_map_test/M1_S-6_R4_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..b78a5647eccc7795fc322c811c067d5a657ff5a5 --- /dev/null +++ b/mlp_map_test/M1_S-6_R4_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac284cd119ecc90b4ffa84ec752c5b4ad9c1bad9cac9470957f9fbc98d6b6887 +size 153705080 diff --git a/mlp_map_test/M1_S-6_R4_P2_config.json b/mlp_map_test/M1_S-6_R4_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..592bf53e70e3d4ea4a0b9af853f2c1a9213562a4 --- /dev/null +++ b/mlp_map_test/M1_S-6_R4_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-6_R4_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-6_R8_P4.pt b/mlp_map_test/M1_S-6_R8_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d7a2b2aad8438f7455f70ce9aab797831ded0ba --- /dev/null +++ b/mlp_map_test/M1_S-6_R8_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3befebfa989cc12255d500ebcfb804fda19b947191cb51e989849f5ae27fc9c7 +size 153705080 diff --git a/mlp_map_test/M1_S-6_R8_P4_config.json b/mlp_map_test/M1_S-6_R8_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6a20e9ed2dea5d176e1a8c708f6a67188947caec --- /dev/null +++ b/mlp_map_test/M1_S-6_R8_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-6_R8_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-8_R4_P1.pt b/mlp_map_test/M1_S-8_R4_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb685c072d3aaf3aa1cd47eaaad187676eb28803 --- /dev/null +++ b/mlp_map_test/M1_S-8_R4_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6710ee850f50218c19a8c8a0837dc4663fa97307e99111d2f827f0d02d9fca5f +size 153705080 diff --git a/mlp_map_test/M1_S-8_R4_P1_config.json b/mlp_map_test/M1_S-8_R4_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..f5260f2dc1f69a9fe306635d456b237ea03a73da --- /dev/null +++ b/mlp_map_test/M1_S-8_R4_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-8_R4_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-8_R4_P5.pt b/mlp_map_test/M1_S-8_R4_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..766facf8d99c319d6ec626052307bc618b06f914 --- /dev/null +++ b/mlp_map_test/M1_S-8_R4_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0517467cf7976ffb346800fba950c371bd1f99131dd46f8cb77547b3e8bd4702 +size 153705080 diff --git a/mlp_map_test/M1_S-8_R4_P5_config.json b/mlp_map_test/M1_S-8_R4_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..7cfa9d113b2ac5566548a3f1f37cc600909dd8da --- /dev/null +++ b/mlp_map_test/M1_S-8_R4_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-8_R4_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-8_R8_P4.pt b/mlp_map_test/M1_S-8_R8_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd818811ffd60e073a726eee804dbadfd4f66bb3 --- /dev/null +++ b/mlp_map_test/M1_S-8_R8_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87250ca854d601489ae4cd4d3f2f7458ce01d9966340278750c60ffa31ff9230 +size 153705080 diff --git a/mlp_map_test/M1_S-8_R8_P4_config.json b/mlp_map_test/M1_S-8_R8_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..5aa13844b87c1b8a6e75338f64b62cf897a880b1 --- /dev/null +++ b/mlp_map_test/M1_S-8_R8_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-8_R8_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S0_R4_P4.pt b/mlp_map_test/M1_S0_R4_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7e291930c0439a49a9d74bbb29c9099083b887e --- /dev/null +++ b/mlp_map_test/M1_S0_R4_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f8cbb77d66eb6388fe3f05341e328f89f5bc87e1d64dc2190022771154ee907 +size 153705072 diff --git a/mlp_map_test/M1_S0_R4_P4_config.json b/mlp_map_test/M1_S0_R4_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..8f9b2d430de5a80b7dae105eeb1500cb5929ccf6 --- /dev/null +++ b/mlp_map_test/M1_S0_R4_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S0_R4_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S0_R8_P3.pt b/mlp_map_test/M1_S0_R8_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e16f72c9f0b15275de048e98720fed386fa8792 --- /dev/null +++ b/mlp_map_test/M1_S0_R8_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c5411167e13c7810932a790f9ed60cf40a3e53009aacdf833d377e655bfd06e +size 153705072 diff --git a/mlp_map_test/M1_S0_R8_P3_config.json b/mlp_map_test/M1_S0_R8_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..d0092810c2f6b1587a8519954ad8219f7614a0c0 --- /dev/null +++ b/mlp_map_test/M1_S0_R8_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S0_R8_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S0_R8_P5.pt b/mlp_map_test/M1_S0_R8_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..32744937e6ed728d859ea51972fb3b594fade10e --- /dev/null +++ b/mlp_map_test/M1_S0_R8_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:057da5f094d3bb7a4bffe266015f21bac29f6f45d07221b00b7f479b7a6d793d +size 153705072 diff --git a/mlp_map_test/M1_S0_R8_P5_config.json b/mlp_map_test/M1_S0_R8_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..418e5d9892aa754adea49a9d7d891b9f531bc486 --- /dev/null +++ b/mlp_map_test/M1_S0_R8_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S0_R8_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-2_R1_P0.pt b/mlp_map_test/M2_S-2_R1_P0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eeeac4b074e447122fa36476ae84fb7ca4aefda --- /dev/null +++ b/mlp_map_test/M2_S-2_R1_P0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19089a6182210ccba65a14194c6a7ae84ca07612e2d433fab1c87c0a1584710c +size 153705080 diff --git a/mlp_map_test/M2_S-2_R1_P0_config.json b/mlp_map_test/M2_S-2_R1_P0_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2a9d740f71f43451f1e7b6399962af7a07771156 --- /dev/null +++ b/mlp_map_test/M2_S-2_R1_P0_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 1, + "l1_p": 0, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-2_R1_P0" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-2_R2_P2.pt b/mlp_map_test/M2_S-2_R2_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b5ccce688ddee948a7395e7a46e63deffb4f5ce --- /dev/null +++ b/mlp_map_test/M2_S-2_R2_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d13f7adb16d02c7a95d0774e1ad9aded7eb5eaa29bca9c0cb1d956e9edff1a07 +size 153705080 diff --git a/mlp_map_test/M2_S-2_R2_P2_config.json b/mlp_map_test/M2_S-2_R2_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ffb9c4143bdb7f28cb238391341d45f4b7ab13c --- /dev/null +++ b/mlp_map_test/M2_S-2_R2_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-2_R2_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-2_R2_P5.pt b/mlp_map_test/M2_S-2_R2_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..131ec70b1b791444a55b670bf9af0a7ad747ce48 --- /dev/null +++ b/mlp_map_test/M2_S-2_R2_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d62a01008eeebf3593b0745365abe70e7e3ce2bce0f60bb1a23ddd2d405950f4 +size 153705080 diff --git a/mlp_map_test/M2_S-2_R2_P5_config.json b/mlp_map_test/M2_S-2_R2_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e6e6fffecedf2734d940ae739563a6425c17d4df --- /dev/null +++ b/mlp_map_test/M2_S-2_R2_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-2_R2_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-2_R4_P5.pt b/mlp_map_test/M2_S-2_R4_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b588c94327296932bd6ec52a7d4907337aa2d67 --- /dev/null +++ b/mlp_map_test/M2_S-2_R4_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9982b91f8f48af6ef9fa421f0f5338daf3de94f61d47b8d701c787b4933ccba3 +size 153705080 diff --git a/mlp_map_test/M2_S-2_R4_P5_config.json b/mlp_map_test/M2_S-2_R4_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..5bac75fdf95d2dddd68069c6ba1169d5e05ddb98 --- /dev/null +++ b/mlp_map_test/M2_S-2_R4_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-2_R4_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-4_R16_P1.pt b/mlp_map_test/M2_S-4_R16_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..a865df1dbad8239d2cabff063d3e35ddfdcbef68 --- /dev/null +++ b/mlp_map_test/M2_S-4_R16_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2f8ad16fc0298ad13c19b522ece7a329f3260591e9497378dab6e24f3e36df7 +size 153705088 diff --git a/mlp_map_test/M2_S-4_R16_P1_config.json b/mlp_map_test/M2_S-4_R16_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..b2533d40fe712fd5b6e29205d9d4facfc19543f7 --- /dev/null +++ b/mlp_map_test/M2_S-4_R16_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-4_R16_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-4_R16_P4.pt b/mlp_map_test/M2_S-4_R16_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..feb30fb94d2ff61663b0bdb2761420617235fb5a --- /dev/null +++ b/mlp_map_test/M2_S-4_R16_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6dda8699a17a171f3ea236a8a49bd2dad9385580d6919c612b2d532467df194 +size 153705088 diff --git a/mlp_map_test/M2_S-4_R16_P4_config.json b/mlp_map_test/M2_S-4_R16_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0ae4e6d2b5a1bc35aee4f9221ac2d0730f09d412 --- /dev/null +++ b/mlp_map_test/M2_S-4_R16_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-4_R16_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-4_R2_P2.pt b/mlp_map_test/M2_S-4_R2_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..635a2c9183cd9ee0735bf758bc793e62e45bf8e1 --- /dev/null +++ b/mlp_map_test/M2_S-4_R2_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fae7b60e171e44432b65b42a92f9de0239d9cbde03b5ee7d209dd2c3d6fa0e4c +size 153705080 diff --git a/mlp_map_test/M2_S-4_R2_P2_config.json b/mlp_map_test/M2_S-4_R2_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9f500f6903685665d02487d08346f143debc12af --- /dev/null +++ b/mlp_map_test/M2_S-4_R2_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-4_R2_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-4_R8_P1.pt b/mlp_map_test/M2_S-4_R8_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..cceaa5fcb6232b03fd1b4f52d3411a50e4e625e5 --- /dev/null +++ b/mlp_map_test/M2_S-4_R8_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c465763a36c8c8d213e9fa9e0e33563f9bc98627c8677fb54917d0ffd7011e53 +size 153705080 diff --git a/mlp_map_test/M2_S-4_R8_P1_config.json b/mlp_map_test/M2_S-4_R8_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0e803a971e377b094b718aac94ff0f79fba8d714 --- /dev/null +++ b/mlp_map_test/M2_S-4_R8_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-4_R8_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-6_R16_P1.pt b/mlp_map_test/M2_S-6_R16_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9995f001b59f40f5b8d846b593552f6321e111a --- /dev/null +++ b/mlp_map_test/M2_S-6_R16_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98af9ff48c6d093fc0c3cfcf429ea847f7d3379687e3d8be38bca3998ea6d1b6 +size 153705088 diff --git a/mlp_map_test/M2_S-6_R16_P1_config.json b/mlp_map_test/M2_S-6_R16_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..dfaa392817a9c8ad78a6c3cabdd0be07be56ab28 --- /dev/null +++ b/mlp_map_test/M2_S-6_R16_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-6_R16_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-6_R16_P2.pt b/mlp_map_test/M2_S-6_R16_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..01e781dd24d9151b74a58933931729e9a0d9f931 --- /dev/null +++ b/mlp_map_test/M2_S-6_R16_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e6f05f0c1ebcb8f85272fd8a442720fa7866e0e771e4bc0aa1340d9cc4add70 +size 153705088 diff --git a/mlp_map_test/M2_S-6_R16_P2_config.json b/mlp_map_test/M2_S-6_R16_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a690c44519c1a0c9e4c60745c231b145dde93f11 --- /dev/null +++ b/mlp_map_test/M2_S-6_R16_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-6_R16_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-6_R4_P1.pt b/mlp_map_test/M2_S-6_R4_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..8742e4d117e2ac75c73bbfed6111134945defd39 --- /dev/null +++ b/mlp_map_test/M2_S-6_R4_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:068a15a7acc2d6056f7be3abb70618c41e398d973deb92a28d64cdcd30c4b496 +size 153705080 diff --git a/mlp_map_test/M2_S-6_R4_P1_config.json b/mlp_map_test/M2_S-6_R4_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..bca8cf5abe1b4edc2f6578b5ce1370d9eee0a586 --- /dev/null +++ b/mlp_map_test/M2_S-6_R4_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-6_R4_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-6_R8_P3.pt b/mlp_map_test/M2_S-6_R8_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc4cf11ff70c3332acda696add252a2e162ee9e2 --- /dev/null +++ b/mlp_map_test/M2_S-6_R8_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81b916bf777be5ec258642890b5fc41d7d45e91530a581686a9cb3a0ebc821c +size 153705080 diff --git a/mlp_map_test/M2_S-6_R8_P3_config.json b/mlp_map_test/M2_S-6_R8_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..b017166efb35b0fc016dff5ed4f3e7cf4b1ded87 --- /dev/null +++ b/mlp_map_test/M2_S-6_R8_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-6_R8_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-8_R1_P0.pt b/mlp_map_test/M2_S-8_R1_P0.pt new file mode 100644 index 0000000000000000000000000000000000000000..31a50c0cdbf521f735b7f99e4780d0a054c994c9 --- /dev/null +++ b/mlp_map_test/M2_S-8_R1_P0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a24f889b6c1bc13866d301e480e77727eeae8394dc450a112e6f7519f1c4e8f6 +size 153705080 diff --git a/mlp_map_test/M2_S-8_R1_P0_config.json b/mlp_map_test/M2_S-8_R1_P0_config.json new file mode 100644 index 0000000000000000000000000000000000000000..96710f91c8cfe9d0773a2e3be10acb1de9bf460c --- /dev/null +++ b/mlp_map_test/M2_S-8_R1_P0_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 1, + "l1_p": 0, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-8_R1_P0" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-8_R2_P2.pt b/mlp_map_test/M2_S-8_R2_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d5084eebe176722a9cfde908f66811a762b8428 --- /dev/null +++ b/mlp_map_test/M2_S-8_R2_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2201e800080f57ec24a8b0a75990e2cbbbb3146bfc4b6a7ce33a4cb920bb7b4f +size 153705080 diff --git a/mlp_map_test/M2_S-8_R2_P2_config.json b/mlp_map_test/M2_S-8_R2_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..5af85ea3dbeed48a2ef90a56c139afea61d9be17 --- /dev/null +++ b/mlp_map_test/M2_S-8_R2_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-8_R2_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-8_R2_P6.pt b/mlp_map_test/M2_S-8_R2_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..db7848743c45f92c4bed7764ed7d40a7dd2c71cb --- /dev/null +++ b/mlp_map_test/M2_S-8_R2_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81ccf59cbc27209df5eebdbdead654546a375d5b9f9b51638afab3f76a9553af +size 153705080 diff --git a/mlp_map_test/M2_S-8_R2_P6_config.json b/mlp_map_test/M2_S-8_R2_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..206ef0dd04cd31ca08f4d24f6d5ee059ce341fde --- /dev/null +++ b/mlp_map_test/M2_S-8_R2_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-8_R2_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-8_R4_P3.pt b/mlp_map_test/M2_S-8_R4_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d2092c8808d544c38ac80ec5f766968083fe695 --- /dev/null +++ b/mlp_map_test/M2_S-8_R4_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df47a714da51a361fd1864caf8be5017b277cee0191b840f48d00f3e57aa016d +size 153705080 diff --git a/mlp_map_test/M2_S-8_R4_P3_config.json b/mlp_map_test/M2_S-8_R4_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..3874193e5451c2828a97b3791069db2dd6d0e78d --- /dev/null +++ b/mlp_map_test/M2_S-8_R4_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-8_R4_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-8_R8_P4.pt b/mlp_map_test/M2_S-8_R8_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e4dcf88b7d083e84b94d6fd354a8886311877d1 --- /dev/null +++ b/mlp_map_test/M2_S-8_R8_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7139359ae70726ad3adebe2a6392dcdde323261256dcee0cd4d8168e8e2da525 +size 153705080 diff --git a/mlp_map_test/M2_S-8_R8_P4_config.json b/mlp_map_test/M2_S-8_R8_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e6739c628c3fa33c9a1deb35051aeb4f5ac4cb21 --- /dev/null +++ b/mlp_map_test/M2_S-8_R8_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-8_R8_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S0_R16_P6.pt b/mlp_map_test/M2_S0_R16_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae05b7ca07391a9a84b20ada270c3dbb914c1bb1 --- /dev/null +++ b/mlp_map_test/M2_S0_R16_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57c86fed4414df3fcbb2b6bead7114d1ae81c790cd413ed27434868520782374 +size 153705080 diff --git a/mlp_map_test/M2_S0_R16_P6_config.json b/mlp_map_test/M2_S0_R16_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..813e07aa2a621f9752de87f6fb69c7e50ed6faf2 --- /dev/null +++ b/mlp_map_test/M2_S0_R16_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S0_R16_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S0_R2_P2.pt b/mlp_map_test/M2_S0_R2_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb382b99039f31e3d32b7d6a3a6d5ed2cc914ff5 --- /dev/null +++ b/mlp_map_test/M2_S0_R2_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b1d3984f22523df32d05ec40ba5220f525df81a71f37601f91d62b293677d5a +size 153705072 diff --git a/mlp_map_test/M2_S0_R2_P2_config.json b/mlp_map_test/M2_S0_R2_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a2f7ca54ad0eb64cd13761d60506c4e96aaaf29e --- /dev/null +++ b/mlp_map_test/M2_S0_R2_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S0_R2_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S0_R2_P3.pt b/mlp_map_test/M2_S0_R2_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..458c1477ae6d3d0b7fe75f93838f88e3672d8612 --- /dev/null +++ b/mlp_map_test/M2_S0_R2_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5396e3d19fb80c8f09c75200ef1b52cf87231e3d67a5e28e6af216a8c491733b +size 153705072 diff --git a/mlp_map_test/M2_S0_R2_P3_config.json b/mlp_map_test/M2_S0_R2_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9e33c4031f64fdf4529bef00434bb1d1f35a7d2b --- /dev/null +++ b/mlp_map_test/M2_S0_R2_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S0_R2_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S0_R2_P6.pt b/mlp_map_test/M2_S0_R2_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..df644d24bf707faa5a855d604d4a59d9cbb2e113 --- /dev/null +++ b/mlp_map_test/M2_S0_R2_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad25d5f7443ebedb7eebee114c1be38dcfe2ac2033b52abc0c6c6de4eca14163 +size 153705072 diff --git a/mlp_map_test/M2_S0_R2_P6_config.json b/mlp_map_test/M2_S0_R2_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6ff1710dbf86944c2bb5f0684bb06de7467d6bfc --- /dev/null +++ b/mlp_map_test/M2_S0_R2_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S0_R2_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S0_R4_P3.pt b/mlp_map_test/M2_S0_R4_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..3166f17643dc9ceaddf1d6d206339240d38d9993 --- /dev/null +++ b/mlp_map_test/M2_S0_R4_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b012ce6634261ed6d42c2fd6ce75fc6911d0c40249aca87c9c1583ea6c255087 +size 153705072 diff --git a/mlp_map_test/M2_S0_R4_P3_config.json b/mlp_map_test/M2_S0_R4_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..cff6cb301fab9906e01911738e50b165c09ae0c2 --- /dev/null +++ b/mlp_map_test/M2_S0_R4_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S0_R4_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S0_R8_P1.pt b/mlp_map_test/M2_S0_R8_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe230465688e5e3fa9a36249817e2deae34f811f --- /dev/null +++ b/mlp_map_test/M2_S0_R8_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:052995be653781852dd92a6665f661a0e3dd5868da564e2af3ae83f9b7fad19c +size 153705072 diff --git a/mlp_map_test/M2_S0_R8_P1_config.json b/mlp_map_test/M2_S0_R8_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..3fbcbdd82ef11c37facd9889648f6bd404da487a --- /dev/null +++ b/mlp_map_test/M2_S0_R8_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S0_R8_P1" +} \ No newline at end of file