diff --git a/mlp_map_test/M0_S-10_R16_P2.pt b/mlp_map_test/M0_S-10_R16_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c4de1290de77af9de6770dc36217ac70ec29691 --- /dev/null +++ b/mlp_map_test/M0_S-10_R16_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a476d3aef4c5a1dcc75418e38609399e84fb2cb55b7dd460d0a07449aef9a18 +size 153705096 diff --git a/mlp_map_test/M0_S-10_R16_P2_config.json b/mlp_map_test/M0_S-10_R16_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..fa94eecef71e19ae9c48070959e000271cc1c33c --- /dev/null +++ b/mlp_map_test/M0_S-10_R16_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-10_R16_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-10_R16_P3.pt b/mlp_map_test/M0_S-10_R16_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..85d43cdf1de9806cf5282293ef3a3953f4caaa5b --- /dev/null +++ b/mlp_map_test/M0_S-10_R16_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f8e0615563aef8d1a9540b22e7223e6e80c3813d825b3aa49cd0355db998292 +size 153705096 diff --git a/mlp_map_test/M0_S-10_R16_P3_config.json b/mlp_map_test/M0_S-10_R16_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..4249cbc075473b8f6747db107376aec3d0a65166 --- /dev/null +++ b/mlp_map_test/M0_S-10_R16_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-10_R16_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-10_R16_P4.pt b/mlp_map_test/M0_S-10_R16_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..2643ccf751a6d92fe9b0a7b5b6fa9dcad1b8d5fc --- /dev/null +++ b/mlp_map_test/M0_S-10_R16_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25a46db602dbd14919d1c35b25e05cd34ff2e46e7b3b2449c6b16a267b1e184f +size 153705096 diff --git a/mlp_map_test/M0_S-10_R16_P4_config.json b/mlp_map_test/M0_S-10_R16_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..10633d71d5fdbca710aa094464560ce9a1a8cca4 --- /dev/null +++ b/mlp_map_test/M0_S-10_R16_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-10_R16_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-10_R16_P5.pt b/mlp_map_test/M0_S-10_R16_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..78c3e4157d6f03cae635205a1a94d312e0e2d400 --- /dev/null +++ b/mlp_map_test/M0_S-10_R16_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a85488e911ab5a73fc9d82a330e78c4184eed5007a6b0e1cabf54da3baec1f7 +size 153705096 diff --git a/mlp_map_test/M0_S-10_R16_P5_config.json b/mlp_map_test/M0_S-10_R16_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c3fef58fbf670a04dfc76cc0c21c89f237039491 --- /dev/null +++ b/mlp_map_test/M0_S-10_R16_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-10_R16_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-10_R4_P1.pt b/mlp_map_test/M0_S-10_R4_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..e017f2267b9a2595795d4906b54a1a9d8abfb47e --- /dev/null +++ b/mlp_map_test/M0_S-10_R4_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05e2b03ae00efdc04924bc67fd57561adc0ef02bcd70ec500e3612930c78d304 +size 153705088 diff --git a/mlp_map_test/M0_S-10_R4_P1_config.json b/mlp_map_test/M0_S-10_R4_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..5b3be82632b1af96b214c41fede33998a1804e04 --- /dev/null +++ b/mlp_map_test/M0_S-10_R4_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-10_R4_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-10_R4_P5.pt b/mlp_map_test/M0_S-10_R4_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..421c196f1818868f878270ec554665113ff67863 --- /dev/null +++ b/mlp_map_test/M0_S-10_R4_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d71afabdb9f20aa17f3e6a1576b42c6ab73c271c14da4109fb5028c37cbc36d +size 153705088 diff --git a/mlp_map_test/M0_S-10_R4_P5_config.json b/mlp_map_test/M0_S-10_R4_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..51c43b3b3aaa620b45a3ce87b5564b7a13402e5b --- /dev/null +++ b/mlp_map_test/M0_S-10_R4_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-10_R4_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-10_R8_P1.pt b/mlp_map_test/M0_S-10_R8_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..06e03f72cf20bd8e4cd008184bc50cfa2eb00c49 --- /dev/null +++ b/mlp_map_test/M0_S-10_R8_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc902d6b03e5f89da1308cd533dd49a3fbc503f117691e677522a46bcaa9a5ff +size 153705088 diff --git a/mlp_map_test/M0_S-10_R8_P1_config.json b/mlp_map_test/M0_S-10_R8_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..de86019f5688f5330b379707ccd970b031066b6d --- /dev/null +++ b/mlp_map_test/M0_S-10_R8_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-10_R8_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-10_R8_P2.pt b/mlp_map_test/M0_S-10_R8_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..2323a1098c2b3b8c1881110738889dcf8fb64537 --- /dev/null +++ b/mlp_map_test/M0_S-10_R8_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c72c5cb9c4d6b17693c77ca0a05a7c812e2d19d6e83ec0eeb2853d1f156b12d +size 153705088 diff --git a/mlp_map_test/M0_S-10_R8_P2_config.json b/mlp_map_test/M0_S-10_R8_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..f96f650a9feba539a05eda44a995fa400938a17d --- /dev/null +++ b/mlp_map_test/M0_S-10_R8_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-10_R8_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-10_R8_P3.pt b/mlp_map_test/M0_S-10_R8_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd749b7f7ba3010570e00cb9d7cf0298c174fc22 --- /dev/null +++ b/mlp_map_test/M0_S-10_R8_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39899c5a0eb2a0de2615591467f7133389e29c7cf6743642e743a0f8586b3c23 +size 153705088 diff --git a/mlp_map_test/M0_S-10_R8_P3_config.json b/mlp_map_test/M0_S-10_R8_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0bc8c71ef12b846ac9b504184033e8a1fe59a718 --- /dev/null +++ b/mlp_map_test/M0_S-10_R8_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-10_R8_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-2_R16_P1.pt b/mlp_map_test/M0_S-2_R16_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcf0bcf741536e76f3dc08ef343d4289988b493f --- /dev/null +++ b/mlp_map_test/M0_S-2_R16_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fcddc6c89f38a708069bae5fb748625dbb057c8214bec471f353d98838a844d +size 153705088 diff --git a/mlp_map_test/M0_S-2_R16_P1_config.json b/mlp_map_test/M0_S-2_R16_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..86497cb3eba71c74df4015f616ce975ea3f6402c --- /dev/null +++ b/mlp_map_test/M0_S-2_R16_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-2_R16_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-2_R16_P4.pt b/mlp_map_test/M0_S-2_R16_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..8613fb254fc8e919cf014b2029aae582cad4678c --- /dev/null +++ b/mlp_map_test/M0_S-2_R16_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0221c4acac9ff33d429738173547f422a82dadfbf4f5313e17a18a0b6fc2b4e0 +size 153705088 diff --git a/mlp_map_test/M0_S-2_R16_P4_config.json b/mlp_map_test/M0_S-2_R16_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1ddb43108d6afb369ac733a159ddf4926578c2c2 --- /dev/null +++ b/mlp_map_test/M0_S-2_R16_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-2_R16_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-2_R16_P6.pt b/mlp_map_test/M0_S-2_R16_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d50e954ac3bd58e6cf0a273b27deb81fb34bb3e --- /dev/null +++ b/mlp_map_test/M0_S-2_R16_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d54835151ee0f914c46031271ff86e17264ebd39be55897c2ab3364c65ef54cd +size 153705088 diff --git a/mlp_map_test/M0_S-2_R16_P6_config.json b/mlp_map_test/M0_S-2_R16_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..637fad7412142e273e4ceb5c71ed7816e44b0fd9 --- /dev/null +++ b/mlp_map_test/M0_S-2_R16_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-2_R16_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-2_R1_P0.pt b/mlp_map_test/M0_S-2_R1_P0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f1263e288478ccbcba36cf45c65ab7093fe4bf4 --- /dev/null +++ b/mlp_map_test/M0_S-2_R1_P0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35a794ba2abdc801c955216c172bd99f67f0b8af8847c5bb25276bf55765bfba +size 153705080 diff --git a/mlp_map_test/M0_S-2_R1_P0_config.json b/mlp_map_test/M0_S-2_R1_P0_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e939e3448e78bc204729a544e9fe3e30d63ef681 --- /dev/null +++ b/mlp_map_test/M0_S-2_R1_P0_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 1, + "l1_p": 0, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-2_R1_P0" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-2_R2_P2.pt b/mlp_map_test/M0_S-2_R2_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..a63c6b2db5a32a8ba68354797b13a913a33218a8 --- /dev/null +++ b/mlp_map_test/M0_S-2_R2_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e824360311d126899f3afa8aaa8c9694bc76c9d6824685f11158bad9f347e95b +size 153705080 diff --git a/mlp_map_test/M0_S-2_R2_P2_config.json b/mlp_map_test/M0_S-2_R2_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..4e0d308f9ad6a5ded9a532f20be0cf2c9034056a --- /dev/null +++ b/mlp_map_test/M0_S-2_R2_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-2_R2_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-2_R2_P3.pt b/mlp_map_test/M0_S-2_R2_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..379054a0c1cb43d8ddf51fb2174951a3b30d0337 --- /dev/null +++ b/mlp_map_test/M0_S-2_R2_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22e0adffbde68d106fb7352f1bda49a9e2bbd7a29204e453444ab9e41b26180f +size 153705080 diff --git a/mlp_map_test/M0_S-2_R2_P3_config.json b/mlp_map_test/M0_S-2_R2_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..792fd05d06e2768986c6770202f56d1158822b76 --- /dev/null +++ b/mlp_map_test/M0_S-2_R2_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-2_R2_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-2_R2_P6.pt b/mlp_map_test/M0_S-2_R2_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac4377559d273c7763d287bc94e6ebfe7d1a3418 --- /dev/null +++ b/mlp_map_test/M0_S-2_R2_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9c0096062a00d780ba2059a0428c9edf6a7dcfa11a0a8a755c60e2872b8b83e +size 153705080 diff --git a/mlp_map_test/M0_S-2_R2_P6_config.json b/mlp_map_test/M0_S-2_R2_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6cc9e2841699d384379b3c47798933ec3ccb087c --- /dev/null +++ b/mlp_map_test/M0_S-2_R2_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-2_R2_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-2_R4_P2.pt b/mlp_map_test/M0_S-2_R4_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..496b84e0171843cbf60cdaa4869cda1eddafc042 --- /dev/null +++ b/mlp_map_test/M0_S-2_R4_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0dc239455dd8d2730ec3d6281a8a6970c9533fe57c8fbfd87d854cd02f1a056 +size 153705080 diff --git a/mlp_map_test/M0_S-2_R4_P2_config.json b/mlp_map_test/M0_S-2_R4_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1f501708e173951ba4ba507bce7292e9168f0da3 --- /dev/null +++ b/mlp_map_test/M0_S-2_R4_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-2_R4_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-2_R8_P1.pt b/mlp_map_test/M0_S-2_R8_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..b38fd9bec9310234c3292b81a5611c692eb357b9 --- /dev/null +++ b/mlp_map_test/M0_S-2_R8_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd089c61fe3b8f6377e1e637136c8fe5936e49136e68fabe3b67639beb77e69f +size 153705080 diff --git a/mlp_map_test/M0_S-2_R8_P1_config.json b/mlp_map_test/M0_S-2_R8_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..bf7cf9791cd6a539d174684a112bacd17e366f2e --- /dev/null +++ b/mlp_map_test/M0_S-2_R8_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-2_R8_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-2_R8_P6.pt b/mlp_map_test/M0_S-2_R8_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..70c5ef05e9927cfab6cfe40f61c105714fbd762d --- /dev/null +++ b/mlp_map_test/M0_S-2_R8_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:444bea44001a54b7c3b3236ce2ee724ec413d73eac1e176e86c3978732454bc6 +size 153705080 diff --git a/mlp_map_test/M0_S-2_R8_P6_config.json b/mlp_map_test/M0_S-2_R8_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..936100313861904c3af2db73e5fed8f44c48b883 --- /dev/null +++ b/mlp_map_test/M0_S-2_R8_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-2_R8_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-4_R1_P0.pt b/mlp_map_test/M0_S-4_R1_P0.pt new file mode 100644 index 0000000000000000000000000000000000000000..74e0821164b355961fcb80072a9349dd2dadfddd --- /dev/null +++ b/mlp_map_test/M0_S-4_R1_P0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9343d0e4a26550fb8bc89c5b28e44dce35b5b15de7e597823f38808dc58eb497 +size 153705080 diff --git a/mlp_map_test/M0_S-4_R1_P0_config.json b/mlp_map_test/M0_S-4_R1_P0_config.json new file mode 100644 index 0000000000000000000000000000000000000000..3286996a0ed480d731993a94286f68da62c24ee8 --- /dev/null +++ b/mlp_map_test/M0_S-4_R1_P0_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 1, + "l1_p": 0, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-4_R1_P0" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-4_R2_P2.pt b/mlp_map_test/M0_S-4_R2_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..329dd0efc05578a1b2a1f6726a319aac8edfa6e5 --- /dev/null +++ b/mlp_map_test/M0_S-4_R2_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e98075cc14067e15ea786d491a3bd58133b766b412e26f9fe6773d2d68a16b50 +size 153705080 diff --git a/mlp_map_test/M0_S-4_R2_P2_config.json b/mlp_map_test/M0_S-4_R2_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9afaaacfaad26960e6020ef94c905bc2c333b253 --- /dev/null +++ b/mlp_map_test/M0_S-4_R2_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-4_R2_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-4_R2_P5.pt b/mlp_map_test/M0_S-4_R2_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..973cd0ac9d614357d47f7f69995f19fdef6c4e79 --- /dev/null +++ b/mlp_map_test/M0_S-4_R2_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4e85a33973a1a7e5a2417de023819a307b4268232f8a6245fd9b33031b14aa9 +size 153705080 diff --git a/mlp_map_test/M0_S-4_R2_P5_config.json b/mlp_map_test/M0_S-4_R2_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9fef3888c754bb95469749ad09cf68a97d8f2b55 --- /dev/null +++ b/mlp_map_test/M0_S-4_R2_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-4_R2_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-4_R4_P3.pt b/mlp_map_test/M0_S-4_R4_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..c44ef9cb72a8b8d06aa62d9f675d3df9606c0933 --- /dev/null +++ b/mlp_map_test/M0_S-4_R4_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a74f2eada1afa47e29f97115efd783050cd0202de87e8be1a81268c24109f09 +size 153705080 diff --git a/mlp_map_test/M0_S-4_R4_P3_config.json b/mlp_map_test/M0_S-4_R4_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..adaeb0ee3e73a3f01e3afa24c2191d1f3483cbf7 --- /dev/null +++ b/mlp_map_test/M0_S-4_R4_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-4_R4_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-4_R8_P4.pt b/mlp_map_test/M0_S-4_R8_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..c44da61c7a17c588881c8471acec0170631aaa53 --- /dev/null +++ b/mlp_map_test/M0_S-4_R8_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cb3af53c98345aec597d8431a88eea554620b047c5e1e31b329da4d24b1e639 +size 153705080 diff --git a/mlp_map_test/M0_S-4_R8_P4_config.json b/mlp_map_test/M0_S-4_R8_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..780520f464bf5a5f3c37efb520313d2dd5a2669e --- /dev/null +++ b/mlp_map_test/M0_S-4_R8_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-4_R8_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-6_R16_P3.pt b/mlp_map_test/M0_S-6_R16_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..a241ddf8cf78e236a14f2fb8c4259ae644963eac --- /dev/null +++ b/mlp_map_test/M0_S-6_R16_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f410085c13cb1ac593dcdde8365300d35d3c5287974a60a84feee4b76f116c74 +size 153705088 diff --git a/mlp_map_test/M0_S-6_R16_P3_config.json b/mlp_map_test/M0_S-6_R16_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..d76bbca27c5c79d9ba432f8bc820c942de110bc6 --- /dev/null +++ b/mlp_map_test/M0_S-6_R16_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-6_R16_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-6_R16_P5.pt b/mlp_map_test/M0_S-6_R16_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..31cf672116e24a842e3225f8a8724cc67f46eefd --- /dev/null +++ b/mlp_map_test/M0_S-6_R16_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67a5e315b4b3a250e5d3a2b5e230f0181a75cc2b412eac665f2fa154de227609 +size 153705088 diff --git a/mlp_map_test/M0_S-6_R16_P5_config.json b/mlp_map_test/M0_S-6_R16_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..ef1cbcf1e5530cf15dcb7552b662cb5ad455005c --- /dev/null +++ b/mlp_map_test/M0_S-6_R16_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-6_R16_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-6_R2_P4.pt b/mlp_map_test/M0_S-6_R2_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..230bf4bebb863cc39cca15787eee4d56490500ed --- /dev/null +++ b/mlp_map_test/M0_S-6_R2_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bf4a4a8d06ef08734e7342e02e8ec37fcd2084deb65dcd83c91ad8cb68ed717 +size 153705080 diff --git a/mlp_map_test/M0_S-6_R2_P4_config.json b/mlp_map_test/M0_S-6_R2_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..15ea1d9684497d16350a30b8a915443ba234d9f5 --- /dev/null +++ b/mlp_map_test/M0_S-6_R2_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-6_R2_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-6_R4_P3.pt b/mlp_map_test/M0_S-6_R4_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..c83bbdae177efdc1ca810064321c6b41c14753a6 --- /dev/null +++ b/mlp_map_test/M0_S-6_R4_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee5c334b32f5ab2bb80363d3eb431af75a46d2098282e4a3278a42cd2ed9ac83 +size 153705080 diff --git a/mlp_map_test/M0_S-6_R4_P3_config.json b/mlp_map_test/M0_S-6_R4_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..187a4db4e588afc9361fc0fabda1b93c02212699 --- /dev/null +++ b/mlp_map_test/M0_S-6_R4_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-6_R4_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-6_R4_P4.pt b/mlp_map_test/M0_S-6_R4_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..8965ae86dfcec6cc5c42b9e88b72a9b73dd33e05 --- /dev/null +++ b/mlp_map_test/M0_S-6_R4_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60f0a4b7f10130c62096b1f58fb07c3fc9c2b27ff6dcba8600c263695f3772ef +size 153705080 diff --git a/mlp_map_test/M0_S-6_R4_P4_config.json b/mlp_map_test/M0_S-6_R4_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..94cfc46a413ce09f758ee52a2c38ce1ae25d4161 --- /dev/null +++ b/mlp_map_test/M0_S-6_R4_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-6_R4_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-6_R8_P1.pt b/mlp_map_test/M0_S-6_R8_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..f331a3c85d8b9314a7e6bf8e15dc201df2875b11 --- /dev/null +++ b/mlp_map_test/M0_S-6_R8_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3e7316a1421f45549575eba797bc55333c70bff8becf151781cb389868a2db8 +size 153705080 diff --git a/mlp_map_test/M0_S-6_R8_P1_config.json b/mlp_map_test/M0_S-6_R8_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9b9768a5dd2e2da3ef944c1ffd26b8ff6eef1875 --- /dev/null +++ b/mlp_map_test/M0_S-6_R8_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-6_R8_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-8_R16_P2.pt b/mlp_map_test/M0_S-8_R16_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd46ea4463dbb04062c3c00d074cae139ef06e8a --- /dev/null +++ b/mlp_map_test/M0_S-8_R16_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46cc9e5273e0dae7a31e4402f2b354eba9e8ac21f69686d7d7b9b3e3e9540182 +size 153705088 diff --git a/mlp_map_test/M0_S-8_R16_P2_config.json b/mlp_map_test/M0_S-8_R16_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..921aeaa3155ee6ae2c4204eec0ed20a852ee83c4 --- /dev/null +++ b/mlp_map_test/M0_S-8_R16_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-8_R16_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-8_R2_P3.pt b/mlp_map_test/M0_S-8_R2_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..7230d08ccb8d68d21544ce7bc0642766f76e89c5 --- /dev/null +++ b/mlp_map_test/M0_S-8_R2_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c9be4ca74f85f0528718d1ea8387a54b5b923def2b90d7515d516aefaddb009 +size 153705080 diff --git a/mlp_map_test/M0_S-8_R2_P3_config.json b/mlp_map_test/M0_S-8_R2_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..f55b7b82dbfa44783073484bf795b484560fe0f9 --- /dev/null +++ b/mlp_map_test/M0_S-8_R2_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-8_R2_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-8_R4_P4.pt b/mlp_map_test/M0_S-8_R4_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..6524051d20875f14c933cd5c3ba57440459e05d5 --- /dev/null +++ b/mlp_map_test/M0_S-8_R4_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c745fcf5a4c7273740ba4abbc5c6a574d677f014949a07989debf261991bbd2 +size 153705080 diff --git a/mlp_map_test/M0_S-8_R4_P4_config.json b/mlp_map_test/M0_S-8_R4_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..549e91ad3864459140048677fe0f6443d9e14f55 --- /dev/null +++ b/mlp_map_test/M0_S-8_R4_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-8_R4_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-8_R4_P5.pt b/mlp_map_test/M0_S-8_R4_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..a678f04567cf13a50a728e06bc3cceddb1281292 --- /dev/null +++ b/mlp_map_test/M0_S-8_R4_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d8b202c151b99eca84e0134fb1ca855f6dee8d4f0add9ec3aef1d6462208969 +size 153705080 diff --git a/mlp_map_test/M0_S-8_R4_P5_config.json b/mlp_map_test/M0_S-8_R4_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..11ada75ac82f02d2e63732c6726aadcb8ec9dd7b --- /dev/null +++ b/mlp_map_test/M0_S-8_R4_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-8_R4_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S-8_R8_P2.pt b/mlp_map_test/M0_S-8_R8_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..137800f4329316cd78382c404105e7aefd32e90a --- /dev/null +++ b/mlp_map_test/M0_S-8_R8_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fff6165935707501cf729de23fec3c931a8b8a6fb7a91125de0ddcf6337efda +size 153705080 diff --git a/mlp_map_test/M0_S-8_R8_P2_config.json b/mlp_map_test/M0_S-8_R8_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e84523ff06d548383570f80f2983757caea6b179 --- /dev/null +++ b/mlp_map_test/M0_S-8_R8_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S-8_R8_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S0_R2_P3.pt b/mlp_map_test/M0_S0_R2_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1bd5acdafe4e2ab49e473bfe97da603454ed278 --- /dev/null +++ b/mlp_map_test/M0_S0_R2_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38dbbad683693e83e290be987a02cc17f531d5dd885dc5e4603cbe02f9e25ba4 +size 153705072 diff --git a/mlp_map_test/M0_S0_R2_P3_config.json b/mlp_map_test/M0_S0_R2_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9f21469abb5bf4800ab46147a5b828b6b72074df --- /dev/null +++ b/mlp_map_test/M0_S0_R2_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S0_R2_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S0_R2_P5.pt b/mlp_map_test/M0_S0_R2_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1bf8ab917a10102e08bcf69bcfa65cb551cfc2c --- /dev/null +++ b/mlp_map_test/M0_S0_R2_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dce62ab087e9e38dddf6783097869bfc1881d03559b5e5537c79290d0c4db1d +size 153705072 diff --git a/mlp_map_test/M0_S0_R2_P5_config.json b/mlp_map_test/M0_S0_R2_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a7e8eae94fc3b4c59e0de9f01db10270a710f116 --- /dev/null +++ b/mlp_map_test/M0_S0_R2_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S0_R2_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S0_R8_P1.pt b/mlp_map_test/M0_S0_R8_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..1828e6ab746c968755271a1828f291fdc3e1fbf3 --- /dev/null +++ b/mlp_map_test/M0_S0_R8_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5610177e1268d7b8506d717269204b1cd0da1bd96cfcd3ebc82f938d04090037 +size 153705072 diff --git a/mlp_map_test/M0_S0_R8_P1_config.json b/mlp_map_test/M0_S0_R8_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..3ba8f16db679593cc86bc2596a8f3da469a59a6b --- /dev/null +++ b/mlp_map_test/M0_S0_R8_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S0_R8_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M0_S0_R8_P2.pt b/mlp_map_test/M0_S0_R8_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9c778620281138217b9b2e75f830243bf63150f --- /dev/null +++ b/mlp_map_test/M0_S0_R8_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5f3ac458fe97ca42b3c8e888226fddc216281810a1e7e9bec775252b1ca61a3 +size 153705072 diff --git a/mlp_map_test/M0_S0_R8_P2_config.json b/mlp_map_test/M0_S0_R8_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..fde5426f7c12d7582784aae2446ad4c38cc595ca --- /dev/null +++ b/mlp_map_test/M0_S0_R8_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 0, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M0_S0_R8_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-10_R16_P1.pt b/mlp_map_test/M1_S-10_R16_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a4753116d58d95c933268f7017cad91e45380de --- /dev/null +++ b/mlp_map_test/M1_S-10_R16_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0affe2dc3be57c4ce0ae5fa583a1da0dba3c8ba736e58b6aa60efd003a1d3916 +size 153705096 diff --git a/mlp_map_test/M1_S-10_R16_P1_config.json b/mlp_map_test/M1_S-10_R16_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..f9c90cde56fdd8e65871a8e2d7c1100fd64f2c11 --- /dev/null +++ b/mlp_map_test/M1_S-10_R16_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-10_R16_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-10_R2_P6.pt b/mlp_map_test/M1_S-10_R2_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..7354797b9bb6b2f99e4bec188e967f71ef450256 --- /dev/null +++ b/mlp_map_test/M1_S-10_R2_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30961f196efb2b38ce36f4b8e78158ef5983825a00ffae2e80ea447f7d59f3ea +size 153705088 diff --git a/mlp_map_test/M1_S-10_R2_P6_config.json b/mlp_map_test/M1_S-10_R2_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..fd990a76e4ac2a6dcde3945596fe3979b0d24d80 --- /dev/null +++ b/mlp_map_test/M1_S-10_R2_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-10_R2_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-10_R4_P6.pt b/mlp_map_test/M1_S-10_R4_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3c4d68d78c22bf07f2fe76b29cdaa3179d41c13 --- /dev/null +++ b/mlp_map_test/M1_S-10_R4_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03756cb79f5d7953c07564095aed2e32380810e5ac6ea36a0d8d4bf47f6c7643 +size 153705088 diff --git a/mlp_map_test/M1_S-10_R4_P6_config.json b/mlp_map_test/M1_S-10_R4_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2d0357060d3956940f50f508a96a023b4cfe6c4e --- /dev/null +++ b/mlp_map_test/M1_S-10_R4_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-10_R4_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-10_R8_P1.pt b/mlp_map_test/M1_S-10_R8_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..169c61d7f00ec66349438a26a73cc44d3d2bd645 --- /dev/null +++ b/mlp_map_test/M1_S-10_R8_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61c3ade4cf2981a77599bcad59aa435f7945ba216ed6d50a2bd28cb7b848fdf8 +size 153705088 diff --git a/mlp_map_test/M1_S-10_R8_P1_config.json b/mlp_map_test/M1_S-10_R8_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..3154d90740ed111a30753cb3de080710137764d0 --- /dev/null +++ b/mlp_map_test/M1_S-10_R8_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-10_R8_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-2_R16_P1.pt b/mlp_map_test/M1_S-2_R16_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..15851509cec548d2f0ec80b580f6d76e7caea756 --- /dev/null +++ b/mlp_map_test/M1_S-2_R16_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbf74540918cce9f0fe0868f3c38cfd6bb29ee12e7dc81c09f58b7c9ae31e625 +size 153705088 diff --git a/mlp_map_test/M1_S-2_R16_P1_config.json b/mlp_map_test/M1_S-2_R16_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0893297de8eccbc3c51e67bc58205090a7e22a0d --- /dev/null +++ b/mlp_map_test/M1_S-2_R16_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-2_R16_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-2_R1_P0.pt b/mlp_map_test/M1_S-2_R1_P0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfdb33ea7ac884bf23f2a310d740da4c48c58804 --- /dev/null +++ b/mlp_map_test/M1_S-2_R1_P0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2887bd8619b85f316544cbbf84c191e7042a74f870b1e148d1d8df7b84ee001a +size 153705080 diff --git a/mlp_map_test/M1_S-2_R1_P0_config.json b/mlp_map_test/M1_S-2_R1_P0_config.json new file mode 100644 index 0000000000000000000000000000000000000000..d1c582e657ea3813fc0e9cdd344fde0737dfa8d0 --- /dev/null +++ b/mlp_map_test/M1_S-2_R1_P0_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 1, + "l1_p": 0, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-2_R1_P0" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-2_R4_P1.pt b/mlp_map_test/M1_S-2_R4_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..79d4ab091fbad243e5f8e8c34eb7f7f0c9033912 --- /dev/null +++ b/mlp_map_test/M1_S-2_R4_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3e094738a8783a904a5082bfccf42a2f851e0c54a73e0d0ba1cb0f45d07afe9 +size 153705080 diff --git a/mlp_map_test/M1_S-2_R4_P1_config.json b/mlp_map_test/M1_S-2_R4_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..de085cd503246b4e69d2d840bc3f67e5c89e018e --- /dev/null +++ b/mlp_map_test/M1_S-2_R4_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-2_R4_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-2_R4_P5.pt b/mlp_map_test/M1_S-2_R4_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..102c8737bbf8c15ed1e0f2c37ebeaf7ad3768c6f --- /dev/null +++ b/mlp_map_test/M1_S-2_R4_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1065b05d9998403a5b0d5048833db1192cf4363027038385a5f395a86594de8 +size 153705080 diff --git a/mlp_map_test/M1_S-2_R4_P5_config.json b/mlp_map_test/M1_S-2_R4_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..bbcb78c8beae05c2f530182c78e64c868a856754 --- /dev/null +++ b/mlp_map_test/M1_S-2_R4_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-2_R4_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-2_R8_P4.pt b/mlp_map_test/M1_S-2_R8_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0ef641d0816da5493fe418d01b938b0710eebe4 --- /dev/null +++ b/mlp_map_test/M1_S-2_R8_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b26a245779b734247a3c6d48530d470272eb3f3b0ca1abd348ddf994c793a84 +size 153705080 diff --git a/mlp_map_test/M1_S-2_R8_P4_config.json b/mlp_map_test/M1_S-2_R8_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e5788d26aa7f901acb480f45ebf09f7d89398f87 --- /dev/null +++ b/mlp_map_test/M1_S-2_R8_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-2_R8_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-4_R16_P6.pt b/mlp_map_test/M1_S-4_R16_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..e01795ea45fd9b0cd06c1e0526ff89c00057c0ff --- /dev/null +++ b/mlp_map_test/M1_S-4_R16_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87ce0f9392dc1455698cdead8f65b4ff6b9dfedf0c0c446d5bbbf125dd98ac9c +size 153705088 diff --git a/mlp_map_test/M1_S-4_R16_P6_config.json b/mlp_map_test/M1_S-4_R16_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..f145e4966189f1be269b130da97ddf1895ee260c --- /dev/null +++ b/mlp_map_test/M1_S-4_R16_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-4_R16_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-4_R4_P2.pt b/mlp_map_test/M1_S-4_R4_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..93156bc86e2ee671ce4e753ec65a6adb38787956 --- /dev/null +++ b/mlp_map_test/M1_S-4_R4_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b578fbcf218142cd53bae0bc3edefff7f1894352bb9cbce2dfdaa736240cc6b7 +size 153705080 diff --git a/mlp_map_test/M1_S-4_R4_P2_config.json b/mlp_map_test/M1_S-4_R4_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..09f4675ac0e55555f9cc40dac035118133bd3a29 --- /dev/null +++ b/mlp_map_test/M1_S-4_R4_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-4_R4_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-4_R4_P5.pt b/mlp_map_test/M1_S-4_R4_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b2f986846f73963fe703a6f4e01f5432477ec33 --- /dev/null +++ b/mlp_map_test/M1_S-4_R4_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8a2df0398b80ba296e1961eaea132d49a53a6f6bc63a011758698d7589b61a0 +size 153705080 diff --git a/mlp_map_test/M1_S-4_R4_P5_config.json b/mlp_map_test/M1_S-4_R4_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..3e40ca467aa2c76cd882744c9e2aaf81bf954877 --- /dev/null +++ b/mlp_map_test/M1_S-4_R4_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-4_R4_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-4_R4_P6.pt b/mlp_map_test/M1_S-4_R4_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..f33f354fcb22ecf8ad61e62d9a315c5580b70eb8 --- /dev/null +++ b/mlp_map_test/M1_S-4_R4_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bec7fe4ec5ae51230f7e0c4470d88bd71ba62caa1cbdba095ac820cd9262b5d2 +size 153705080 diff --git a/mlp_map_test/M1_S-4_R4_P6_config.json b/mlp_map_test/M1_S-4_R4_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6b70517e51eb99884672a08cbfc13a850d30025 --- /dev/null +++ b/mlp_map_test/M1_S-4_R4_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-4_R4_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-4_R8_P3.pt b/mlp_map_test/M1_S-4_R8_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..55200d45a942c40a8ce0b800127865ee05a27656 --- /dev/null +++ b/mlp_map_test/M1_S-4_R8_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9f9cd0b60245fd382414f38cb91f89ec297ef91d4d8c2ccf2bd2136d4f97019 +size 153705080 diff --git a/mlp_map_test/M1_S-4_R8_P3_config.json b/mlp_map_test/M1_S-4_R8_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..5fd3bc458d681e32e335b3d3baaf38fbc9171af6 --- /dev/null +++ b/mlp_map_test/M1_S-4_R8_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-4_R8_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-4_R8_P6.pt b/mlp_map_test/M1_S-4_R8_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..31785a27a80c49b847b5228a2929487bf879c5dc --- /dev/null +++ b/mlp_map_test/M1_S-4_R8_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a786e4583551a9ea3da73c5f6d18ed024a3b9512aa816499990851a283def5da +size 153705080 diff --git a/mlp_map_test/M1_S-4_R8_P6_config.json b/mlp_map_test/M1_S-4_R8_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..99cbef87ddecb13309c563d92fb1a799c404973a --- /dev/null +++ b/mlp_map_test/M1_S-4_R8_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-4_R8_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-6_R16_P2.pt b/mlp_map_test/M1_S-6_R16_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7dfeae3904ed7667853065d36bd3425f77716d1 --- /dev/null +++ b/mlp_map_test/M1_S-6_R16_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a0a6f8cb8abf003b65ea19bd07b80319a1d96a847e45f664f399bc1fb287cf6 +size 153705088 diff --git a/mlp_map_test/M1_S-6_R16_P2_config.json b/mlp_map_test/M1_S-6_R16_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..68ef7dd512ce6911fa7c94f33fc5a5466fab6244 --- /dev/null +++ b/mlp_map_test/M1_S-6_R16_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-6_R16_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-6_R16_P3.pt b/mlp_map_test/M1_S-6_R16_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..54abaa6dcf5f5ace24535a0894f9f4a3935bc650 --- /dev/null +++ b/mlp_map_test/M1_S-6_R16_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7bfa04bc0a4b7a2f8f79710da31e6d5f85ef7579ec528e541e43bcad5a4d0ff +size 153705088 diff --git a/mlp_map_test/M1_S-6_R16_P3_config.json b/mlp_map_test/M1_S-6_R16_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..eafd0af9af8190cbf556221c7d5e90d41b6fcd30 --- /dev/null +++ b/mlp_map_test/M1_S-6_R16_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-6_R16_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-6_R2_P2.pt b/mlp_map_test/M1_S-6_R2_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7f8e1572a18f2bd36db44bc432376285dd5f757 --- /dev/null +++ b/mlp_map_test/M1_S-6_R2_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:543ef04a54519a96c0b2ebfa578521dea9ce6b82e7606dc73dfebca682efbb97 +size 153705080 diff --git a/mlp_map_test/M1_S-6_R2_P2_config.json b/mlp_map_test/M1_S-6_R2_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2613d9ab9ea13927d142c96b852ca5d093900cf2 --- /dev/null +++ b/mlp_map_test/M1_S-6_R2_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-6_R2_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-6_R4_P1.pt b/mlp_map_test/M1_S-6_R4_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4d385b241f712e673ed5e4e71bb01c95aa619ea --- /dev/null +++ b/mlp_map_test/M1_S-6_R4_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c692acc8fe995c83d2642d010ce7cda4df14604ee4e9cd106994af12ce05fbb6 +size 153705080 diff --git a/mlp_map_test/M1_S-6_R4_P1_config.json b/mlp_map_test/M1_S-6_R4_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9f9fece86852eae41c26d96d3933a9eb49c71a27 --- /dev/null +++ b/mlp_map_test/M1_S-6_R4_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-6_R4_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-6_R4_P3.pt b/mlp_map_test/M1_S-6_R4_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f0fd582181b90f7d76dca727c49c2b0f4e1802b --- /dev/null +++ b/mlp_map_test/M1_S-6_R4_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e84f9dd253a922b8da50450a89a0369a08fd640ac33c78454e000d4d59ef813f +size 153705080 diff --git a/mlp_map_test/M1_S-6_R4_P3_config.json b/mlp_map_test/M1_S-6_R4_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..d83e8210a83a83ebc62302fc2964f817438220d5 --- /dev/null +++ b/mlp_map_test/M1_S-6_R4_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-6_R4_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-6_R4_P6.pt b/mlp_map_test/M1_S-6_R4_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..52bdd4bc38a868a9d0018d92a44c69d352aa6718 --- /dev/null +++ b/mlp_map_test/M1_S-6_R4_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4013ccd89e3fbe4e6cd0ae07d38ae0c8f6be0f9450af9478d3e83b110b9374b +size 153705080 diff --git a/mlp_map_test/M1_S-6_R4_P6_config.json b/mlp_map_test/M1_S-6_R4_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..4e2dc5569a25a8ede3f4beb524a3e2b02da47009 --- /dev/null +++ b/mlp_map_test/M1_S-6_R4_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-6_R4_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-6_R8_P2.pt b/mlp_map_test/M1_S-6_R8_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..befcd4e7882e30ba7e8be65cccfca7fe0c71a1eb --- /dev/null +++ b/mlp_map_test/M1_S-6_R8_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c14e0edd24becedbc0d08e8d57c7e9faca8d5458553d97ace52239c926ddf296 +size 153705080 diff --git a/mlp_map_test/M1_S-6_R8_P2_config.json b/mlp_map_test/M1_S-6_R8_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..20f3dbe2955a7c59cda7b008aff9b89d18b976bc --- /dev/null +++ b/mlp_map_test/M1_S-6_R8_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-6_R8_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-6_R8_P5.pt b/mlp_map_test/M1_S-6_R8_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2f50797779abfba2a2bf7b14b4de3a5649d4fa6 --- /dev/null +++ b/mlp_map_test/M1_S-6_R8_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ee860563bf96c1110c428dbc5d3a7e6d41c3376a009168334e823cb176b6e23 +size 153705080 diff --git a/mlp_map_test/M1_S-6_R8_P5_config.json b/mlp_map_test/M1_S-6_R8_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..f58c3d6e6911cdbbbb0a8011ba37fd2f3ba40b95 --- /dev/null +++ b/mlp_map_test/M1_S-6_R8_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-6_R8_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-8_R16_P4.pt b/mlp_map_test/M1_S-8_R16_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..668babfc4858b411bfe147bc4e50fc1212f9891b --- /dev/null +++ b/mlp_map_test/M1_S-8_R16_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4078ea944603e1f78d8c5fe2278bf62c0bfc85989cd04736f977aafe343ceb50 +size 153705088 diff --git a/mlp_map_test/M1_S-8_R16_P4_config.json b/mlp_map_test/M1_S-8_R16_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..eade7f473809fba93ea62a0fbcf0d77a0c102282 --- /dev/null +++ b/mlp_map_test/M1_S-8_R16_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-8_R16_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-8_R2_P1.pt b/mlp_map_test/M1_S-8_R2_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..b812190e85d8061bf1f7e7956e3c1a04c6e85fc6 --- /dev/null +++ b/mlp_map_test/M1_S-8_R2_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:505b15208bf07415e633ba7dd47fc883b1f60ad658af999ded0afc218a9855b2 +size 153705080 diff --git a/mlp_map_test/M1_S-8_R2_P1_config.json b/mlp_map_test/M1_S-8_R2_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..8a6181f28b6b67aa20876449d3d06350f03586af --- /dev/null +++ b/mlp_map_test/M1_S-8_R2_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-8_R2_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-8_R2_P2.pt b/mlp_map_test/M1_S-8_R2_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0d19d468b611479e78aa3df04869420809cd643 --- /dev/null +++ b/mlp_map_test/M1_S-8_R2_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9752bd168fc1ae9d07718e306c4b4cbdccc85edcdc4486b96c5a0fbd8f04b73a +size 153705080 diff --git a/mlp_map_test/M1_S-8_R2_P2_config.json b/mlp_map_test/M1_S-8_R2_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..66d5ba1b4640ce2d1bc26d4808f7696671d9d182 --- /dev/null +++ b/mlp_map_test/M1_S-8_R2_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-8_R2_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-8_R2_P3.pt b/mlp_map_test/M1_S-8_R2_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..09ce4219e3a9dc465d0fe05177c7d2fe5dd94df6 --- /dev/null +++ b/mlp_map_test/M1_S-8_R2_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa3550014c9c129c08b6c6b6d72bfdfb9244745d218dd94b4721194bcc3c06ff +size 153705080 diff --git a/mlp_map_test/M1_S-8_R2_P3_config.json b/mlp_map_test/M1_S-8_R2_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..dfe238d3879448121c9037746d841b16ab0696c5 --- /dev/null +++ b/mlp_map_test/M1_S-8_R2_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-8_R2_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-8_R4_P6.pt b/mlp_map_test/M1_S-8_R4_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6bae76cddb15c88943a6f2709bb1b6d9b554083 --- /dev/null +++ b/mlp_map_test/M1_S-8_R4_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80566db5a74523ccb6608f12f0c02cd758355958e95395aa55d77ace56171ae5 +size 153705080 diff --git a/mlp_map_test/M1_S-8_R4_P6_config.json b/mlp_map_test/M1_S-8_R4_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..843385f550a173c09de362c794731bdb7ad5204a --- /dev/null +++ b/mlp_map_test/M1_S-8_R4_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-8_R4_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-8_R8_P3.pt b/mlp_map_test/M1_S-8_R8_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..7902a811791774ad9205a5e67de904c90dc18ca0 --- /dev/null +++ b/mlp_map_test/M1_S-8_R8_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:275b24f9e0cbadaaed2d76a774979e97a0378d7837d911b6693842616549bade +size 153705080 diff --git a/mlp_map_test/M1_S-8_R8_P3_config.json b/mlp_map_test/M1_S-8_R8_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..cf80c6dd9d3e40b803c43ffe541c9b4f72e38584 --- /dev/null +++ b/mlp_map_test/M1_S-8_R8_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-8_R8_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S-8_R8_P5.pt b/mlp_map_test/M1_S-8_R8_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..4912a191eea4156cf83ea527fde8fe2931bee36d --- /dev/null +++ b/mlp_map_test/M1_S-8_R8_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:915b5314807602b2b9d8833b3a2a96ba9d541704b51fc4ff62b9be294d5ef1ce +size 153705080 diff --git a/mlp_map_test/M1_S-8_R8_P5_config.json b/mlp_map_test/M1_S-8_R8_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9174967d36bfce08019ee87ee329445424bcd883 --- /dev/null +++ b/mlp_map_test/M1_S-8_R8_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S-8_R8_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S0_R16_P2.pt b/mlp_map_test/M1_S0_R16_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d1b368bf99476becac54e2bc1b0422a21b10cb1 --- /dev/null +++ b/mlp_map_test/M1_S0_R16_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a65f6542f0353cc6d3ed68e8f5b4b6efeb011a762eb69380b5fbc5830d2972e +size 153705080 diff --git a/mlp_map_test/M1_S0_R16_P2_config.json b/mlp_map_test/M1_S0_R16_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..b48a355cedb29dd680821c01330fb1f5fb3b3b63 --- /dev/null +++ b/mlp_map_test/M1_S0_R16_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S0_R16_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S0_R16_P4.pt b/mlp_map_test/M1_S0_R16_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..427d9f3c6e4c7ed53859b18c22390405368be7db --- /dev/null +++ b/mlp_map_test/M1_S0_R16_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11bd9f833dcb4ccdd0a01d27a344b3a206e1bf809674cc14084875b3631b86eb +size 153705080 diff --git a/mlp_map_test/M1_S0_R16_P4_config.json b/mlp_map_test/M1_S0_R16_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..fc2e8165e01a8d58e7ce09ce201ba0720ffbdf09 --- /dev/null +++ b/mlp_map_test/M1_S0_R16_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S0_R16_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S0_R16_P6.pt b/mlp_map_test/M1_S0_R16_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..c99950614f0a3ae1cde05dc8f2eaca58bd88fb33 --- /dev/null +++ b/mlp_map_test/M1_S0_R16_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d527e0f5a8ebe8eade25ca21bffe32de596cd4dcfc1590f83bc055941fb0f7a5 +size 153705080 diff --git a/mlp_map_test/M1_S0_R16_P6_config.json b/mlp_map_test/M1_S0_R16_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..faf37cc82a5ea1b34c031ddaea21bbebed2c5372 --- /dev/null +++ b/mlp_map_test/M1_S0_R16_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S0_R16_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M1_S0_R8_P4.pt b/mlp_map_test/M1_S0_R8_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..576cf65a8ec1f888aec38ba9f750dec212b3e949 --- /dev/null +++ b/mlp_map_test/M1_S0_R8_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f486ef96050d40004d8535da021ffb855d737b5d07aefd0bda9c3f494f141eb +size 153705072 diff --git a/mlp_map_test/M1_S0_R8_P4_config.json b/mlp_map_test/M1_S0_R8_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..035db7f8657cef12bc6f7c8ff7fdd25b91808a8c --- /dev/null +++ b/mlp_map_test/M1_S0_R8_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 1, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M1_S0_R8_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-10_R16_P4.pt b/mlp_map_test/M2_S-10_R16_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..5474f806a3ad7f4104311afb5b68ebbe69ada37f --- /dev/null +++ b/mlp_map_test/M2_S-10_R16_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f93e02198087cc08a2882fb6cfb61470db2632c3b021296917465ff6601f9222 +size 153705096 diff --git a/mlp_map_test/M2_S-10_R16_P4_config.json b/mlp_map_test/M2_S-10_R16_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..eb6c36a9bd7bc59f4fb58ff0256e30625f02321c --- /dev/null +++ b/mlp_map_test/M2_S-10_R16_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-10_R16_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-10_R2_P1.pt b/mlp_map_test/M2_S-10_R2_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..35fe0cb3c6f4c08295cf0d9e346668c892a46390 --- /dev/null +++ b/mlp_map_test/M2_S-10_R2_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:813fe23ef03cec96f66df676cf81c5daabada604b0e49fca9b25105305d38279 +size 153705088 diff --git a/mlp_map_test/M2_S-10_R2_P1_config.json b/mlp_map_test/M2_S-10_R2_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e09efb3eee5958a805c1074ba420ef2d359f63c4 --- /dev/null +++ b/mlp_map_test/M2_S-10_R2_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-10_R2_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-10_R2_P3.pt b/mlp_map_test/M2_S-10_R2_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..d49ad3855779a9c55a2bb7aeb2a59d52d99d94d1 --- /dev/null +++ b/mlp_map_test/M2_S-10_R2_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bec827207f145cf7eaf88ee658ec07da1c3360430537de352a0999812f37c62 +size 153705088 diff --git a/mlp_map_test/M2_S-10_R2_P3_config.json b/mlp_map_test/M2_S-10_R2_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..882473873247f3a233eb884078027fc862392fe6 --- /dev/null +++ b/mlp_map_test/M2_S-10_R2_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-10_R2_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-10_R2_P4.pt b/mlp_map_test/M2_S-10_R2_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf0fed46b2b931c42a6acb299755c510e831a4a2 --- /dev/null +++ b/mlp_map_test/M2_S-10_R2_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f704f3bd477b8ec2d325d15a27dab10c93c2dbb528d15b3fa72790c37c2fbfd +size 153705088 diff --git a/mlp_map_test/M2_S-10_R2_P4_config.json b/mlp_map_test/M2_S-10_R2_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..542b405791f2bd5e51d5d28b2800957ac530f232 --- /dev/null +++ b/mlp_map_test/M2_S-10_R2_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-10_R2_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-10_R2_P5.pt b/mlp_map_test/M2_S-10_R2_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..def7aa59e015ea4c51161e69910600b399a1b5d4 --- /dev/null +++ b/mlp_map_test/M2_S-10_R2_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f73ea4fd5faa0e74c678db16bd9dbb8f880a17eb82a615f454e34c8a80f2218 +size 153705088 diff --git a/mlp_map_test/M2_S-10_R2_P5_config.json b/mlp_map_test/M2_S-10_R2_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..cb04739b2453e3de87aa66f29206698edd102960 --- /dev/null +++ b/mlp_map_test/M2_S-10_R2_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-10_R2_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-10_R2_P6.pt b/mlp_map_test/M2_S-10_R2_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdfbe0e391d0104c77f3efff3fedcd6584ae29e8 --- /dev/null +++ b/mlp_map_test/M2_S-10_R2_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2adc119670ed23c0df956fa26c89d120b41a37f2bee4c41f494e1b92507385be +size 153705088 diff --git a/mlp_map_test/M2_S-10_R2_P6_config.json b/mlp_map_test/M2_S-10_R2_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1bb6248cef0e9ce7570e97f6f51588b91e1353e6 --- /dev/null +++ b/mlp_map_test/M2_S-10_R2_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-10_R2_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-10_R4_P2.pt b/mlp_map_test/M2_S-10_R4_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9171935b0e3e57c9564ddfcb6faf1b7eb1719b9 --- /dev/null +++ b/mlp_map_test/M2_S-10_R4_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd238a88deee7cf4e0e3197d721d1a72d9dfb052d40b4ecf024e8eae7445d60d +size 153705088 diff --git a/mlp_map_test/M2_S-10_R4_P2_config.json b/mlp_map_test/M2_S-10_R4_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9517826a5d3e60095df275f8385944b8aeeb95ba --- /dev/null +++ b/mlp_map_test/M2_S-10_R4_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-10_R4_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-10_R8_P3.pt b/mlp_map_test/M2_S-10_R8_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..9552d3058b7a05de5ef8e00a9d8093aff7199bd4 --- /dev/null +++ b/mlp_map_test/M2_S-10_R8_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aa011e72be05bcec009a680d4f7cae6387b12529b1661de624ab319d09ed2b9 +size 153705088 diff --git a/mlp_map_test/M2_S-10_R8_P3_config.json b/mlp_map_test/M2_S-10_R8_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..ec14a316e01c7f5fe9cabd3bbb62bc6447a0e1aa --- /dev/null +++ b/mlp_map_test/M2_S-10_R8_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -10, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-10_R8_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-2_R16_P3.pt b/mlp_map_test/M2_S-2_R16_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..73034bbff2d6b575216b2647b71ce6fd22113f79 --- /dev/null +++ b/mlp_map_test/M2_S-2_R16_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:127a902811c5fbf634a331cf805daa7bc3a8ac8570fcdcf198fed481daa3772d +size 153705088 diff --git a/mlp_map_test/M2_S-2_R16_P3_config.json b/mlp_map_test/M2_S-2_R16_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..20226ffc6862c2f62a9b7d1eea2798d6fd4ce86d --- /dev/null +++ b/mlp_map_test/M2_S-2_R16_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-2_R16_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-2_R16_P6.pt b/mlp_map_test/M2_S-2_R16_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed685e8f823a70f1ecbf84b6d4aa1692e48fd0b6 --- /dev/null +++ b/mlp_map_test/M2_S-2_R16_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8e425eb6796232e8650637548027aeb365b5ae5face33579d830cdd833426b5 +size 153705088 diff --git a/mlp_map_test/M2_S-2_R16_P6_config.json b/mlp_map_test/M2_S-2_R16_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9e4b7173f35101a5745a677042415b17b0374165 --- /dev/null +++ b/mlp_map_test/M2_S-2_R16_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-2_R16_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-2_R2_P1.pt b/mlp_map_test/M2_S-2_R2_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec7f8531ce24abed993e6011f52426ee05703854 --- /dev/null +++ b/mlp_map_test/M2_S-2_R2_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1b3fad29834cdd97d9da998017d0c8bb3c1152e19953de21cda2d085032c1df +size 153705080 diff --git a/mlp_map_test/M2_S-2_R2_P1_config.json b/mlp_map_test/M2_S-2_R2_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0876cfad8caf96b7ba8cee58b9e01cefc244cb47 --- /dev/null +++ b/mlp_map_test/M2_S-2_R2_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-2_R2_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-2_R2_P3.pt b/mlp_map_test/M2_S-2_R2_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..84ac900c42fa2df5c7874be1734b0a2a82ff98cc --- /dev/null +++ b/mlp_map_test/M2_S-2_R2_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c944ea4b9e33195f97c02b2aa6d2a6a46d0810011c30a556867ab7d2e1740b0 +size 153705080 diff --git a/mlp_map_test/M2_S-2_R2_P3_config.json b/mlp_map_test/M2_S-2_R2_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..ce04ce84c1b36f00c823ce41cbaf7ad9860883bb --- /dev/null +++ b/mlp_map_test/M2_S-2_R2_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-2_R2_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-2_R2_P4.pt b/mlp_map_test/M2_S-2_R2_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..c16d96cd0c69ceec2e39584538041220f650e294 --- /dev/null +++ b/mlp_map_test/M2_S-2_R2_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:368d1c35b999fced34a3ba276e27857bb217b59add0e1a600f50a917f9384a71 +size 153705080 diff --git a/mlp_map_test/M2_S-2_R2_P4_config.json b/mlp_map_test/M2_S-2_R2_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..d44958bfe3c846501207b79d628fd1406c50cb1e --- /dev/null +++ b/mlp_map_test/M2_S-2_R2_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-2_R2_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-2_R4_P2.pt b/mlp_map_test/M2_S-2_R4_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe18b9c04b1b15ffcf3089ce56dcceed2db5b02e --- /dev/null +++ b/mlp_map_test/M2_S-2_R4_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0756badeededbf44c590485a23e9fabe8d5fb4d2bf22c84a8ed4bc5832fed342 +size 153705080 diff --git a/mlp_map_test/M2_S-2_R4_P2_config.json b/mlp_map_test/M2_S-2_R4_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..ef391a13226a9f0a23e1c45d69b9aa72c0dc3285 --- /dev/null +++ b/mlp_map_test/M2_S-2_R4_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-2_R4_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-2_R4_P3.pt b/mlp_map_test/M2_S-2_R4_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..621b0830126ff231aa6945cf8f2dcf02e10d5e53 --- /dev/null +++ b/mlp_map_test/M2_S-2_R4_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f0284540ca481b55b44d56c866e94cafc07945e93ce57ea72bea746588f500f +size 153705080 diff --git a/mlp_map_test/M2_S-2_R4_P3_config.json b/mlp_map_test/M2_S-2_R4_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..ca48484c1fdecc2a93513bb13c968f7ffe62b598 --- /dev/null +++ b/mlp_map_test/M2_S-2_R4_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-2_R4_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-2_R8_P1.pt b/mlp_map_test/M2_S-2_R8_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..551de06b6c5b2b3603eef20636ca0ae246105df1 --- /dev/null +++ b/mlp_map_test/M2_S-2_R8_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74816a6972e7f2e6fff0edee6b4fe9cb467a683942c71aee04aad53dea2c3c5f +size 153705080 diff --git a/mlp_map_test/M2_S-2_R8_P1_config.json b/mlp_map_test/M2_S-2_R8_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..64bb856d21406374563d42a57ac86b110f9c8c97 --- /dev/null +++ b/mlp_map_test/M2_S-2_R8_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-2_R8_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-2_R8_P2.pt b/mlp_map_test/M2_S-2_R8_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbd82217e05a771d74a33773d7d5be0ee71e8957 --- /dev/null +++ b/mlp_map_test/M2_S-2_R8_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ff873e9272fdd8b1d550615e650b907e5b77b8ffe3d4e0d6e511088ad633722 +size 153705080 diff --git a/mlp_map_test/M2_S-2_R8_P2_config.json b/mlp_map_test/M2_S-2_R8_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9c48591de55657997ccf532016ab4bb2b813307a --- /dev/null +++ b/mlp_map_test/M2_S-2_R8_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-2_R8_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-2_R8_P6.pt b/mlp_map_test/M2_S-2_R8_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e6531bf0f1049189981312231a9922e672e223e --- /dev/null +++ b/mlp_map_test/M2_S-2_R8_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1fd5c6219dbe880daccd7adc39adfdcf2b33b4aa1f1aa14e125d9d4f26be4bc +size 153705080 diff --git a/mlp_map_test/M2_S-2_R8_P6_config.json b/mlp_map_test/M2_S-2_R8_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1a7871bacb1119c4fe1027052f095de515194df0 --- /dev/null +++ b/mlp_map_test/M2_S-2_R8_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -2, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-2_R8_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-4_R16_P3.pt b/mlp_map_test/M2_S-4_R16_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb6f0cd475861c1ccb8d5efdac882abc4f2b47b7 --- /dev/null +++ b/mlp_map_test/M2_S-4_R16_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2a59652e2977c8a77c6e7a54280363bc6f45bedbd6a648f91ff0d070375c4b2 +size 153705088 diff --git a/mlp_map_test/M2_S-4_R16_P3_config.json b/mlp_map_test/M2_S-4_R16_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0a0c10f4f130eaaff685759fc74d961a0cfd124a --- /dev/null +++ b/mlp_map_test/M2_S-4_R16_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-4_R16_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-4_R16_P5.pt b/mlp_map_test/M2_S-4_R16_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..967e9d205c80a221c454b0283affd59593bfe947 --- /dev/null +++ b/mlp_map_test/M2_S-4_R16_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:475f100e116008dc87b83bc0aa60117d48a0ed771b5e0668d47d452862ae0cc5 +size 153705088 diff --git a/mlp_map_test/M2_S-4_R16_P5_config.json b/mlp_map_test/M2_S-4_R16_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e1d00553393b5c3d14a33299f1ade8a0c87b6650 --- /dev/null +++ b/mlp_map_test/M2_S-4_R16_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-4_R16_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-4_R16_P6.pt b/mlp_map_test/M2_S-4_R16_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..af4237f518303b26426705c614264a9967629508 --- /dev/null +++ b/mlp_map_test/M2_S-4_R16_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69894fa46999a05bb68c9249c8e59c6418c3a9d7544fa8d1a16a7a96d54bf8e0 +size 153705088 diff --git a/mlp_map_test/M2_S-4_R16_P6_config.json b/mlp_map_test/M2_S-4_R16_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..4c5651389dd5324ce4e6a3f4e5a7f6c34c63295e --- /dev/null +++ b/mlp_map_test/M2_S-4_R16_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-4_R16_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-4_R2_P1.pt b/mlp_map_test/M2_S-4_R2_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..a970dc1ec5ac845886264f0717df33e8b78eff52 --- /dev/null +++ b/mlp_map_test/M2_S-4_R2_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:537650fd0904d6e495a3519c9ffb464ee7d48d4eb189e4245bef4d15fdaa81bc +size 153705080 diff --git a/mlp_map_test/M2_S-4_R2_P1_config.json b/mlp_map_test/M2_S-4_R2_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0749ba3bf4f132544acbf17f7edf4d6aafc91ca8 --- /dev/null +++ b/mlp_map_test/M2_S-4_R2_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-4_R2_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-4_R2_P5.pt b/mlp_map_test/M2_S-4_R2_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..20b7817db32aedf34a8b60583e8077463f16d2e5 --- /dev/null +++ b/mlp_map_test/M2_S-4_R2_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f85aeceaad2142fe21780942d09de052ea9dedb5c921e45bb27f517bc85401a +size 153705080 diff --git a/mlp_map_test/M2_S-4_R2_P5_config.json b/mlp_map_test/M2_S-4_R2_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c0eddd98bfefc920c6ea8059461beaece8a593c3 --- /dev/null +++ b/mlp_map_test/M2_S-4_R2_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-4_R2_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-4_R2_P6.pt b/mlp_map_test/M2_S-4_R2_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9724602a9d2ad5c401d3d7190f96cfdb3b238d3 --- /dev/null +++ b/mlp_map_test/M2_S-4_R2_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06a171d17bebd413152c983f853b70126decaf9a2a7f3db9d01b597af1d46a87 +size 153705080 diff --git a/mlp_map_test/M2_S-4_R2_P6_config.json b/mlp_map_test/M2_S-4_R2_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..02e19fb447be2bc1cf8b0971fb5b7be4e6bba381 --- /dev/null +++ b/mlp_map_test/M2_S-4_R2_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-4_R2_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-4_R4_P2.pt b/mlp_map_test/M2_S-4_R4_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..7590bde97c0e01a833a765235804e61d49a80e34 --- /dev/null +++ b/mlp_map_test/M2_S-4_R4_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7be53630991d1b92811106b6c77e5efc0d3c8851d9949959231535501b59e4e4 +size 153705080 diff --git a/mlp_map_test/M2_S-4_R4_P2_config.json b/mlp_map_test/M2_S-4_R4_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..885457a4326c465f16752942992579072da2b586 --- /dev/null +++ b/mlp_map_test/M2_S-4_R4_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-4_R4_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-4_R4_P4.pt b/mlp_map_test/M2_S-4_R4_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c661e60ca8e3a660b29c86b85c7e3b757a9a583 --- /dev/null +++ b/mlp_map_test/M2_S-4_R4_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96d89fb9f849dbcf2d5f0a6cddcbcf7489af423b50f380a9a110739348f51659 +size 153705080 diff --git a/mlp_map_test/M2_S-4_R4_P4_config.json b/mlp_map_test/M2_S-4_R4_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebc3739a950ea4480f3f9ae31dbfa3143372ddf --- /dev/null +++ b/mlp_map_test/M2_S-4_R4_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-4_R4_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-4_R8_P2.pt b/mlp_map_test/M2_S-4_R8_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..06c647388307eb22fa06c47cc61f6e33fb34d647 --- /dev/null +++ b/mlp_map_test/M2_S-4_R8_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:893a968d37deb20a6075847c70d135a49bcaafef0bb47298c0cc2fe2337ff805 +size 153705080 diff --git a/mlp_map_test/M2_S-4_R8_P2_config.json b/mlp_map_test/M2_S-4_R8_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..3d65d3adc9ad63aab184461a9453f60a7847f3a4 --- /dev/null +++ b/mlp_map_test/M2_S-4_R8_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-4_R8_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-4_R8_P4.pt b/mlp_map_test/M2_S-4_R8_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..20eb4fdf6807f4b674f459bc613781cf42a7c70c --- /dev/null +++ b/mlp_map_test/M2_S-4_R8_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd2b4d265f6c097fe14032beaa5762aadd1a8f7b74d0f06392aecf520a97ae77 +size 153705080 diff --git a/mlp_map_test/M2_S-4_R8_P4_config.json b/mlp_map_test/M2_S-4_R8_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..bc457493b4dedb0d2d39abdb7ffe09057ecd8c4b --- /dev/null +++ b/mlp_map_test/M2_S-4_R8_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -4, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-4_R8_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-6_R1_P0.pt b/mlp_map_test/M2_S-6_R1_P0.pt new file mode 100644 index 0000000000000000000000000000000000000000..36ea63252682486a7b88218ae7c6d6e3acf00755 --- /dev/null +++ b/mlp_map_test/M2_S-6_R1_P0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b5e9c0f401f0324adcbad1f4a66565249f44fc641ae02d1b4f38c28509a8cc8 +size 153705080 diff --git a/mlp_map_test/M2_S-6_R1_P0_config.json b/mlp_map_test/M2_S-6_R1_P0_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e3b605b48e8310f52c3afe07500d10a373580585 --- /dev/null +++ b/mlp_map_test/M2_S-6_R1_P0_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 1, + "l1_p": 0, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-6_R1_P0" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-6_R2_P1.pt b/mlp_map_test/M2_S-6_R2_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..865c984cd4af9c2127b38c0de6bea4adc1f30ca5 --- /dev/null +++ b/mlp_map_test/M2_S-6_R2_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baacda98041fd6ec189eafac47e42efb5aeb9f0ab40c167672c4512d6fd761f1 +size 153705080 diff --git a/mlp_map_test/M2_S-6_R2_P1_config.json b/mlp_map_test/M2_S-6_R2_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..67dda843ca7efda5e3bc62d4b192a5c14b66b420 --- /dev/null +++ b/mlp_map_test/M2_S-6_R2_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-6_R2_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-6_R2_P3.pt b/mlp_map_test/M2_S-6_R2_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e6faa0f298d0ca913f8d773cc52ed07bcc6ec85 --- /dev/null +++ b/mlp_map_test/M2_S-6_R2_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfcc64d01348b5cd712f5c798e91ffe8057b960d05cbffa1f485acb97a231d35 +size 153705080 diff --git a/mlp_map_test/M2_S-6_R2_P3_config.json b/mlp_map_test/M2_S-6_R2_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..342d60a00e8b0b171d604fce67f398fa65a59ef7 --- /dev/null +++ b/mlp_map_test/M2_S-6_R2_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-6_R2_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-6_R2_P5.pt b/mlp_map_test/M2_S-6_R2_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..09b1ff84d996af3f5fc2f137ae219cf27b072b5a --- /dev/null +++ b/mlp_map_test/M2_S-6_R2_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3b0db703e0fc41d6420dd184b7744f96c8b416dc3212228352917c2c7d1b710 +size 153705080 diff --git a/mlp_map_test/M2_S-6_R2_P5_config.json b/mlp_map_test/M2_S-6_R2_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..450447e0f37b0598d11c7ba3d6e3fd56abd94ae1 --- /dev/null +++ b/mlp_map_test/M2_S-6_R2_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-6_R2_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-6_R4_P2.pt b/mlp_map_test/M2_S-6_R4_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..d68a601c0e5f18db014977d4618126c7a2184f63 --- /dev/null +++ b/mlp_map_test/M2_S-6_R4_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d3b79e87d0615683e7f128cfcc6c5fc198517eebd41f183b3db5f27e4f09601 +size 153705080 diff --git a/mlp_map_test/M2_S-6_R4_P2_config.json b/mlp_map_test/M2_S-6_R4_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..29295bde52b13602978997501fe85d2555167794 --- /dev/null +++ b/mlp_map_test/M2_S-6_R4_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-6_R4_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-6_R4_P4.pt b/mlp_map_test/M2_S-6_R4_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5993bf701992c340e784991c4ed818de32826b9 --- /dev/null +++ b/mlp_map_test/M2_S-6_R4_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cf134fc6123d3f71e5e16fad64b5501fde53fa1f7ef54b1d69149e34e6ec00b +size 153705080 diff --git a/mlp_map_test/M2_S-6_R4_P4_config.json b/mlp_map_test/M2_S-6_R4_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..18da40c8b6bb6a3a4408a23869a4c3deb1f440d4 --- /dev/null +++ b/mlp_map_test/M2_S-6_R4_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-6_R4_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-6_R8_P2.pt b/mlp_map_test/M2_S-6_R8_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b3aa964b710a39312a13a1424165ebb02c64a04 --- /dev/null +++ b/mlp_map_test/M2_S-6_R8_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1203d22e1981a9e3723df4570764f8a332fa0492294a0bb5ce03b1e0176bc9bd +size 153705080 diff --git a/mlp_map_test/M2_S-6_R8_P2_config.json b/mlp_map_test/M2_S-6_R8_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..3fe51b4bf507408eace5c7dd6ff7d7f231b38df6 --- /dev/null +++ b/mlp_map_test/M2_S-6_R8_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-6_R8_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-6_R8_P5.pt b/mlp_map_test/M2_S-6_R8_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b336b8d8af371cd5e53c1c49380e8319a3d5faf --- /dev/null +++ b/mlp_map_test/M2_S-6_R8_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e994f05fce8a222d5268a8167fa8dd37b927d3de2528ccb84f65a8d862779fbb +size 153705080 diff --git a/mlp_map_test/M2_S-6_R8_P5_config.json b/mlp_map_test/M2_S-6_R8_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9d28b28422510e978ad5c57f28af9251beb0a97d --- /dev/null +++ b/mlp_map_test/M2_S-6_R8_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-6_R8_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-6_R8_P6.pt b/mlp_map_test/M2_S-6_R8_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e691a8fad79bb791cd73634592668dafc77b78c --- /dev/null +++ b/mlp_map_test/M2_S-6_R8_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3230c9a42fc7bad4e854cbebb3531e1f3028342a7ec8a6d5666a2113bb5d596 +size 153705080 diff --git a/mlp_map_test/M2_S-6_R8_P6_config.json b/mlp_map_test/M2_S-6_R8_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..4cba043e63922bebc8bb8db2fb84fe7e011729c7 --- /dev/null +++ b/mlp_map_test/M2_S-6_R8_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -6, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-6_R8_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-8_R16_P3.pt b/mlp_map_test/M2_S-8_R16_P3.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3c1f25f6ca873b746833e02a199a06b6ea0036a --- /dev/null +++ b/mlp_map_test/M2_S-8_R16_P3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17da558c377f990d5f1d8c3f560fad426ac22587f6358fb6723b362071af3c48 +size 153705088 diff --git a/mlp_map_test/M2_S-8_R16_P3_config.json b/mlp_map_test/M2_S-8_R16_P3_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a9059246014b340daf462b3a9a4992f27b5ad07f --- /dev/null +++ b/mlp_map_test/M2_S-8_R16_P3_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 3, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-8_R16_P3" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-8_R16_P4.pt b/mlp_map_test/M2_S-8_R16_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c4e827f9db333f83812d6d9e318d1190dc71802 --- /dev/null +++ b/mlp_map_test/M2_S-8_R16_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c243b8297d8e7c2a389bf3c95f93897f24eb4d24ff7a27cac6823f5e11043cb6 +size 153705088 diff --git a/mlp_map_test/M2_S-8_R16_P4_config.json b/mlp_map_test/M2_S-8_R16_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c3ae2f9dffb768e3b2903736d3716e214b68af79 --- /dev/null +++ b/mlp_map_test/M2_S-8_R16_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 16, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-8_R16_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-8_R2_P4.pt b/mlp_map_test/M2_S-8_R2_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4457a24ee9c3feaa893dd6021ee08ac29b8447f --- /dev/null +++ b/mlp_map_test/M2_S-8_R2_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b7508a35c6205f23bf2e3ae9dda612c49605239dedbaf3a0c86d2707c250a02 +size 153705080 diff --git a/mlp_map_test/M2_S-8_R2_P4_config.json b/mlp_map_test/M2_S-8_R2_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..13724189b39a3bdc636b85c0fc7cc7994c634b02 --- /dev/null +++ b/mlp_map_test/M2_S-8_R2_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-8_R2_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-8_R2_P5.pt b/mlp_map_test/M2_S-8_R2_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cefd1c64607ae564a7dca745c56f53f92e86957 --- /dev/null +++ b/mlp_map_test/M2_S-8_R2_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf1e43f9c368ae6447ba45f2ea73266855e31a937516dc8a51549c2b27d0d1cf +size 153705080 diff --git a/mlp_map_test/M2_S-8_R2_P5_config.json b/mlp_map_test/M2_S-8_R2_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..7c376677b88f6047e0fea9ee1e55d892344c7c53 --- /dev/null +++ b/mlp_map_test/M2_S-8_R2_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 2, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-8_R2_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-8_R4_P4.pt b/mlp_map_test/M2_S-8_R4_P4.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2855b41ec45a1f9018ed0e9e8036f4d8f622fd6 --- /dev/null +++ b/mlp_map_test/M2_S-8_R4_P4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea3d0989f096791b78e960b1a665dc28b54fff3153f12eadef2018a562d4ead9 +size 153705080 diff --git a/mlp_map_test/M2_S-8_R4_P4_config.json b/mlp_map_test/M2_S-8_R4_P4_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e8a0fc4126409a482155ee10b82cdcb186df7649 --- /dev/null +++ b/mlp_map_test/M2_S-8_R4_P4_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 4, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-8_R4_P4" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-8_R8_P1.pt b/mlp_map_test/M2_S-8_R8_P1.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f15ccac61a92b738014f7923a3437d670500e47 --- /dev/null +++ b/mlp_map_test/M2_S-8_R8_P1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:921a3b5ffdda101166fae0d0aecfadbc4bca2014722f681f1c427c48d5300748 +size 153705080 diff --git a/mlp_map_test/M2_S-8_R8_P1_config.json b/mlp_map_test/M2_S-8_R8_P1_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0b19b21e5918947525113639707dca0110dce1b3 --- /dev/null +++ b/mlp_map_test/M2_S-8_R8_P1_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 1, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-8_R8_P1" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-8_R8_P2.pt b/mlp_map_test/M2_S-8_R8_P2.pt new file mode 100644 index 0000000000000000000000000000000000000000..49d569f8def7acbfdba377c47966cc16a8d125e1 --- /dev/null +++ b/mlp_map_test/M2_S-8_R8_P2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85fc9819ee85ed4b7febdb119c879fc7f6f800a9b03758c91acfdd9ac80ee15e +size 153705080 diff --git a/mlp_map_test/M2_S-8_R8_P2_config.json b/mlp_map_test/M2_S-8_R8_P2_config.json new file mode 100644 index 0000000000000000000000000000000000000000..579523444b4f188b5885927f2499d9e661259b41 --- /dev/null +++ b/mlp_map_test/M2_S-8_R8_P2_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 2, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-8_R8_P2" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S-8_R8_P6.pt b/mlp_map_test/M2_S-8_R8_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..126acc489bf53bb6ab75ae3e37426fe0eb6863ce --- /dev/null +++ b/mlp_map_test/M2_S-8_R8_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c5831d12d6562e466eec0833757acdcd075fa569144f9369c83c605e8a1a28 +size 153705080 diff --git a/mlp_map_test/M2_S-8_R8_P6_config.json b/mlp_map_test/M2_S-8_R8_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..81df8f4cf0c80cb39e7b2be503d1be134edbc414 --- /dev/null +++ b/mlp_map_test/M2_S-8_R8_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": -8, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S-8_R8_P6" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S0_R4_P5.pt b/mlp_map_test/M2_S0_R4_P5.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4f9f7a37518a3a959b1d65dc84f4e331e29f9d4 --- /dev/null +++ b/mlp_map_test/M2_S0_R4_P5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b745de80b05deef1fedc4992116e29765a5c38deb8abbbfcf765fb51b705f1b7 +size 153705072 diff --git a/mlp_map_test/M2_S0_R4_P5_config.json b/mlp_map_test/M2_S0_R4_P5_config.json new file mode 100644 index 0000000000000000000000000000000000000000..b947e6e825018dbfc8355292036908b0d396501a --- /dev/null +++ b/mlp_map_test/M2_S0_R4_P5_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 4, + "l1_p": 5, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S0_R4_P5" +} \ No newline at end of file diff --git a/mlp_map_test/M2_S0_R8_P6.pt b/mlp_map_test/M2_S0_R8_P6.pt new file mode 100644 index 0000000000000000000000000000000000000000..0051d8a35d9683140b04d7ea78701a7041e308b8 --- /dev/null +++ b/mlp_map_test/M2_S0_R8_P6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b55b3f0c84de1053df217b0ff8cec7fe5cbeba66c94f51e7de007a7a5819d9d +size 153705072 diff --git a/mlp_map_test/M2_S0_R8_P6_config.json b/mlp_map_test/M2_S0_R8_P6_config.json new file mode 100644 index 0000000000000000000000000000000000000000..b4643d1452ddfbbe3fcb5e2784d2d4f3949f8b0c --- /dev/null +++ b/mlp_map_test/M2_S0_R8_P6_config.json @@ -0,0 +1,38 @@ +{ + "n_features": 25000, + "d_model": 768, + "lr_exp": -10, + "disable_comet": false, + "per_neuron_reinit_interval": 0, + "reservoir_time_discount": 0.995, + "reinit_interval": 800, + "max_reinit_neurons": 5000, + "reservoir_size": 5000, + "n_piles": 292, + "log_interval": 200, + "reinit_input_norm": "target_scaled", + "reinit_input": "x", + "reinit_norm_alpha": 0.3, + "data_loc": "mlp_data", + "reinit_threshold": -6, + "scheduler": "wsd", + "layer_idx": 2, + "l1_exp": 0, + "neuron_reinit_percent": 0.85, + "beta1": 1, + "beta2": 4, + "reinit_target": "y", + "sparse_adam": false, + "run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}", + "project_name": "mlp_map_test", + "decoder_bias": true, + "l1_beta": 0.99, + "alt_sparsity_loss": "log", + "l1_ratio": 8, + "l1_p": 6, + "optimizer": "sparse_adam", + "model_type": "mlp_map", + "adam_beta1": 0.5, + "adam_beta2": 0.9375, + "run_name": "M2_S0_R8_P6" +} \ No newline at end of file