noanabeshima
committed on
Commit
•
d8df745
1
Parent(s):
84e485d
Upload folder using huggingface_hub
Browse files
- mlp_map_test/M0_S-3_R1_P0.pt +3 -0
- mlp_map_test/M0_S-3_R1_P0_config.json +38 -0
- mlp_map_test/M0_S-6_R1_P0.pt +3 -0
- mlp_map_test/M0_S-6_R1_P0_config.json +38 -0
- mlp_map_test/M0_S-8_R1_P0.pt +3 -0
- mlp_map_test/M0_S-8_R1_P0_config.json +38 -0
- mlp_map_test/M0_S0_R1_P0.pt +3 -0
- mlp_map_test/M0_S0_R1_P0_config.json +38 -0
- mlp_map_test/M1_S-3_R1_P0.pt +3 -0
- mlp_map_test/M1_S-3_R1_P0_config.json +38 -0
- mlp_map_test/M1_S-4_R1_P0.pt +3 -0
- mlp_map_test/M1_S-4_R1_P0_config.json +38 -0
- mlp_map_test/M1_S0_R1_P0.pt +3 -0
- mlp_map_test/M1_S0_R1_P0_config.json +38 -0
- mlp_map_test/M2_S-3_R1_P0.pt +3 -0
- mlp_map_test/M2_S-3_R1_P0_config.json +38 -0
- mlp_map_test/M2_S-4_R1_P0.pt +3 -0
- mlp_map_test/M2_S-4_R1_P0_config.json +38 -0
- mlp_map_test/M2_S0_R1_P0.pt +3 -0
- mlp_map_test/M2_S0_R1_P0_config.json +38 -0
- mlp_map_test/M3_S-2_R1_P0.pt +3 -0
- mlp_map_test/M3_S-2_R1_P0_config.json +38 -0
- mlp_map_test/M3_S-3_R1_P0.pt +3 -0
- mlp_map_test/M3_S-3_R1_P0_config.json +38 -0
- mlp_map_test/M3_S-4_R1_P0.pt +3 -0
- mlp_map_test/M3_S-4_R1_P0_config.json +38 -0
- mlp_map_test/M3_S0_R1_P0.pt +3 -0
- mlp_map_test/M3_S0_R1_P0_config.json +38 -0
mlp_map_test/M0_S-3_R1_P0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ce271c4f08bc5a13f5b884f42bc19e1f1a505ed2e9543fde6c5149bfa92d7f1
|
3 |
+
size 153705080
|
mlp_map_test/M0_S-3_R1_P0_config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"n_features": 25000,
|
3 |
+
"d_model": 768,
|
4 |
+
"lr_exp": -10,
|
5 |
+
"disable_comet": false,
|
6 |
+
"per_neuron_reinit_interval": 0,
|
7 |
+
"reservoir_time_discount": 0.995,
|
8 |
+
"reinit_interval": 800,
|
9 |
+
"max_reinit_neurons": 5000,
|
10 |
+
"reservoir_size": 5000,
|
11 |
+
"n_piles": 292,
|
12 |
+
"log_interval": 200,
|
13 |
+
"reinit_input_norm": "target_scaled",
|
14 |
+
"reinit_input": "x",
|
15 |
+
"reinit_norm_alpha": 0.3,
|
16 |
+
"data_loc": "mlp_data",
|
17 |
+
"reinit_threshold": -6,
|
18 |
+
"scheduler": "wsd",
|
19 |
+
"layer_idx": 0,
|
20 |
+
"l1_exp": -3,
|
21 |
+
"neuron_reinit_percent": 0.85,
|
22 |
+
"beta1": 1,
|
23 |
+
"beta2": 4,
|
24 |
+
"reinit_target": "y",
|
25 |
+
"sparse_adam": false,
|
26 |
+
"run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}",
|
27 |
+
"project_name": "mlp_map_test",
|
28 |
+
"decoder_bias": true,
|
29 |
+
"l1_beta": 0.99,
|
30 |
+
"alt_sparsity_loss": "log",
|
31 |
+
"l1_ratio": 1,
|
32 |
+
"l1_p": 0,
|
33 |
+
"optimizer": "sparse_adam",
|
34 |
+
"model_type": "mlp_map",
|
35 |
+
"adam_beta1": 0.5,
|
36 |
+
"adam_beta2": 0.9375,
|
37 |
+
"run_name": "M0_S-3_R1_P0"
|
38 |
+
}
|
mlp_map_test/M0_S-6_R1_P0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5b9ec2032767721c3578d4837817c938dde6d534826e5e831fbd661d67c32be
|
3 |
+
size 153705080
|
mlp_map_test/M0_S-6_R1_P0_config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"n_features": 25000,
|
3 |
+
"d_model": 768,
|
4 |
+
"lr_exp": -10,
|
5 |
+
"disable_comet": false,
|
6 |
+
"per_neuron_reinit_interval": 0,
|
7 |
+
"reservoir_time_discount": 0.995,
|
8 |
+
"reinit_interval": 800,
|
9 |
+
"max_reinit_neurons": 5000,
|
10 |
+
"reservoir_size": 5000,
|
11 |
+
"n_piles": 292,
|
12 |
+
"log_interval": 200,
|
13 |
+
"reinit_input_norm": "target_scaled",
|
14 |
+
"reinit_input": "x",
|
15 |
+
"reinit_norm_alpha": 0.3,
|
16 |
+
"data_loc": "mlp_data",
|
17 |
+
"reinit_threshold": -6,
|
18 |
+
"scheduler": "wsd",
|
19 |
+
"layer_idx": 0,
|
20 |
+
"l1_exp": -6,
|
21 |
+
"neuron_reinit_percent": 0.85,
|
22 |
+
"beta1": 1,
|
23 |
+
"beta2": 4,
|
24 |
+
"reinit_target": "y",
|
25 |
+
"sparse_adam": false,
|
26 |
+
"run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}",
|
27 |
+
"project_name": "mlp_map_test",
|
28 |
+
"decoder_bias": true,
|
29 |
+
"l1_beta": 0.99,
|
30 |
+
"alt_sparsity_loss": "log",
|
31 |
+
"l1_ratio": 1,
|
32 |
+
"l1_p": 0,
|
33 |
+
"optimizer": "sparse_adam",
|
34 |
+
"model_type": "mlp_map",
|
35 |
+
"adam_beta1": 0.5,
|
36 |
+
"adam_beta2": 0.9375,
|
37 |
+
"run_name": "M0_S-6_R1_P0"
|
38 |
+
}
|
mlp_map_test/M0_S-8_R1_P0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a472e5d18de5d83e6e79eb0a5192f2890b68d1de9431608f2125cae83112a6e0
|
3 |
+
size 153705080
|
mlp_map_test/M0_S-8_R1_P0_config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"n_features": 25000,
|
3 |
+
"d_model": 768,
|
4 |
+
"lr_exp": -10,
|
5 |
+
"disable_comet": false,
|
6 |
+
"per_neuron_reinit_interval": 0,
|
7 |
+
"reservoir_time_discount": 0.995,
|
8 |
+
"reinit_interval": 800,
|
9 |
+
"max_reinit_neurons": 5000,
|
10 |
+
"reservoir_size": 5000,
|
11 |
+
"n_piles": 292,
|
12 |
+
"log_interval": 200,
|
13 |
+
"reinit_input_norm": "target_scaled",
|
14 |
+
"reinit_input": "x",
|
15 |
+
"reinit_norm_alpha": 0.3,
|
16 |
+
"data_loc": "mlp_data",
|
17 |
+
"reinit_threshold": -6,
|
18 |
+
"scheduler": "wsd",
|
19 |
+
"layer_idx": 0,
|
20 |
+
"l1_exp": -8,
|
21 |
+
"neuron_reinit_percent": 0.85,
|
22 |
+
"beta1": 1,
|
23 |
+
"beta2": 4,
|
24 |
+
"reinit_target": "y",
|
25 |
+
"sparse_adam": false,
|
26 |
+
"run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}",
|
27 |
+
"project_name": "mlp_map_test",
|
28 |
+
"decoder_bias": true,
|
29 |
+
"l1_beta": 0.99,
|
30 |
+
"alt_sparsity_loss": "log",
|
31 |
+
"l1_ratio": 1,
|
32 |
+
"l1_p": 0,
|
33 |
+
"optimizer": "sparse_adam",
|
34 |
+
"model_type": "mlp_map",
|
35 |
+
"adam_beta1": 0.5,
|
36 |
+
"adam_beta2": 0.9375,
|
37 |
+
"run_name": "M0_S-8_R1_P0"
|
38 |
+
}
|
mlp_map_test/M0_S0_R1_P0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c3a0fa92f2b71152399a3aa23cf225dda78fdbf9efe9dcdb3004d132814fd81
|
3 |
+
size 153705072
|
mlp_map_test/M0_S0_R1_P0_config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"n_features": 25000,
|
3 |
+
"d_model": 768,
|
4 |
+
"lr_exp": -10,
|
5 |
+
"disable_comet": false,
|
6 |
+
"per_neuron_reinit_interval": 0,
|
7 |
+
"reservoir_time_discount": 0.995,
|
8 |
+
"reinit_interval": 800,
|
9 |
+
"max_reinit_neurons": 5000,
|
10 |
+
"reservoir_size": 5000,
|
11 |
+
"n_piles": 292,
|
12 |
+
"log_interval": 200,
|
13 |
+
"reinit_input_norm": "target_scaled",
|
14 |
+
"reinit_input": "x",
|
15 |
+
"reinit_norm_alpha": 0.3,
|
16 |
+
"data_loc": "mlp_data",
|
17 |
+
"reinit_threshold": -6,
|
18 |
+
"scheduler": "wsd",
|
19 |
+
"layer_idx": 0,
|
20 |
+
"l1_exp": 0,
|
21 |
+
"neuron_reinit_percent": 0.85,
|
22 |
+
"beta1": 1,
|
23 |
+
"beta2": 4,
|
24 |
+
"reinit_target": "y",
|
25 |
+
"sparse_adam": false,
|
26 |
+
"run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}",
|
27 |
+
"project_name": "mlp_map_test",
|
28 |
+
"decoder_bias": true,
|
29 |
+
"l1_beta": 0.99,
|
30 |
+
"alt_sparsity_loss": "log",
|
31 |
+
"l1_ratio": 1,
|
32 |
+
"l1_p": 0,
|
33 |
+
"optimizer": "sparse_adam",
|
34 |
+
"model_type": "mlp_map",
|
35 |
+
"adam_beta1": 0.5,
|
36 |
+
"adam_beta2": 0.9375,
|
37 |
+
"run_name": "M0_S0_R1_P0"
|
38 |
+
}
|
mlp_map_test/M1_S-3_R1_P0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:352804e14b28245f2b3f3d41fe4e4e4f7b38d8cefdfbedee57953f9ddb152842
|
3 |
+
size 153705080
|
mlp_map_test/M1_S-3_R1_P0_config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"n_features": 25000,
|
3 |
+
"d_model": 768,
|
4 |
+
"lr_exp": -10,
|
5 |
+
"disable_comet": false,
|
6 |
+
"per_neuron_reinit_interval": 0,
|
7 |
+
"reservoir_time_discount": 0.995,
|
8 |
+
"reinit_interval": 800,
|
9 |
+
"max_reinit_neurons": 5000,
|
10 |
+
"reservoir_size": 5000,
|
11 |
+
"n_piles": 292,
|
12 |
+
"log_interval": 200,
|
13 |
+
"reinit_input_norm": "target_scaled",
|
14 |
+
"reinit_input": "x",
|
15 |
+
"reinit_norm_alpha": 0.3,
|
16 |
+
"data_loc": "mlp_data",
|
17 |
+
"reinit_threshold": -6,
|
18 |
+
"scheduler": "wsd",
|
19 |
+
"layer_idx": 1,
|
20 |
+
"l1_exp": -3,
|
21 |
+
"neuron_reinit_percent": 0.85,
|
22 |
+
"beta1": 1,
|
23 |
+
"beta2": 4,
|
24 |
+
"reinit_target": "y",
|
25 |
+
"sparse_adam": false,
|
26 |
+
"run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}",
|
27 |
+
"project_name": "mlp_map_test",
|
28 |
+
"decoder_bias": true,
|
29 |
+
"l1_beta": 0.99,
|
30 |
+
"alt_sparsity_loss": "log",
|
31 |
+
"l1_ratio": 1,
|
32 |
+
"l1_p": 0,
|
33 |
+
"optimizer": "sparse_adam",
|
34 |
+
"model_type": "mlp_map",
|
35 |
+
"adam_beta1": 0.5,
|
36 |
+
"adam_beta2": 0.9375,
|
37 |
+
"run_name": "M1_S-3_R1_P0"
|
38 |
+
}
|
mlp_map_test/M1_S-4_R1_P0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ac2bdf89dd757b88c0190668bd17a6f1d520722ad795ec3afc6a29d588e9f84
|
3 |
+
size 153705080
|
mlp_map_test/M1_S-4_R1_P0_config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"n_features": 25000,
|
3 |
+
"d_model": 768,
|
4 |
+
"lr_exp": -10,
|
5 |
+
"disable_comet": false,
|
6 |
+
"per_neuron_reinit_interval": 0,
|
7 |
+
"reservoir_time_discount": 0.995,
|
8 |
+
"reinit_interval": 800,
|
9 |
+
"max_reinit_neurons": 5000,
|
10 |
+
"reservoir_size": 5000,
|
11 |
+
"n_piles": 292,
|
12 |
+
"log_interval": 200,
|
13 |
+
"reinit_input_norm": "target_scaled",
|
14 |
+
"reinit_input": "x",
|
15 |
+
"reinit_norm_alpha": 0.3,
|
16 |
+
"data_loc": "mlp_data",
|
17 |
+
"reinit_threshold": -6,
|
18 |
+
"scheduler": "wsd",
|
19 |
+
"layer_idx": 1,
|
20 |
+
"l1_exp": -4,
|
21 |
+
"neuron_reinit_percent": 0.85,
|
22 |
+
"beta1": 1,
|
23 |
+
"beta2": 4,
|
24 |
+
"reinit_target": "y",
|
25 |
+
"sparse_adam": false,
|
26 |
+
"run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}",
|
27 |
+
"project_name": "mlp_map_test",
|
28 |
+
"decoder_bias": true,
|
29 |
+
"l1_beta": 0.99,
|
30 |
+
"alt_sparsity_loss": "log",
|
31 |
+
"l1_ratio": 1,
|
32 |
+
"l1_p": 0,
|
33 |
+
"optimizer": "sparse_adam",
|
34 |
+
"model_type": "mlp_map",
|
35 |
+
"adam_beta1": 0.5,
|
36 |
+
"adam_beta2": 0.9375,
|
37 |
+
"run_name": "M1_S-4_R1_P0"
|
38 |
+
}
|
mlp_map_test/M1_S0_R1_P0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3dca79fc4147c8a19647c99f6d2f9ef32cfa9d154f3ceb0d122150b97a26d7f8
|
3 |
+
size 153705072
|
mlp_map_test/M1_S0_R1_P0_config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"n_features": 25000,
|
3 |
+
"d_model": 768,
|
4 |
+
"lr_exp": -10,
|
5 |
+
"disable_comet": false,
|
6 |
+
"per_neuron_reinit_interval": 0,
|
7 |
+
"reservoir_time_discount": 0.995,
|
8 |
+
"reinit_interval": 800,
|
9 |
+
"max_reinit_neurons": 5000,
|
10 |
+
"reservoir_size": 5000,
|
11 |
+
"n_piles": 292,
|
12 |
+
"log_interval": 200,
|
13 |
+
"reinit_input_norm": "target_scaled",
|
14 |
+
"reinit_input": "x",
|
15 |
+
"reinit_norm_alpha": 0.3,
|
16 |
+
"data_loc": "mlp_data",
|
17 |
+
"reinit_threshold": -6,
|
18 |
+
"scheduler": "wsd",
|
19 |
+
"layer_idx": 1,
|
20 |
+
"l1_exp": 0,
|
21 |
+
"neuron_reinit_percent": 0.85,
|
22 |
+
"beta1": 1,
|
23 |
+
"beta2": 4,
|
24 |
+
"reinit_target": "y",
|
25 |
+
"sparse_adam": false,
|
26 |
+
"run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}",
|
27 |
+
"project_name": "mlp_map_test",
|
28 |
+
"decoder_bias": true,
|
29 |
+
"l1_beta": 0.99,
|
30 |
+
"alt_sparsity_loss": "log",
|
31 |
+
"l1_ratio": 1,
|
32 |
+
"l1_p": 0,
|
33 |
+
"optimizer": "sparse_adam",
|
34 |
+
"model_type": "mlp_map",
|
35 |
+
"adam_beta1": 0.5,
|
36 |
+
"adam_beta2": 0.9375,
|
37 |
+
"run_name": "M1_S0_R1_P0"
|
38 |
+
}
|
mlp_map_test/M2_S-3_R1_P0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5fc4603aa99d4fb7403cb3ebcb928f84be3fd9ea09e862f1bcdc7889ba83e2d7
|
3 |
+
size 153705080
|
mlp_map_test/M2_S-3_R1_P0_config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"n_features": 25000,
|
3 |
+
"d_model": 768,
|
4 |
+
"lr_exp": -10,
|
5 |
+
"disable_comet": false,
|
6 |
+
"per_neuron_reinit_interval": 0,
|
7 |
+
"reservoir_time_discount": 0.995,
|
8 |
+
"reinit_interval": 800,
|
9 |
+
"max_reinit_neurons": 5000,
|
10 |
+
"reservoir_size": 5000,
|
11 |
+
"n_piles": 292,
|
12 |
+
"log_interval": 200,
|
13 |
+
"reinit_input_norm": "target_scaled",
|
14 |
+
"reinit_input": "x",
|
15 |
+
"reinit_norm_alpha": 0.3,
|
16 |
+
"data_loc": "mlp_data",
|
17 |
+
"reinit_threshold": -6,
|
18 |
+
"scheduler": "wsd",
|
19 |
+
"layer_idx": 2,
|
20 |
+
"l1_exp": -3,
|
21 |
+
"neuron_reinit_percent": 0.85,
|
22 |
+
"beta1": 1,
|
23 |
+
"beta2": 4,
|
24 |
+
"reinit_target": "y",
|
25 |
+
"sparse_adam": false,
|
26 |
+
"run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}",
|
27 |
+
"project_name": "mlp_map_test",
|
28 |
+
"decoder_bias": true,
|
29 |
+
"l1_beta": 0.99,
|
30 |
+
"alt_sparsity_loss": "log",
|
31 |
+
"l1_ratio": 1,
|
32 |
+
"l1_p": 0,
|
33 |
+
"optimizer": "sparse_adam",
|
34 |
+
"model_type": "mlp_map",
|
35 |
+
"adam_beta1": 0.5,
|
36 |
+
"adam_beta2": 0.9375,
|
37 |
+
"run_name": "M2_S-3_R1_P0"
|
38 |
+
}
|
mlp_map_test/M2_S-4_R1_P0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93d1582ec93565eccc3c1a67e407e1ab828d8e78c0c5acccadbaa9086d077def
|
3 |
+
size 153705080
|
mlp_map_test/M2_S-4_R1_P0_config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"n_features": 25000,
|
3 |
+
"d_model": 768,
|
4 |
+
"lr_exp": -10,
|
5 |
+
"disable_comet": false,
|
6 |
+
"per_neuron_reinit_interval": 0,
|
7 |
+
"reservoir_time_discount": 0.995,
|
8 |
+
"reinit_interval": 800,
|
9 |
+
"max_reinit_neurons": 5000,
|
10 |
+
"reservoir_size": 5000,
|
11 |
+
"n_piles": 292,
|
12 |
+
"log_interval": 200,
|
13 |
+
"reinit_input_norm": "target_scaled",
|
14 |
+
"reinit_input": "x",
|
15 |
+
"reinit_norm_alpha": 0.3,
|
16 |
+
"data_loc": "mlp_data",
|
17 |
+
"reinit_threshold": -6,
|
18 |
+
"scheduler": "wsd",
|
19 |
+
"layer_idx": 2,
|
20 |
+
"l1_exp": -4,
|
21 |
+
"neuron_reinit_percent": 0.85,
|
22 |
+
"beta1": 1,
|
23 |
+
"beta2": 4,
|
24 |
+
"reinit_target": "y",
|
25 |
+
"sparse_adam": false,
|
26 |
+
"run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}",
|
27 |
+
"project_name": "mlp_map_test",
|
28 |
+
"decoder_bias": true,
|
29 |
+
"l1_beta": 0.99,
|
30 |
+
"alt_sparsity_loss": "log",
|
31 |
+
"l1_ratio": 1,
|
32 |
+
"l1_p": 0,
|
33 |
+
"optimizer": "sparse_adam",
|
34 |
+
"model_type": "mlp_map",
|
35 |
+
"adam_beta1": 0.5,
|
36 |
+
"adam_beta2": 0.9375,
|
37 |
+
"run_name": "M2_S-4_R1_P0"
|
38 |
+
}
|
mlp_map_test/M2_S0_R1_P0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8a15a16297cf51d5c6f3860d12ca9f98b822d63598169ea3260423858ce164d
|
3 |
+
size 153705072
|
mlp_map_test/M2_S0_R1_P0_config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"n_features": 25000,
|
3 |
+
"d_model": 768,
|
4 |
+
"lr_exp": -10,
|
5 |
+
"disable_comet": false,
|
6 |
+
"per_neuron_reinit_interval": 0,
|
7 |
+
"reservoir_time_discount": 0.995,
|
8 |
+
"reinit_interval": 800,
|
9 |
+
"max_reinit_neurons": 5000,
|
10 |
+
"reservoir_size": 5000,
|
11 |
+
"n_piles": 292,
|
12 |
+
"log_interval": 200,
|
13 |
+
"reinit_input_norm": "target_scaled",
|
14 |
+
"reinit_input": "x",
|
15 |
+
"reinit_norm_alpha": 0.3,
|
16 |
+
"data_loc": "mlp_data",
|
17 |
+
"reinit_threshold": -6,
|
18 |
+
"scheduler": "wsd",
|
19 |
+
"layer_idx": 2,
|
20 |
+
"l1_exp": 0,
|
21 |
+
"neuron_reinit_percent": 0.85,
|
22 |
+
"beta1": 1,
|
23 |
+
"beta2": 4,
|
24 |
+
"reinit_target": "y",
|
25 |
+
"sparse_adam": false,
|
26 |
+
"run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}",
|
27 |
+
"project_name": "mlp_map_test",
|
28 |
+
"decoder_bias": true,
|
29 |
+
"l1_beta": 0.99,
|
30 |
+
"alt_sparsity_loss": "log",
|
31 |
+
"l1_ratio": 1,
|
32 |
+
"l1_p": 0,
|
33 |
+
"optimizer": "sparse_adam",
|
34 |
+
"model_type": "mlp_map",
|
35 |
+
"adam_beta1": 0.5,
|
36 |
+
"adam_beta2": 0.9375,
|
37 |
+
"run_name": "M2_S0_R1_P0"
|
38 |
+
}
|
mlp_map_test/M3_S-2_R1_P0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f389520ff2899f63ce05fc182e283b6edcf3043d61848128c10b3d6a9713b7f
|
3 |
+
size 153705080
|
mlp_map_test/M3_S-2_R1_P0_config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"n_features": 25000,
|
3 |
+
"d_model": 768,
|
4 |
+
"lr_exp": -10,
|
5 |
+
"disable_comet": false,
|
6 |
+
"per_neuron_reinit_interval": 0,
|
7 |
+
"reservoir_time_discount": 0.995,
|
8 |
+
"reinit_interval": 800,
|
9 |
+
"max_reinit_neurons": 5000,
|
10 |
+
"reservoir_size": 5000,
|
11 |
+
"n_piles": 292,
|
12 |
+
"log_interval": 200,
|
13 |
+
"reinit_input_norm": "target_scaled",
|
14 |
+
"reinit_input": "x",
|
15 |
+
"reinit_norm_alpha": 0.3,
|
16 |
+
"data_loc": "mlp_data",
|
17 |
+
"reinit_threshold": -6,
|
18 |
+
"scheduler": "wsd",
|
19 |
+
"layer_idx": 3,
|
20 |
+
"l1_exp": -2,
|
21 |
+
"neuron_reinit_percent": 0.85,
|
22 |
+
"beta1": 1,
|
23 |
+
"beta2": 4,
|
24 |
+
"reinit_target": "y",
|
25 |
+
"sparse_adam": false,
|
26 |
+
"run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}",
|
27 |
+
"project_name": "mlp_map_test",
|
28 |
+
"decoder_bias": true,
|
29 |
+
"l1_beta": 0.99,
|
30 |
+
"alt_sparsity_loss": "log",
|
31 |
+
"l1_ratio": 1,
|
32 |
+
"l1_p": 0,
|
33 |
+
"optimizer": "sparse_adam",
|
34 |
+
"model_type": "mlp_map",
|
35 |
+
"adam_beta1": 0.5,
|
36 |
+
"adam_beta2": 0.9375,
|
37 |
+
"run_name": "M3_S-2_R1_P0"
|
38 |
+
}
|
mlp_map_test/M3_S-3_R1_P0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f53e9fee4c1085e95b3b0bb983e4050f62d77580bd902f3bbc8ac1a9edee51e
|
3 |
+
size 153705080
|
mlp_map_test/M3_S-3_R1_P0_config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"n_features": 25000,
|
3 |
+
"d_model": 768,
|
4 |
+
"lr_exp": -10,
|
5 |
+
"disable_comet": false,
|
6 |
+
"per_neuron_reinit_interval": 0,
|
7 |
+
"reservoir_time_discount": 0.995,
|
8 |
+
"reinit_interval": 800,
|
9 |
+
"max_reinit_neurons": 5000,
|
10 |
+
"reservoir_size": 5000,
|
11 |
+
"n_piles": 292,
|
12 |
+
"log_interval": 200,
|
13 |
+
"reinit_input_norm": "target_scaled",
|
14 |
+
"reinit_input": "x",
|
15 |
+
"reinit_norm_alpha": 0.3,
|
16 |
+
"data_loc": "mlp_data",
|
17 |
+
"reinit_threshold": -6,
|
18 |
+
"scheduler": "wsd",
|
19 |
+
"layer_idx": 3,
|
20 |
+
"l1_exp": -3,
|
21 |
+
"neuron_reinit_percent": 0.85,
|
22 |
+
"beta1": 1,
|
23 |
+
"beta2": 4,
|
24 |
+
"reinit_target": "y",
|
25 |
+
"sparse_adam": false,
|
26 |
+
"run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}",
|
27 |
+
"project_name": "mlp_map_test",
|
28 |
+
"decoder_bias": true,
|
29 |
+
"l1_beta": 0.99,
|
30 |
+
"alt_sparsity_loss": "log",
|
31 |
+
"l1_ratio": 1,
|
32 |
+
"l1_p": 0,
|
33 |
+
"optimizer": "sparse_adam",
|
34 |
+
"model_type": "mlp_map",
|
35 |
+
"adam_beta1": 0.5,
|
36 |
+
"adam_beta2": 0.9375,
|
37 |
+
"run_name": "M3_S-3_R1_P0"
|
38 |
+
}
|
mlp_map_test/M3_S-4_R1_P0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:545d02f369cf98681e311c5aaf74d1543beb038bad7b9c13b077fa95b67f15a4
|
3 |
+
size 153705080
|
mlp_map_test/M3_S-4_R1_P0_config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"n_features": 25000,
|
3 |
+
"d_model": 768,
|
4 |
+
"lr_exp": -10,
|
5 |
+
"disable_comet": false,
|
6 |
+
"per_neuron_reinit_interval": 0,
|
7 |
+
"reservoir_time_discount": 0.995,
|
8 |
+
"reinit_interval": 800,
|
9 |
+
"max_reinit_neurons": 5000,
|
10 |
+
"reservoir_size": 5000,
|
11 |
+
"n_piles": 292,
|
12 |
+
"log_interval": 200,
|
13 |
+
"reinit_input_norm": "target_scaled",
|
14 |
+
"reinit_input": "x",
|
15 |
+
"reinit_norm_alpha": 0.3,
|
16 |
+
"data_loc": "mlp_data",
|
17 |
+
"reinit_threshold": -6,
|
18 |
+
"scheduler": "wsd",
|
19 |
+
"layer_idx": 3,
|
20 |
+
"l1_exp": -4,
|
21 |
+
"neuron_reinit_percent": 0.85,
|
22 |
+
"beta1": 1,
|
23 |
+
"beta2": 4,
|
24 |
+
"reinit_target": "y",
|
25 |
+
"sparse_adam": false,
|
26 |
+
"run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}",
|
27 |
+
"project_name": "mlp_map_test",
|
28 |
+
"decoder_bias": true,
|
29 |
+
"l1_beta": 0.99,
|
30 |
+
"alt_sparsity_loss": "log",
|
31 |
+
"l1_ratio": 1,
|
32 |
+
"l1_p": 0,
|
33 |
+
"optimizer": "sparse_adam",
|
34 |
+
"model_type": "mlp_map",
|
35 |
+
"adam_beta1": 0.5,
|
36 |
+
"adam_beta2": 0.9375,
|
37 |
+
"run_name": "M3_S-4_R1_P0"
|
38 |
+
}
|
mlp_map_test/M3_S0_R1_P0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a2b2f5f638b0b9e5d48a004eb916a519672e5686e358b75e3bf47ac7a0a1593
|
3 |
+
size 153705072
|
mlp_map_test/M3_S0_R1_P0_config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"n_features": 25000,
|
3 |
+
"d_model": 768,
|
4 |
+
"lr_exp": -10,
|
5 |
+
"disable_comet": false,
|
6 |
+
"per_neuron_reinit_interval": 0,
|
7 |
+
"reservoir_time_discount": 0.995,
|
8 |
+
"reinit_interval": 800,
|
9 |
+
"max_reinit_neurons": 5000,
|
10 |
+
"reservoir_size": 5000,
|
11 |
+
"n_piles": 292,
|
12 |
+
"log_interval": 200,
|
13 |
+
"reinit_input_norm": "target_scaled",
|
14 |
+
"reinit_input": "x",
|
15 |
+
"reinit_norm_alpha": 0.3,
|
16 |
+
"data_loc": "mlp_data",
|
17 |
+
"reinit_threshold": -6,
|
18 |
+
"scheduler": "wsd",
|
19 |
+
"layer_idx": 3,
|
20 |
+
"l1_exp": 0,
|
21 |
+
"neuron_reinit_percent": 0.85,
|
22 |
+
"beta1": 1,
|
23 |
+
"beta2": 4,
|
24 |
+
"reinit_target": "y",
|
25 |
+
"sparse_adam": false,
|
26 |
+
"run_template": "M{layer_idx}_S{l1_exp}_R{l1_ratio}_P{l1_p}",
|
27 |
+
"project_name": "mlp_map_test",
|
28 |
+
"decoder_bias": true,
|
29 |
+
"l1_beta": 0.99,
|
30 |
+
"alt_sparsity_loss": "log",
|
31 |
+
"l1_ratio": 1,
|
32 |
+
"l1_p": 0,
|
33 |
+
"optimizer": "sparse_adam",
|
34 |
+
"model_type": "mlp_map",
|
35 |
+
"adam_beta1": 0.5,
|
36 |
+
"adam_beta2": 0.9375,
|
37 |
+
"run_name": "M3_S0_R1_P0"
|
38 |
+
}
|