2023-10-19 17:45:43 +02:00
|
|
|
# Root-table settings: these keys appear before the first [[sae]] header, so
# they belong to the top-level table rather than to any [[sae]] entry.
# NOTE(review): the meanings below are inferred from the key names only;
# confirm them against the code that loads this file.
# batch_size: presumably the number of samples per batch.
batch_size = 64
|
2023-12-13 20:42:30 +01:00
|
|
|
# steps: presumably the total number of training steps.
steps = 500000
|
|
|
|
# print_every: presumably the reporting interval, in steps (TODO confirm).
print_every = 10000
|
|
|
|
# seed: presumably the random seed for the run.
seed = 0
|
2023-10-19 17:45:43 +02:00
|
|
|
# cnn_storage: relative path to a ".eqx" file. Presumably the stored CNN;
# whether it is read, written, or both is not visible here (TODO confirm).
cnn_storage = "./res/cnn.eqx"
|
2023-12-13 20:42:30 +01:00
|
|
|
|
|
|
|
# One element of the `sae` array of tables (each [[sae]] header appends a new
# table). This entry sets learning_rate = 0.1, the largest value among the
# [[sae]] entries visible in this file; layer, hidden_size and input_size are
# the same in all of them.
# NOTE(review): "sae" presumably means sparse autoencoder, with `layer`
# selecting the network layer it is attached to — confirm against the loader.
[[sae]]
|
|
|
|
layer = 6
|
|
|
|
hidden_size = 1000
|
|
|
|
input_size = 64
|
|
|
|
learning_rate = 0.1
|
|
|
|
|
|
|
|
# One element of the `sae` array of tables. Same layer, hidden_size and
# input_size as the other [[sae]] entries visible in this file; this entry
# sets learning_rate = 3e-2 (i.e. 0.03).
# NOTE(review): key meanings are inferred from their names — confirm against
# the code that consumes this file.
[[sae]]
|
|
|
|
layer = 6
|
|
|
|
hidden_size = 1000
|
|
|
|
input_size = 64
|
|
|
|
learning_rate = 3e-2
|
|
|
|
|
|
|
|
# One element of the `sae` array of tables. Same layer, hidden_size and
# input_size as the other [[sae]] entries visible in this file; this entry
# sets learning_rate = 1e-2 (i.e. 0.01).
# NOTE(review): key meanings are inferred from their names — confirm against
# the code that consumes this file.
[[sae]]
|
|
|
|
layer = 6
|
|
|
|
hidden_size = 1000
|
|
|
|
input_size = 64
|
|
|
|
learning_rate = 1e-2
|
|
|
|
|
|
|
|
# One element of the `sae` array of tables. Same layer, hidden_size and
# input_size as the other [[sae]] entries visible in this file; this entry
# sets learning_rate = 3e-3 (i.e. 0.003).
# NOTE(review): key meanings are inferred from their names — confirm against
# the code that consumes this file.
[[sae]]
|
|
|
|
layer = 6
|
|
|
|
hidden_size = 1000
|
|
|
|
input_size = 64
|
|
|
|
learning_rate = 3e-3
|
|
|
|
|
|
|
|
# One element of the `sae` array of tables. Same layer, hidden_size and
# input_size as the other [[sae]] entries visible in this file; this entry
# sets learning_rate = 1e-3 (i.e. 0.001).
# NOTE(review): key meanings are inferred from their names — confirm against
# the code that consumes this file.
[[sae]]
|
|
|
|
layer = 6
|
|
|
|
hidden_size = 1000
|
|
|
|
input_size = 64
|
|
|
|
learning_rate = 1e-3
|
|
|
|
|
|
|
|
# One element of the `sae` array of tables. Same layer, hidden_size and
# input_size as the other [[sae]] entries visible in this file; this entry
# sets learning_rate = 3e-4 (i.e. 0.0003).
# NOTE(review): key meanings are inferred from their names — confirm against
# the code that consumes this file.
[[sae]]
|
|
|
|
layer = 6
|
|
|
|
hidden_size = 1000
|
|
|
|
input_size = 64
|
|
|
|
learning_rate = 3e-4
|
|
|
|
|
|
|
|
# One element of the `sae` array of tables. Same layer, hidden_size and
# input_size as the other [[sae]] entries visible in this file; this entry
# sets learning_rate = 1e-4 (i.e. 0.0001), the smallest value among the
# [[sae]] entries visible here.
# NOTE(review): key meanings are inferred from their names — confirm against
# the code that consumes this file.
[[sae]]
|
|
|
|
layer = 6
|
|
|
|
hidden_size = 1000
|
|
|
|
input_size = 64
|
|
|
|
learning_rate = 1e-4
|