# Global run settings; the [[sae]] tables further down hold per-configuration values.
batch_size = 64
steps = 1_000_000
print_every = 50_000  # presumably counted in steps; confirm against the consumer
seed = 0
# Relative path. The .eqx suffix suggests an Equinox-serialized model (TODO confirm).
cnn_storage = "./res/cnn.eqx"

# learning_rate is the only value that differs between the [[sae]] entries in this file.
[[sae]]
layer = 6
hidden_size = 300
input_size = 64
learning_rate = 1e-3
l1 = 3e-4  # from Neel Nanda's sae git

# Same settings as the first [[sae]] entry, with learning_rate = 3e-4.
[[sae]]
layer = 6
hidden_size = 300
input_size = 64
learning_rate = 3e-4
l1 = 3e-4

# Same settings as the first [[sae]] entry, with learning_rate = 1e-4.
[[sae]]
layer = 6
hidden_size = 300
input_size = 64
learning_rate = 1e-4
l1 = 3e-4

# Same settings as the first [[sae]] entry, with learning_rate = 3e-5.
[[sae]]
layer = 6
hidden_size = 300
input_size = 64
learning_rate = 3e-5
l1 = 3e-4