{"seed": 47, "batch_size": 4096, "buffer_mult": 512, "lr": 0.0001, "num_tokens": 10000000, "l1_coeff": 0.003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "model_batch_size": 512, "buffer_size": 2097152, "buffer_batches": 16384}