{ "iteration": 2000, "best_val_loss": 0.06397182494401932, "early_stopping_counter": 0, "learning_rate": 1e-05, "batch_size": 12, "block_size": 1024, "model_args": { "n_layer": 12, "n_head": 12, "n_embd": 768, "block_size": 1024, "bias": false, "vocab_size": 33, "dropout": 0.1 } }