{ "iteration": 5000, "best_val_loss": 2.814284086227417, "early_stopping_counter": 4, "learning_rate": 0.0006, "batch_size": 12, "block_size": 1024, "model_args": { "n_layer": 12, "n_head": 12, "n_embd": 768, "block_size": 1024, "bias": false, "vocab_size": 33, "dropout": 0.1 } }