{ "iteration": 2000, "best_val_loss": 0.51076340675354, "early_stopping_counter": 1, "learning_rate": 1e-05, "batch_size": 8, "block_size": 1024, "model_args": { "n_layer": 12, "n_head": 12, "n_embd": 768, "block_size": 1024, "bias": false, "vocab_size": 50257, "dropout": 0.0 } }