{
  "iteration": 5000,
  "best_val_loss": 2.814284086227417,
  "early_stopping_counter": 4,
  "learning_rate": 0.0006,
  "batch_size": 12,
  "block_size": 1024,
  "model_args": {
    "n_layer": 12,
    "n_head": 12,
    "n_embd": 768,
    "block_size": 1024,
    "bias": false,
    "vocab_size": 33,
    "dropout": 0.1
  }
}