17 lines
491 B
JSON
17 lines
491 B
JSON
|
|
{
|
||
|
|
"model_id": "laabam-ai-3b-v1-epoch2",
|
||
|
|
"brand": "Laabam AI",
|
||
|
|
"base_model": "Qwen/Qwen2.5-3B-Instruct",
|
||
|
|
"continued_from": "/mnt/d/laabamai/outputs/laabam-ai-3b-v1/final-adapter",
|
||
|
|
"epoch": 2,
|
||
|
|
"train_loss": 0.563843307071262,
|
||
|
|
"train_runtime_seconds": 48833.440865039825,
|
||
|
|
"train_samples": 36000,
|
||
|
|
"eval_samples": 500,
|
||
|
|
"learning_rate": 5e-05,
|
||
|
|
"effective_batch_size": 8,
|
||
|
|
"max_seq_length": 1024,
|
||
|
|
"gpu": "NVIDIA GeForce RTX 3050",
|
||
|
|
"vram_gb": 6.0,
|
||
|
|
"backend": "unsloth"
|
||
|
|
}
|