初始化项目,由ModelHub XC社区提供模型

Model: DCAgent/a1-stack_jest
Source: Original Platform
This commit is contained in:
ModelHub XC
2026-05-13 09:08:39 +08:00
commit 0f8e19a621
23 changed files with 163311 additions and 0 deletions

16
train_results.json Normal file
View File

@@ -0,0 +1,16 @@
{
"achieved_tflops_per_gpu": 0.003747713620293238,
"achieved_tflops_per_gpu_theoretical": 603.0470121825239,
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1903749257326126,
"mfu_percent": 0.0002648560862398048,
"mfu_percent_theoretical": 42.618163405125365,
"total_flos": 1474549610774528.0,
"train_loss": 0.20471333478722384,
"train_runtime": 24590.8199,
"train_samples_per_second": 2.851,
"train_steps_per_second": 0.178,
"valid_targets_mean": 5778.1,
"valid_targets_min": 3072
}