初始化项目,由ModelHub XC社区提供模型

Model: DCAgent/b1_top32_seq
Source: Original Platform
This commit is contained in:
ModelHub XC
2026-06-09 07:43:18 +08:00
commit c3f9189599
20 changed files with 153470 additions and 0 deletions

16
train_results.json Normal file
View File

@@ -0,0 +1,16 @@
{
"achieved_tflops_per_gpu": 0.0038077623951744254,
"achieved_tflops_per_gpu_theoretical": 589.4953939312312,
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2470691055059433,
"mfu_percent": 0.00026909981591338695,
"mfu_percent_theoretical": 41.660451867931535,
"total_flos": 1344232108851200.0,
"train_loss": 0.2903653360683384,
"train_runtime": 22064.0098,
"train_samples_per_second": 2.775,
"train_steps_per_second": 0.174,
"valid_targets_mean": 2973.0,
"valid_targets_min": 811
}