初始化项目,由ModelHub XC社区提供模型

Model: fpadovani/tur_10mb_baseline_seed3407
Source: Original Platform
This commit is contained in:
ModelHub XC
2026-05-23 00:50:33 +08:00
commit e5c6f8403c
64 changed files with 1359939 additions and 0 deletions

View File

@@ -0,0 +1,35 @@
{
"_name_or_path": "goldfish-models/tur_latn_10mb",
"activation_function": "gelu",
"architectures": [
"GPT2LMHeadModel"
],
"attn_pdrop": 0.1,
"bos_token_id": 50000,
"embd_pdrop": 0.1,
"eos_token_id": 50001,
"initializer_range": 0.02,
"layer_norm_epsilon": 1e-05,
"model_type": "gpt2",
"n_ctx": 2048,
"n_embd": 512,
"n_head": 8,
"n_inner": 2048,
"n_layer": 4,
"n_positions": 2048,
"pad_token_id": 50002,
"prefix": "[CLS]",
"reorder_and_upcast_attn": false,
"resid_pdrop": 0.1,
"scale_attn_by_inverse_layer_idx": false,
"scale_attn_weights": true,
"summary_activation": null,
"summary_first_dropout": 0.1,
"summary_proj_to_labels": true,
"summary_type": "cls_index",
"summary_use_proj": true,
"torch_dtype": "bfloat16",
"transformers_version": "4.47.0",
"use_cache": true,
"vocab_size": 51200
}

View File

@@ -0,0 +1,7 @@
{
"_from_model_config": true,
"bos_token_id": 50000,
"eos_token_id": 50001,
"pad_token_id": 50002,
"transformers_version": "4.47.0"
}

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:cb4dcd4378e7a7e1603a21e55d1e6505a66f18765a7b55bb86409936e4a7e8cf
size 79752272

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:81419e4a785fac624cc8515445a8541224b31b6ae09d2bdade3188554c1a4846
size 159538443

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:65ca5ec9eda2ea61c45da5c1760fb58186ace0feab4a88ea497a5fd5c482b942
size 14645

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:6ff2ab183ac3438c73e3152ef5bf274c4bf4198fe8bfc2e520d27cbc6c1be00f
size 1465

File diff suppressed because it is too large Load Diff

210940
checkpoint-5000/tokenizer.json Normal file

File diff suppressed because one or more lines are too long

File diff suppressed because it is too large Load Diff

File diff suppressed because it is too large Load Diff

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:47c14992ed16d92c5aed65f9944df2da038052e34eaea8f6eb2f0cf4bed6a0f8
size 6097