初始化项目,由ModelHub XC社区提供模型

Model: fpadovani/tur_indomain_prepretraining_seed443
Source: Original Platform
This commit is contained in:
ModelHub XC
2026-05-30 04:36:22 +08:00
commit d774fe1195
97 changed files with 2033223 additions and 0 deletions

View File

@@ -0,0 +1,35 @@
{
"_name_or_path": "goldfish-models/tur_latn_10mb",
"activation_function": "gelu",
"architectures": [
"GPT2LMHeadModel"
],
"attn_pdrop": 0.1,
"bos_token_id": 50000,
"embd_pdrop": 0.1,
"eos_token_id": 50001,
"initializer_range": 0.02,
"layer_norm_epsilon": 1e-05,
"model_type": "gpt2",
"n_ctx": 2048,
"n_embd": 512,
"n_head": 8,
"n_inner": 2048,
"n_layer": 4,
"n_positions": 2048,
"pad_token_id": 50002,
"prefix": "[CLS]",
"reorder_and_upcast_attn": false,
"resid_pdrop": 0.1,
"scale_attn_by_inverse_layer_idx": false,
"scale_attn_weights": true,
"summary_activation": null,
"summary_first_dropout": 0.1,
"summary_proj_to_labels": true,
"summary_type": "cls_index",
"summary_use_proj": true,
"torch_dtype": "bfloat16",
"transformers_version": "4.47.0",
"use_cache": true,
"vocab_size": 51200
}

View File

@@ -0,0 +1,7 @@
{
"_from_model_config": true,
"bos_token_id": 50000,
"eos_token_id": 50001,
"pad_token_id": 50002,
"transformers_version": "4.47.0"
}

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e660ea3b9087bf515ef59a7502e491c262827c37fb79b8108da0830f71397df5
size 79752272

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:1a42c5a9493833024fd51018a8a49af1f2cea0e9645dd68b0cf0fe2331de2b13
size 159538443

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:84eb9f55b9e425120c0f0c6f7e2475a0f5d883dcf62ac5b50b34d84ca2d8482f
size 14645

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:b6b3ad5549d5099e5cee60aa161fa531e77bd60d13a0dc32433f3e6e01a85319
size 1465

File diff suppressed because it is too large Load Diff

210940
checkpoint-2500/tokenizer.json Normal file

File diff suppressed because one or more lines are too long

File diff suppressed because it is too large Load Diff

File diff suppressed because it is too large Load Diff

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:6dc7942391c97f5c71d525af067d82cf56a6d2234bb905634d507c9b596fea7c
size 6161