From 8d51581b51645dd6085e53e2403bd9a9ba423a0b Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sun, 17 May 2026 04:56:09 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: pfnet/Qwen3-1.7B-pfn-qfin Source: Original Platform --- .gitattributes | 36 ++++++++++++++++++ LICENSE | 3 ++ NOTICE | 1 + README.md | 82 +++++++++++++++++++++++++++++++++++++++++ added_tokens.json | 28 ++++++++++++++ config.json | 1 + configuration.json | 1 + generation_config.json | 6 +++ merges.txt | 3 ++ model.safetensors | 3 ++ special_tokens_map.json | 31 ++++++++++++++++ tokenizer.json | 3 ++ tokenizer_config.json | 3 ++ vocab.json | 3 ++ 14 files changed, 204 insertions(+) create mode 100644 .gitattributes create mode 100644 LICENSE create mode 100644 NOTICE create mode 100644 README.md create mode 100644 added_tokens.json create mode 100644 config.json create mode 100644 configuration.json create mode 100644 generation_config.json create mode 100644 merges.txt create mode 100644 model.safetensors create mode 100644 special_tokens_map.json create mode 100644 tokenizer.json create mode 100644 tokenizer_config.json create mode 100644 vocab.json diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..52373fe --- /dev/null +++ b/.gitattributes @@ -0,0 +1,36 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text 
+*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/LICENSE b/LICENSE new file mode 100644 index 0000000..84220ad --- /dev/null +++ b/LICENSE @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:988b37b0b21ca130ad84a092429e4e5bceec5f86dfe85a8ca3e06ea703b960ca +size 8720 diff --git a/NOTICE b/NOTICE new file mode 100644 index 0000000..727c739 --- /dev/null +++ b/NOTICE @@ -0,0 +1 @@ +This software includes the work (Qwen/Qwen3-1.7b) that is distributed in the Apache License 2.0. 
\ No newline at end of file diff --git a/README.md b/README.md new file mode 100644 index 0000000..4891f84 --- /dev/null +++ b/README.md @@ -0,0 +1,82 @@ +--- +language: +- en +- ja +library_name: transformers +pipeline_tag: text-generation +license: other +license_name: plamo-community-license +license_link: LICENSE +base_model: +- Qwen/Qwen3-1.7B-Base +--- + +# Qwen3-1.7B-pfn-qfin + +## Model Description +Qwen3-1.7B-pfn-qfin is a fine-tuned model based on [Qwen/Qwen3-1.7B-Base](https://huggingface.co/Qwen/Qwen3-1.7B-Base). +This is the base model, which is good at generating continuous sentences. +Qwen3-1.7B-pfn-qfin is fine-tuned on about 400M tokens from multiple special datasets generated by Preferred Networks, which are clear for commercial use. +The fine-tuning was carried out with a context length of 2048. +This model is released under the [PLaMo Community License](https://www.preferred.jp/ja/plamo-community-license/). + +# Benchmarking +The benchmark scores are obtained using the [Japanese Language Model Financial Evaluation Harness](https://github.com/pfnet-research/japanese-lm-fin-harness). +For the benchmark, 0-shot and default prompts are used. 
+ +| Task |Metric|Qwen3-1.7B| Ours | +|----------------|------|------|------| +|chabsa |f1 |0.5734|0.7116| +|cma_basics |acc |0.3158|0.5263| +|cpa_audit |acc |0.1583|0.1884| +|fp2 |acc |0.4737|0.4912| +|security_sales_1|acc |0.2421|0.3389| +|----------------|------|------|------| +|Overall | |0.3527|0.4513| + +## Usage +Install the required libraries as follows: +```sh +>>> python -m pip install "transformers>=4.51.0" +``` + +Execute the following Python code: +```python +import torch +from transformers import AutoTokenizer, AutoModelForCausalLM + +tokenizer = AutoTokenizer.from_pretrained("pfnet/Qwen3-1.7B-pfn-qfin", trust_remote_code=True) +model = AutoModelForCausalLM.from_pretrained("pfnet/Qwen3-1.7B-pfn-qfin", device_map="auto", trust_remote_code=True) +text = "日本銀行は" +input_ids = tokenizer(text, return_tensors="pt").input_ids.to(model.device) +with torch.no_grad(): + generated_tokens = model.generate( + inputs=input_ids, + max_new_tokens=32, + do_sample=True, + top_k=50, + top_p=0.95, + temperature=1.0, + pad_token_id=tokenizer.pad_token_id, + bos_token_id=tokenizer.bos_token_id, + eos_token_id=tokenizer.eos_token_id + )[0] +generated_text = tokenizer.decode(generated_tokens) +print(generated_text) +``` + +## Bias, Risks, and Limitations +Qwen3-1.7B-pfn-qfin is a new technology that carries risks with use. +Testing conducted to date has been in English and Japanese, and has not covered, nor could it cover, all scenarios. +For these reasons, as with all LLMs, Qwen3-1.7B-pfn-qfin’s potential outputs cannot be predicted in advance, and the model may in some instances produce inaccurate, biased or other objectionable responses to user prompts. +This model is not designed for legal, tax, investment, financial, or other advice. +Therefore, before deploying any applications of Qwen3-1.7B-pfn-qfin, developers should perform safety testing and tuning tailored to their specific applications of the model. + +## Authors +Preferred Networks, Inc. 
+ - Masanori Hirano + - Kentaro Imajo + - Takeshi Masuko + +# License +[PLaMo Community License](https://www.preferred.jp/ja/plamo-community-license/) \ No newline at end of file diff --git a/added_tokens.json b/added_tokens.json new file mode 100644 index 0000000..b54f913 --- /dev/null +++ b/added_tokens.json @@ -0,0 +1,28 @@ +{ + "": 151668, + "": 151658, + "": 151666, + "": 151667, + "": 151657, + "": 151665, + "<|box_end|>": 151649, + "<|box_start|>": 151648, + "<|endoftext|>": 151643, + "<|file_sep|>": 151664, + "<|fim_middle|>": 151660, + "<|fim_pad|>": 151662, + "<|fim_prefix|>": 151659, + "<|fim_suffix|>": 151661, + "<|im_end|>": 151645, + "<|im_start|>": 151644, + "<|image_pad|>": 151655, + "<|object_ref_end|>": 151647, + "<|object_ref_start|>": 151646, + "<|quad_end|>": 151651, + "<|quad_start|>": 151650, + "<|repo_name|>": 151663, + "<|video_pad|>": 151656, + "<|vision_end|>": 151653, + "<|vision_pad|>": 151654, + "<|vision_start|>": 151652 +} diff --git a/config.json b/config.json new file mode 100644 index 0000000..d627d6c --- /dev/null +++ b/config.json @@ -0,0 +1 @@ +{"architectures": ["Qwen3ForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 151643, "eos_token_id": 151643, "head_dim": 128, "hidden_act": "silu", "hidden_size": 2048, "initializer_range": 0.02, "intermediate_size": 6144, "max_position_embeddings": 32768, "max_window_layers": 28, "model_type": "qwen3", "num_attention_heads": 16, "num_hidden_layers": 28, "num_key_value_heads": 8, "rms_norm_eps": 1e-06, "rope_scaling": null, "rope_theta": 1000000, "sliding_window": null, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "transformers_version": "4.51.3", "use_cache": true, "use_sliding_window": false, "vocab_size": 151936} \ No newline at end of file diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..bbeeda1 --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework": "pytorch", "task": "text-generation", 
"allow_remote": true} \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..d46f198 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,6 @@ +{ + "bos_token_id": 151643, + "eos_token_id": 151643, + "max_new_tokens": 2048, + "transformers_version": "4.51.3" +} diff --git a/merges.txt b/merges.txt new file mode 100644 index 0000000..80c1a19 --- /dev/null +++ b/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/model.safetensors b/model.safetensors new file mode 100644 index 0000000..35813f8 --- /dev/null +++ b/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4422f2c7c4848809d72fb03900364777d98cdf663a284e1a418a01e7b4897015 +size 3441185608 diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..17305b3 --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,31 @@ +{ + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "eos_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..cd71f61 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 
0000000..5479a1e --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a3a6f623ddaad552d27957966270df1c7c6b8777ddaebeb4753abd4ed635edd +size 9709 diff --git a/vocab.json b/vocab.json new file mode 100644 index 0000000..6c49fc6 --- /dev/null +++ b/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833