初始化项目，由ModelHub XC社区提供模型

Model: MihaiPopa-1/OmniTranslate-1.1 Source: Original Platform
2026-06-06 16:07:18 +08:00
commit 77ff80b795
7 changed files with 849 additions and 0 deletions
--- a/.gitattributes
+++ b/.gitattributes
@@ -0,0 +1,36 @@
+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text
--- a/README.md
+++ b/README.md
@@ -0,0 +1,628 @@
+---
+base_model: MihaiPopa-1/OmniTranslate-1.0
+# base_model: Unsloth/Qwen3-0.6B-Unsloth-bnb-4bit - Variant that I used for fine-tuning (4-bit BNB quant by Unsloth)
+tags:
+- text-generation-inference
+- translation
+- transformers
+- unsloth
+- qwen3
+- omnitranslate
+license: apache-2.0
+language:
+- abk
+- abq
+- abs
+- acm
+- adh
+- adi
+- ady
+- aeb
+- afr
+- agx
+- aii
+- aim
+- ain
+- ajz
+- akb
+- aln
+- als
+- alt
+- amh
+- anp
+- aoz
+- apc
+- apt
+- arb
+- arg
+- arq
+- ars
+- ary
+- arz
+- asm
+- ast
+- atb
+- ava
+- awa
+- ayp
+- ayr
+- azb
+- azj
+- bak
+- bam
+- ban
+- bar
+- bas
+- bbc
+- bbk
+- bcl
+- bdq
+- bel
+- ben
+- bew
+- bho
+- bhp
+- bis
+- biu
+- bjn
+- bod
+- bos
+- brh
+- brx
+- bts
+- btx
+- bug
+- bul
+- bwi
+- bxr
+- cat
+- cbk
+- ccp
+- ceb
+- ces
+- cfm
+- cha
+- che
+- chr
+- chu
+- chv
+- cjs
+- ckb
+- ckt
+- cmn
+- cnh
+- cnw
+- cos
+- crh
+- crj
+- crk
+- crl
+- crs
+- csb
+- csw
+- csy
+- ctd
+- cym
+- czt
+- dak
+- dan
+- dar
+- deu
+- dik
+- diu
+- div
+- dje
+- dks
+- dln
+- dng
+- dnw
+- doi
+- dru
+- dsb
+- dtp
+- dty
+- dzo
+- ekk
+- ell
+- emj
+- enl
+- enm
+- epo
+- ess
+- eus
+- eve
+- ewo
+- ext
+- fao
+- fas
+- ffm
+- fij
+- fil
+- fin
+- fit
+- fkv
+- fmu
+- fra
+- fro
+- frp
+- fry
+- fuf
+- fur
+- fuv
+- gag
+- gaz
+- gcf
+- gla
+- gle
+- glg
+- glk
+- glv
+- gmh
+- gnb
+- goh
+- gom
+- gos
+- grc
+- gsw
+- gug
+- guj
+- guz
+- hac
+- hae
+- hak
+- hat
+- hau
+- haw
+- hbo
+- heb
+- her
+- hif
+- hil
+- hin
+- hmr
+- hne
+- hns
+- hrv
+- hrx
+- hsb
+- hun
+- hwc
+- hye
+- hyw
+- iba
+- ibg
+- ibo
+- ife
+- ike
+- ikt
+- ilo
+- ina
+- ind
+- inh
+- isl
+- ita
+- ivv
+- jav
+- jpn
+- jun
+- kaa
+- kab
+- kac
+- kak
+- kal
+- kam
+- kan
+- kas
+- kat
+- kaz
+- kbd
+- kca
+- kdh
+- kdr
+- kea
+- kei
+- kgp
+- kha
+- khk
+- khm
+- kik
+- kin
+- kir
+- kiu
+- kjb
+- kjh
+- kmr
+- knc
+- koi
+- kor
+- kos
+- kpv
+- krj
+- krl
+- kru
+- ksh
+- ksw
+- ktj
+- ktz
+- kua
+- kum
+- kwn
+- kyu
+- kzj
+- lad
+- lao
+- lat
+- lbe
+- ldn
+- lew
+- lez
+- lfn
+- lim
+- lin
+- lis
+- lit
+- lki
+- lld
+- lmk
+- lnd
+- lrc
+- ltg
+- ltz
+- lud
+- lug
+- luo
+- lus
+- lvs
+- lwg
+- lzh
+- mag
+- mah
+- mai
+- mak
+- mal
+- mar
+- mas
+- mbf
+- mdf
+- mer
+- mfe
+- mfg
+- mfy
+- mhi
+- mhr
+- mhy
+- min
+- mip
+- mjw
+- mkd
+- mlt
+- mni
+- mnk
+- mns
+- mnw
+- moh
+- mph
+- mqy
+- mri
+- mrj
+- mrw
+- mtg
+- mui
+- mup
+- mus
+- mvp
+- mwf
+- mwl
+- mww
+- mya
+- myv
+- myx
+- mzh
+- nah
+- nan
+- nap
+- naq
+- nbu
+- nde
+- ndo
+- nds
+- new
+- nio
+- njn
+- njo
+- nld
+- nmf
+- nmz
+- nno
+- nob
+- nog
+- non
+- npi
+- npo
+- nrf
+- nri
+- nrm
+- nse
+- nus
+- nya
+- nyn
+- nzm
+- obo
+- oci
+- ojb
+- olo
+- orv
+- ory
+- oss
+- ota
+- oto
+- otw
+- pam
+- pan
+- pap
+- pbt
+- pcd
+- pck
+- pcm
+- pfl
+- plt
+- pmq
+- pmx
+- pnb
+- pnt
+- pol
+- por
+- pov
+- ppk
+- pps
+- prg
+- pui
+- pxm
+- quc
+- qul
+- qup
+- qus
+- quz
+- raw
+- rcf
+- rel
+- rhg
+- ria
+- rjs
+- rmc
+- rml
+- rmn
+- rmy
+- rnl
+- roh
+- ron
+- rtm
+- rue
+- run
+- rus
+- sah
+- san
+- sat
+- sck
+- scn
+- sda
+- sdc
+- sdh
+- ses
+- sgc
+- sgh
+- sid
+- sin
+- sju
+- skr
+- slk
+- slv
+- sma
+- sme
+- smj
+- smn
+- smo
+- sms
+- smt
+- sna
+- snd
+- som
+- sot
+- spa
+- srd
+- srp
+- ssw
+- sul
+- sun
+- swe
+- swg
+- swh
+- syc
+- syl
+- szl
+- tab
+- tam
+- taq
+- tat
+- tcy
+- tcz
+- tel
+- tet
+- tgk
+- tha
+- thl
+- tig
+- tir
+- tkl
+- tkr
+- tlh
+- tly
+- tok
+- ton
+- tpi
+- tpw
+- trc
+- trp
+- trs
+- ttj
+- tuk
+- tur
+- tuv
+- twx
+- tyv
+- tzl
+- tzm
+- udm
+- uig
+- ukr
+- urd
+- uzn
+- uzs
+- vap
+- vie
+- vot
+- vro
+- war
+- way
+- wba
+- wbm
+- wes
+- whk
+- wlx
+- wol
+- wsg
+- wwa
+- xal
+- xho
+- xmm
+- xmv
+- xog
+- yaz
+- ydd
+- yor
+- yrk
+- yrl
+- yua
+- yue
+- zea
+- zgh
+- zom
+- zsm
+- zul
+pipeline_tag: translation
+datasets:
+- MihaiPopa-1/OmniSurgical-1.1
+---
+
+# OmniTranslate 1.1
+
+OmniTranslate 1.1 is a massively multilingual machine translation model supporting over 500 languages. Fine-tuned from [Qwen 3 0.6B](https://www.huggingface.co/Qwen/Qwen3-0.6B) (with Unsloth), this model is designed for translation tasks on any device!
+
+# Features
+* **500+ Languages Supported:** The broadest coverage of languages supported for a translation model that's under 1 billion parameters!
+* **Tiny Size:** Beats any other large model on speed and memory usage. No other model is able to compete with this!
+
+# Improvements over 1.0
+* OmniTranslate now makes less hiccups when translating to Romanian (like "ami"), and the diacritic bug on Romanian translations has been mostly fixed!
+
+There's a tiny chance that the model will spit out without diacritics (mostly due to seeds) though, so try a different one.
+
+# Experimental Features
+* We added 2 new languages, Emoji and Sulfuristic Speak (my own language for OmniTranslate 1.1 to quite fit the Chaos Cubed Minecraft vibe!). Try these out:
+
+## Emoji
+```python
+from transformers import AutoModelForCausalLM, AutoTokenizer
+import torch
+
+# 1. Load from your Hugging Face Repo
+model_id = "MihaiPopa-1/OmniTranslate-1.1"
+
+tokenizer = AutoTokenizer.from_pretrained(model_id)
+model = AutoModelForCausalLM.from_pretrained(
+    model_id,
+    torch_dtype=torch.float32, # Standard for CPU
+    device_map="cpu"           # Forces CPU usage
+)
+
+# 2. Translate to Emoji
+prompt = "<|im_start|>user\nTranslate to emj_Emoj: We love the world!<|im_end|>\n<|im_start|>assistant\n<think>\n"
+inputs = tokenizer(prompt, return_tensors="pt").to("cpu")
+
+with torch.no_grad():
+    outputs = model.generate(**inputs, max_new_tokens=64, temperature=0.1)
+    
+print(tokenizer.decode(outputs[0], skip_special_tokens=True))
+```
+
+## Sulfuristic Speak
+```python
+from transformers import AutoModelForCausalLM, AutoTokenizer
+import torch
+
+# 1. Load from your Hugging Face Repo
+model_id = "MihaiPopa-1/OmniTranslate-1.1"
+
+tokenizer = AutoTokenizer.from_pretrained(model_id)
+model = AutoModelForCausalLM.from_pretrained(
+    model_id,
+    torch_dtype=torch.float32, # Standard for CPU
+    device_map="cpu"           # Forces CPU usage
+)
+
+# 2. Translate to Sulfuristic Speak ("Translate to Sulfuristic Speak" also works too!)
+prompt = "<|im_start|>user\nTranslate to sul_Latn: Let's ride a Sulfur Cube!<|im_end|>\n<|im_start|>assistant\n<think>\n"
+inputs = tokenizer(prompt, return_tensors="pt").to("cpu")
+
+with torch.no_grad():
+    outputs = model.generate(**inputs, max_new_tokens=128, temperature=0.1)
+    
+print(tokenizer.decode(outputs[0], skip_special_tokens=True))
+```
+
+# Notes
+OmniTranslate 1.1 is still a experimental model and shouldn't be used for tasks where accurate translations matter.
+
+# Notes
+Providing the ISO code instead of the language name can improve the results a lot.
+
+# Usage
+Code is by Gemini 3 Flash (then some little modifications by myself):
+```python
+from transformers import AutoModelForCausalLM, AutoTokenizer
+import torch
+
+# 1. Load from your Hugging Face Repo
+model_id = "MihaiPopa-1/OmniTranslate-1.1"
+
+tokenizer = AutoTokenizer.from_pretrained(model_id)
+model = AutoModelForCausalLM.from_pretrained(
+    model_id,
+    torch_dtype=torch.float32, # Standard for CPU
+    device_map="cpu"           # Forces CPU usage
+)
+
+# 2. Translate (replace ron_Latn with your language here)
+prompt = "<|im_start|>user\nTranslate to ron_Latn: OmniTranslate is a massively multilingual machine translation model supporting over 500 languages!<|im_end|>\n<|im_start|>assistant\n<think>\n"
+inputs = tokenizer(prompt, return_tensors="pt").to("cpu")
+
+with torch.no_grad():
+    outputs = model.generate(**inputs, max_new_tokens=256, temperature=0.1)
+    
+print(tokenizer.decode(outputs[0], skip_special_tokens=True))
+```
+
+# Data Used
+I used my own [OmniSurgical 1.1](https://www.huggingface.co/datasets/MihaiPopa-1/OmniSurgical-1.1), which the dataset itself contains a part of [HF's FineTranslations](https://www.huggingface.co/datasets/HuggingFaceFW/finetranslations)
+
+---
+
+# Uploaded finetuned model
+
+- **Developed by:** MihaiPopa-1
+- **License:** apache-2.0
+- **Finetuned from model :** unsloth/qwen3-0.6b-unsloth-bnb-4bit
+
+This qwen3 model was trained 2x faster with [Unsloth](https://github.com/unslothai/unsloth) and Huggingface's TRL library.
+
+[<img src="https://raw.githubusercontent.com/unslothai/unsloth/main/images/unsloth%20made%20with%20love.png" width="200"/>](https://github.com/unslothai/unsloth)
--- a/chat_template.jinja
+++ b/chat_template.jinja
@@ -0,0 +1,99 @@
+{%- if tools %}
+    {{- '<|im_start|>system\n' }}
+    {%- if messages[0].role == 'system' %}
+        {{- messages[0].content + '\n\n' }}
+    {%- endif %}
+    {{- "# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
+    {%- for tool in tools %}
+        {{- "\n" }}
+        {{- tool | tojson }}
+    {%- endfor %}
+    {{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }}
+{%- else %}
+    {%- if messages[0].role == 'system' %}
+        {{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }}
+    {%- endif %}
+{%- endif %}
+{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}
+{%- for forward_message in messages %}
+    {%- set index = (messages|length - 1) - loop.index0 %}
+    {%- set message = messages[index] %}
+    {%- set current_content = message.content if message.content is defined and message.content is not none else '' %}
+    {%- set tool_start = '<tool_response>' %}
+    {%- set tool_start_length = tool_start|length %}
+    {%- set start_of_message = current_content[:tool_start_length] %}
+    {%- set tool_end = '</tool_response>' %}
+    {%- set tool_end_length = tool_end|length %}
+    {%- set start_pos = (current_content|length) - tool_end_length %}
+    {%- if start_pos < 0 %}
+        {%- set start_pos = 0 %}
+    {%- endif %}
+    {%- set end_of_message = current_content[start_pos:] %}
+    {%- if ns.multi_step_tool and message.role == "user" and not(start_of_message == tool_start and end_of_message == tool_end) %}
+        {%- set ns.multi_step_tool = false %}
+        {%- set ns.last_query_index = index %}
+    {%- endif %}
+{%- endfor %}
+{%- for message in messages %}
+    {%- if (message.role == "user") or (message.role == "system" and not loop.first) %}
+        {{- '<|im_start|>' + message.role + '\n' + message.content + '<|im_end|>' + '\n' }}
+    {%- elif message.role == "assistant" %}
+        {%- set m_content = message.content if message.content is defined and message.content is not none else '' %}
+        {%- set content = m_content %}
+        {%- set reasoning_content = '' %}
+        {%- if message.reasoning_content is defined and message.reasoning_content is not none %}
+            {%- set reasoning_content = message.reasoning_content %}
+        {%- else %}
+            {%- if '</think>' in m_content %}
+                {%- set content = (m_content.split('</think>')|last).lstrip('\n') %}
+                {%- set reasoning_content = (m_content.split('</think>')|first).rstrip('\n') %}
+                {%- set reasoning_content = (reasoning_content.split('<think>')|last).lstrip('\n') %}
+            {%- endif %}
+        {%- endif %}
+        {%- if loop.index0 > ns.last_query_index %}
+            {%- if loop.last or (not loop.last and (not reasoning_content.strip() == '')) %}
+                {{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content.strip('\n') + '\n</think>\n\n' + content.lstrip('\n') }}
+            {%- else %}
+                {{- '<|im_start|>' + message.role + '\n' + content }}
+            {%- endif %}
+        {%- else %}
+            {{- '<|im_start|>' + message.role + '\n' + content }}
+        {%- endif %}
+        {%- if message.tool_calls %}
+            {%- for tool_call in message.tool_calls %}
+                {%- if (loop.first and content) or (not loop.first) %}
+                    {{- '\n' }}
+                {%- endif %}
+                {%- if tool_call.function %}
+                    {%- set tool_call = tool_call.function %}
+                {%- endif %}
+                {{- '<tool_call>\n{"name": "' }}
+                {{- tool_call.name }}
+                {{- '", "arguments": ' }}
+                {%- if tool_call.arguments is string %}
+                    {{- tool_call.arguments }}
+                {%- else %}
+                    {{- tool_call.arguments | tojson }}
+                {%- endif %}
+                {{- '}\n</tool_call>' }}
+            {%- endfor %}
+        {%- endif %}
+        {{- '<|im_end|>\n' }}
+    {%- elif message.role == "tool" %}
+        {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
+            {{- '<|im_start|>user' }}
+        {%- endif %}
+        {{- '\n<tool_response>\n' }}
+        {{- message.content }}
+        {{- '\n</tool_response>' }}
+        {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
+            {{- '<|im_end|>\n' }}
+        {%- endif %}
+    {%- endif %}
+{%- endfor %}
+{%- if add_generation_prompt %}
+    {{- '<|im_start|>assistant\n' }}
+    {%- if enable_thinking is defined and enable_thinking is false %}
+        {{- '<think>\n\n</think>\n\n' }}
+    {%- endif %}
+{%- endif %}
--- a/config.json
+++ b/config.json
@@ -0,0 +1,64 @@
+{
+    "architectures": [
+        "Qwen3ForCausalLM"
+    ],
+    "attention_bias": false,
+    "attention_dropout": 0.0,
+    "bos_token_id": null,
+    "torch_dtype": "float16",
+    "eos_token_id": 151645,
+    "head_dim": 128,
+    "hidden_act": "silu",
+    "hidden_size": 1024,
+    "initializer_range": 0.02,
+    "intermediate_size": 3072,
+    "layer_types": [
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention"
+    ],
+    "max_position_embeddings": 40960,
+    "max_window_layers": 28,
+    "model_type": "qwen3",
+    "num_attention_heads": 16,
+    "num_hidden_layers": 28,
+    "num_key_value_heads": 8,
+    "pad_token_id": 151669,
+    "rms_norm_eps": 1e-06,
+    "rope_parameters": {
+        "rope_theta": 1000000,
+        "rope_type": "default"
+    },
+    "sliding_window": null,
+    "tie_word_embeddings": true,
+    "unsloth_fixed": true,
+    "unsloth_version": "2026.4.4",
+    "use_cache": false,
+    "use_sliding_window": false,
+    "vocab_size": 151936
+}
--- a/model.safetensors
+++ b/model.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ddbd4e1702ef2edb82380ae4453f305c47516c88bb04d40ecb31cebea6830680
+size 1192135096
--- a/tokenizer.json
+++ b/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d7430e9138b76e93fb6f93462394d236b411111aef53cb421ba97d2691040cca
+size 11423114
--- a/tokenizer_config.json
+++ b/tokenizer_config.json