From bb65529c16748a2c8f03017e6782b042db952c51 Mon Sep 17 00:00:00 2001
From: ModelHub XC <noreply@modelhub.org.cn>
Date: Sun, 31 May 2026 15:07:15 +0800
Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?=
 =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?=
 =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Model: prithivMLmods/Omega-Qwen3-Atom-8B
Source: Original Platform
---
 .gitattributes                            |  36 ++++++
 .ipynb_checkpoints/config-checkpoint.json |   3 +
 README.md                                 | 149 ++++++++++++++++++++++
 added_tokens.json                         |  28 ++++
 chat_template.jinja                       |   3 +
 config.json                               |   3 +
 configuration.json                        |   1 +
 generation_config.json                    |  14 ++
 merges.txt                                |   3 +
 model-00001-of-00004.safetensors          |   3 +
 model-00002-of-00004.safetensors          |   3 +
 model-00003-of-00004.safetensors          |   3 +
 model-00004-of-00004.safetensors          |   3 +
 model.safetensors.index.json              |   3 +
 special_tokens_map.json                   |  31 +++++
 tokenizer.json                            |   3 +
 tokenizer_config.json                     |   3 +
 vocab.json                                |   3 +
 18 files changed, 295 insertions(+)
 create mode 100644 .gitattributes
 create mode 100644 .ipynb_checkpoints/config-checkpoint.json
 create mode 100644 README.md
 create mode 100644 added_tokens.json
 create mode 100644 chat_template.jinja
 create mode 100644 config.json
 create mode 100644 configuration.json
 create mode 100644 generation_config.json
 create mode 100644 merges.txt
 create mode 100644 model-00001-of-00004.safetensors
 create mode 100644 model-00002-of-00004.safetensors
 create mode 100644 model-00003-of-00004.safetensors
 create mode 100644 model-00004-of-00004.safetensors
 create mode 100644 model.safetensors.index.json
 create mode 100644 special_tokens_map.json
 create mode 100644 tokenizer.json
 create mode 100644 tokenizer_config.json
 create mode 100644 vocab.json

diff --git a/.gitattributes b/.gitattributes
new file mode 100644
index 0000000..52373fe
--- /dev/null
+++ b/.gitattributes
@@ -0,0 +1,36 @@
+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text
diff --git a/.ipynb_checkpoints/config-checkpoint.json b/.ipynb_checkpoints/config-checkpoint.json
new file mode 100644
index 0000000..2b22722
--- /dev/null
+++ b/.ipynb_checkpoints/config-checkpoint.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:df8e3165afc9d81bc555710e6961bfcf0d7dee87e5cdf6c13ae03c03150510f4
+size 1544
diff --git a/README.md b/README.md
new file mode 100644
index 0000000..bb84f30
--- /dev/null
+++ b/README.md
@@ -0,0 +1,149 @@
+---
+license: apache-2.0
+base_model:
+- Qwen/Qwen3-8B
+datasets:
+- prithivMLmods/Open-Omega-Atom-1.5M
+language:
+- en
+pipeline_tag: text-generation
+library_name: transformers
+tags:
+- text-generation-inference
+- code
+- science
+- 'Thinking: Enabled'
+- math
+- mot
+- moe
+- stem
+---
+
+![11.png](https://cdn-uploads.huggingface.co/production/uploads/65bb837dbfb878f46c77de4c/V26CJSyLm0ixHwNZQLlc_.png)
+
+# **Omega-Qwen3-Atom-8B**
+
+> **Omega-Qwen3-Atom-8B** is a powerful 8B-parameter model fine-tuned from **Qwen3-8B** on the curated **Open-Omega-Atom-1.5M** dataset and optimized for **math and science reasoning**. It excels at symbolic processing, scientific problem-solving, and structured output generation—making it a high-performance model for researchers, educators, and technical developers working in computational and analytical domains.
+
+## **Key Features**
+
+1. **Math & Science-Centric Reasoning**
+   Fine-tuned on the **Open-Omega-Atom-1.5M** dataset, built from high-quality math, science, and symbolic reasoning tasks—ideal for analytical domains including algebra, calculus, physics, and chemistry.
+
+2. **Scientific Concept Breakdown**
+   Explains theories, derivations, and concepts across STEM fields with clarity—solves equations step-by-step, handles formula-based questions, and provides interpretive insights.
+
+3. **Symbolic Computation & Chain-of-Thought**
+   Supports multi-step reasoning, symbolic derivations, and proof-based problem solving with a strong focus on accuracy and transparency.
+
+4. **Structured Output Generation**
+   Outputs precise formats in **LaTeX**, **Markdown**, **JSON**, and **YAML** for scientific writing, educational materials, and data pipeline integration.
+
+5. **Optimized for Efficient Scientific Workflows**
+   While based on an 8B model, it is optimized for **offline inference**, **research clusters**, and **GPU workstations** that need high symbolic precision and performance.
+
+---
+
+## Quick Start with Hugging Face Transformers 🤗
+
+```bash
+pip install transformers huggingface_hub accelerate
+```
+
+```py
+from transformers import AutoModelForCausalLM, AutoTokenizer
+
+model_name = "prithivMLmods/Omega-Qwen3-Atom-8B"
+
+# load the tokenizer and the model
+tokenizer = AutoTokenizer.from_pretrained(model_name)
+model = AutoModelForCausalLM.from_pretrained(
+    model_name,
+    torch_dtype="auto",
+    device_map="auto"
+)
+
+# prepare the model input
+prompt = "A alone can do a piece of work in 6 days and B alone in 8 days. A and B undertook to do it for Rs. 3200. With the help of C, they completed the work in 3 days. How much is to be paid to C?"
+messages = [
+    {"role": "user", "content": prompt}
+]
+text = tokenizer.apply_chat_template(
+    messages,
+    tokenize=False,
+    add_generation_prompt=True,
+    enable_thinking=True # Switches between thinking and non-thinking modes. Default is True.
+)
+model_inputs = tokenizer([text], return_tensors="pt").to(model.device)
+
+# conduct text completion
+generated_ids = model.generate(
+    **model_inputs,
+    max_new_tokens=32768
+)
+output_ids = generated_ids[0][len(model_inputs.input_ids[0]):].tolist() 
+
+# parsing thinking content
+try:
+    # find the last occurrence of token 151668 (</think>); index points just past it
+    index = len(output_ids) - output_ids[::-1].index(151668)
+except ValueError:
+    index = 0
+
+thinking_content = tokenizer.decode(output_ids[:index], skip_special_tokens=True).strip("\n")
+content = tokenizer.decode(output_ids[index:], skip_special_tokens=True).strip("\n")
+
+print("thinking content:", thinking_content)
+print("content:", content)
+```
+
+## Answer
+
+```
+thinking content: <think>
+Okay, let's see. So the problem is about A, B, and C working together to complete a piece of work. We need to figure out how much money C should get for his help. The total payment is Rs. 3200, and we have to divide that among A, B, and C based on their contributions. Let me try to break this down step by step.
+
+First, let's understand the work rates of A and B. A can finish the work in 6 days, so his work rate is 1/6 of the work per day. Similarly, B can finish it in 8 days, so his work rate is 1/8 per day. When they work together, their combined work rate would be 1/6 + 1/8. Let me calculate that:
+
+1/6 + 1/8. To add these, find a common denominator, which is 24. So, 4/24 + 3/24 = 7/24. So together, A and B can do 7/24 of the work in one day.
+
+But the problem says that with the help of C, they completed the work in 3 days. That means all three working together finished the job in 3 days. Let's denote C's work rate as 1/x per day, where x is the number of days C would take alone. So, the combined work rate of A, B, and C is 1/6 + 1/8 + 1/x.
+
+Since they completed the work in 3 days, their combined work rate multiplied by 3 should equal 1 (the whole work). So:
+
+(1/6 + 1/8 + 1/x) * 3 = 1
+
+Let me solve for 1/x first. Let's compute 1/6 + 1/8:
+
+As before, 1/6 is 4/24 and 1/8 is 3/24, so together they are 7/24. So:
+
+(7/24 + 1/x) * 3 = 1
+
+Divide both sides by 3:
+
+7/24 + 1/x = 1/3
+
+Subtract 7/24 from both sides:
+...
+
+$$
+\boxed{400}
+$$
+```
+
+---
+
+## **Intended Use**
+
+* Math and science tutoring, equation solving, and symbolic reasoning
+* Educational tools for high-school to postgraduate-level STEM
+* Research-grade assistant for physics, chemistry, and applied math
+* Structured technical content generator for papers, lab work, and datasets
+* STEM-focused chatbot/API for integration into science education platforms
+
+## **Limitations**
+
+* Not trained for open-domain chat or emotional dialogue
+* May struggle with very large codebases or long multi-part tasks
+* Best suited for STEM fields—general language understanding may vary
+* Prioritizes correctness and formality over conversational tone
\ No newline at end of file
diff --git a/added_tokens.json b/added_tokens.json
new file mode 100644
index 0000000..b54f913
--- /dev/null
+++ b/added_tokens.json
@@ -0,0 +1,28 @@
+{
+  "</think>": 151668,
+  "</tool_call>": 151658,
+  "</tool_response>": 151666,
+  "<think>": 151667,
+  "<tool_call>": 151657,
+  "<tool_response>": 151665,
+  "<|box_end|>": 151649,
+  "<|box_start|>": 151648,
+  "<|endoftext|>": 151643,
+  "<|file_sep|>": 151664,
+  "<|fim_middle|>": 151660,
+  "<|fim_pad|>": 151662,
+  "<|fim_prefix|>": 151659,
+  "<|fim_suffix|>": 151661,
+  "<|im_end|>": 151645,
+  "<|im_start|>": 151644,
+  "<|image_pad|>": 151655,
+  "<|object_ref_end|>": 151647,
+  "<|object_ref_start|>": 151646,
+  "<|quad_end|>": 151651,
+  "<|quad_start|>": 151650,
+  "<|repo_name|>": 151663,
+  "<|video_pad|>": 151656,
+  "<|vision_end|>": 151653,
+  "<|vision_pad|>": 151654,
+  "<|vision_start|>": 151652
+}
diff --git a/chat_template.jinja b/chat_template.jinja
new file mode 100644
index 0000000..4240724
--- /dev/null
+++ b/chat_template.jinja
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8428c815ac94d82064e35ff1e841dcbe260e7e53a8d0bd3b94afa2eefa9bccab
+size 4761
diff --git a/config.json b/config.json
new file mode 100644
index 0000000..2b22722
--- /dev/null
+++ b/config.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:df8e3165afc9d81bc555710e6961bfcf0d7dee87e5cdf6c13ae03c03150510f4
+size 1544
diff --git a/configuration.json b/configuration.json
new file mode 100644
index 0000000..159097f
--- /dev/null
+++ b/configuration.json
@@ -0,0 +1 @@
+{"framework": "pytorch", "task": "others", "allow_remote": true}
\ No newline at end of file
diff --git a/generation_config.json b/generation_config.json
new file mode 100644
index 0000000..20ea1d4
--- /dev/null
+++ b/generation_config.json
@@ -0,0 +1,14 @@
+{
+  "bos_token_id": 151643,
+  "do_sample": true,
+  "eos_token_id": [
+    151645,
+    151643
+  ],
+  "max_length": 40960,
+  "pad_token_id": 151654,
+  "temperature": 0.6,
+  "top_k": 20,
+  "top_p": 0.95,
+  "transformers_version": "4.53.2"
+}
diff --git a/merges.txt b/merges.txt
new file mode 100644
index 0000000..80c1a19
--- /dev/null
+++ b/merges.txt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5
+size 1671853
diff --git a/model-00001-of-00004.safetensors b/model-00001-of-00004.safetensors
new file mode 100644
index 0000000..de414a4
--- /dev/null
+++ b/model-00001-of-00004.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:27749f26af5726ea0a8b0d5b351799894139d8f28177082d39a4639228d8e25b
+size 4902257696
diff --git a/model-00002-of-00004.safetensors b/model-00002-of-00004.safetensors
new file mode 100644
index 0000000..4705b64
--- /dev/null
+++ b/model-00002-of-00004.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ceac8f69981d4620fee682589baf1717f2339b09faf523b81c35b29d599d976b
+size 4915960368
diff --git a/model-00003-of-00004.safetensors b/model-00003-of-00004.safetensors
new file mode 100644
index 0000000..e8f3a98
--- /dev/null
+++ b/model-00003-of-00004.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a440e450b4d5028a6b98978446ac4344caa6038dcd3f3d6c8edcefcf9fa1bc8c
+size 4983068496
diff --git a/model-00004-of-00004.safetensors b/model-00004-of-00004.safetensors
new file mode 100644
index 0000000..ceab387
--- /dev/null
+++ b/model-00004-of-00004.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dbc55767196444fb9ee9c2165843c3682939389861a9ad298532ecc59279ab66
+size 1580230264
diff --git a/model.safetensors.index.json b/model.safetensors.index.json
new file mode 100644
index 0000000..5368f15
--- /dev/null
+++ b/model.safetensors.index.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3649bb967710edc0f995e3839a363a069482a1688216f87745248966751d0221
+size 32878
diff --git a/special_tokens_map.json b/special_tokens_map.json
new file mode 100644
index 0000000..9b8043f
--- /dev/null
+++ b/special_tokens_map.json
@@ -0,0 +1,31 @@
+{
+  "additional_special_tokens": [
+    "<|im_start|>",
+    "<|im_end|>",
+    "<|object_ref_start|>",
+    "<|object_ref_end|>",
+    "<|box_start|>",
+    "<|box_end|>",
+    "<|quad_start|>",
+    "<|quad_end|>",
+    "<|vision_start|>",
+    "<|vision_end|>",
+    "<|vision_pad|>",
+    "<|image_pad|>",
+    "<|video_pad|>"
+  ],
+  "eos_token": {
+    "content": "<|im_end|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<|vision_pad|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}
diff --git a/tokenizer.json b/tokenizer.json
new file mode 100644
index 0000000..cd71f61
--- /dev/null
+++ b/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
+size 11422654
diff --git a/tokenizer_config.json b/tokenizer_config.json
new file mode 100644
index 0000000..b256dac
--- /dev/null
+++ b/tokenizer_config.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e79a6c814467077aef847b2c307435a3d434ef3211f5266922827d9e56246b07
+size 5431
diff --git a/vocab.json b/vocab.json
new file mode 100644
index 0000000..6c49fc6
--- /dev/null
+++ b/vocab.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910
+size 2776833