commit c399453fa4a417dc309a15dd4a3d47cb60c343b5 Author: ModelHub XC Date: Tue May 26 22:11:12 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: smirki/UIGEN-FX-4B-STG-Modal-08-28 Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..d2fc868 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,51 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bin.* filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zstandard filter=lfs diff=lfs merge=lfs -text +*.tfevents* filter=lfs diff=lfs merge=lfs -text +*.db* filter=lfs diff=lfs merge=lfs -text +*.ark* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.gguf* filter=lfs diff=lfs merge=lfs -text +*.ggml filter=lfs diff=lfs merge=lfs -text +*.llamafile* filter=lfs diff=lfs merge=lfs -text +*.pt2 filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text + +merges.txt filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text +vocab.json filter=lfs diff=lfs merge=lfs -text \ No newline at end of file diff --git a/README.md b/README.md new file mode 100644 index 0000000..417b88d --- /dev/null +++ b/README.md @@ -0,0 +1,21 @@ +--- +base_model: unsloth/qwen3-4b-instruct-2507-unsloth-bnb-4bit +tags: +- text-generation-inference +- transformers +- unsloth +- qwen3 +license: apache-2.0 +language: +- en +--- + +# Uploaded finetuned model + +- **Developed by:** smirki +- **License:** apache-2.0 +- **Finetuned from model :** unsloth/qwen3-4b-instruct-2507-unsloth-bnb-4bit + +This qwen3 model was trained 2x faster with [Unsloth](https://github.com/unslothai/unsloth) and Huggingface's TRL library. + +[](https://github.com/unslothai/unsloth) diff --git a/added_tokens.json b/added_tokens.json new file mode 100644 index 0000000..b54f913 --- /dev/null +++ b/added_tokens.json @@ -0,0 +1,28 @@ +{ + "": 151668, + "": 151658, + "": 151666, + "": 151667, + "": 151657, + "": 151665, + "<|box_end|>": 151649, + "<|box_start|>": 151648, + "<|endoftext|>": 151643, + "<|file_sep|>": 151664, + "<|fim_middle|>": 151660, + "<|fim_pad|>": 151662, + "<|fim_prefix|>": 151659, + "<|fim_suffix|>": 151661, + "<|im_end|>": 151645, + "<|im_start|>": 151644, + "<|image_pad|>": 151655, + "<|object_ref_end|>": 151647, + "<|object_ref_start|>": 151646, + "<|quad_end|>": 151651, + "<|quad_start|>": 151650, + "<|repo_name|>": 151663, + "<|video_pad|>": 151656, + "<|vision_end|>": 151653, + "<|vision_pad|>": 151654, + "<|vision_start|>": 151652 +} diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000..465e19f --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,289 @@ +{% if 'role' in messages[0] %} +{%- if tools %} + {{- '<|im_start|>system +' }} + {%- if messages[0].role == 'system' %} + {{- messages[0].content + ' + +' }} + {%- endif %} + {{- "# Tools + +You may call one or more functions to assist with the user query. + +You are provided with function signatures within XML tags: +" }} + {%- for tool in tools %} + {{- " +" }} + {{- tool | tojson }} + {%- endfor %} + {{- " + + +For each function call, return a json object with function name and arguments within XML tags: + +{\"name\": , \"arguments\": } +<|im_end|> +" }} +{%- else %} + {%- if messages[0].role == 'system' %} + {{- '<|im_start|>system +' + messages[0].content + '<|im_end|> +' }} + {%- endif %} +{%- endif %} +{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %} +{%- for forward_message in messages %} + {%- set index = (messages|length - 1) - loop.index0 %} + {%- set message = messages[index] %} + {%- set current_content = message.content if message.content is not none else '' %} + {%- set tool_start = '' %} + {%- set tool_start_length = tool_start|length %} + {%- set start_of_message = current_content[:tool_start_length] %} + {%- set tool_end = '' %} + {%- set tool_end_length = tool_end|length %} + {%- set start_pos = (current_content|length) - tool_end_length %} + {%- if start_pos < 0 %} + {%- set start_pos = 0 %} + {%- endif %} + {%- set end_of_message = current_content[start_pos:] %} + {%- if ns.multi_step_tool and message.role == "user" and not(start_of_message == tool_start and end_of_message == tool_end) %} + {%- set ns.multi_step_tool = false %} + {%- set ns.last_query_index = index %} + {%- endif %} +{%- endfor %} +{%- for message in messages %} + {%- if (message.role == "user") or (message.role == "system" and not loop.first) %} + {{- '<|im_start|>' + message.role + ' +' + message.content + '<|im_end|>' + ' +' }} + {%- elif message.role == "assistant" %} + {%- set content = message.content %} + {%- set reasoning_content = '' %} + {%- if message.reasoning_content is defined and message.reasoning_content is not none %} + {%- set reasoning_content = message.reasoning_content %} + {%- else %} + {%- if '' in message.content %} + {%- set content = (message.content.split('')|last).lstrip(' +') %} + {%- set reasoning_content = (message.content.split('')|first).rstrip(' +') %} + {%- set reasoning_content = (reasoning_content.split('')|last).lstrip(' +') %} + {%- endif %} + {%- endif %} + {%- if loop.index0 > ns.last_query_index %} + {%- if loop.last or (not loop.last and reasoning_content) %} + {{- '<|im_start|>' + message.role + ' + +' + reasoning_content.strip(' +') + ' + + +' + content.lstrip(' +') }} + {%- else %} + {{- '<|im_start|>' + message.role + ' +' + content }} + {%- endif %} + {%- else %} + {{- '<|im_start|>' + message.role + ' +' + content }} + {%- endif %} + {%- if message.tool_calls %} + {%- for tool_call in message.tool_calls %} + {%- if (loop.first and content) or (not loop.first) %} + {{- ' +' }} + {%- endif %} + {%- if tool_call.function %} + {%- set tool_call = tool_call.function %} + {%- endif %} + {{- ' +{"name": "' }} + {{- tool_call.name }} + {{- '", "arguments": ' }} + {%- if tool_call.arguments is string %} + {{- tool_call.arguments }} + {%- else %} + {{- tool_call.arguments | tojson }} + {%- endif %} + {{- '} +' }} + {%- endfor %} + {%- endif %} + {{- '<|im_end|> +' }} + {%- elif message.role == "tool" %} + {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %} + {{- '<|im_start|>user' }} + {%- endif %} + {{- ' + +' }} + {{- message.content }} + {{- ' +' }} + {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %} + {{- '<|im_end|> +' }} + {%- endif %} + {%- endif %} +{%- endfor %} +{%- if add_generation_prompt %} + {{- '<|im_start|>assistant +' }} + {%- if enable_thinking is defined and enable_thinking is false %} + {{- ' + + + +' }} + {%- endif %} +{%- endif %} +{% else %} +{%- if tools %} + {{- '<|im_start|>system +' }} + {%- if messages[0].role == 'system' %} + {{- messages[0].content + ' + +' }} + {%- endif %} + {{- "# Tools + +You may call one or more functions to assist with the user query. + +You are provided with function signatures within XML tags: +" }} + {%- for tool in tools %} + {{- " +" }} + {{- tool | tojson }} + {%- endfor %} + {{- " + + +For each function call, return a json object with function name and arguments within XML tags: + +{\"name\": , \"arguments\": } +<|im_end|> +" }} +{%- else %} + {%- if messages[0].role == 'system' %} + {{- '<|im_start|>system +' + messages[0].content + '<|im_end|> +' }} + {%- endif %} +{%- endif %} +{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %} +{%- for forward_message in messages %} + {%- set index = (messages|length - 1) - loop.index0 %} + {%- set message = messages[index] %} + {%- set current_content = message.content if message.content is not none else '' %} + {%- set tool_start = '' %} + {%- set tool_start_length = tool_start|length %} + {%- set start_of_message = current_content[:tool_start_length] %} + {%- set tool_end = '' %} + {%- set tool_end_length = tool_end|length %} + {%- set start_pos = (current_content|length) - tool_end_length %} + {%- if start_pos < 0 %} + {%- set start_pos = 0 %} + {%- endif %} + {%- set end_of_message = current_content[start_pos:] %} + {%- if ns.multi_step_tool and message.role == "user" and not(start_of_message == tool_start and end_of_message == tool_end) %} + {%- set ns.multi_step_tool = false %} + {%- set ns.last_query_index = index %} + {%- endif %} +{%- endfor %} +{%- for message in messages %} + {%- if (message.role == "user") or (message.role == "system" and not loop.first) %} + {{- '<|im_start|>' + message.role + ' +' + message.content + '<|im_end|>' + ' +' }} + {%- elif message.role == "assistant" %} + {%- set content = message.content %} + {%- set reasoning_content = '' %} + {%- if message.reasoning_content is defined and message.reasoning_content is not none %} + {%- set reasoning_content = message.reasoning_content %} + {%- else %} + {%- if '' in message.content %} + {%- set content = (message.content.split('')|last).lstrip(' +') %} + {%- set reasoning_content = (message.content.split('')|first).rstrip(' +') %} + {%- set reasoning_content = (reasoning_content.split('')|last).lstrip(' +') %} + {%- endif %} + {%- endif %} + {%- if loop.index0 > ns.last_query_index %} + {%- if loop.last or (not loop.last and reasoning_content) %} + {{- '<|im_start|>' + message.role + ' + +' + reasoning_content.strip(' +') + ' + + +' + content.lstrip(' +') }} + {%- else %} + {{- '<|im_start|>' + message.role + ' +' + content }} + {%- endif %} + {%- else %} + {{- '<|im_start|>' + message.role + ' +' + content }} + {%- endif %} + {%- if message.tool_calls %} + {%- for tool_call in message.tool_calls %} + {%- if (loop.first and content) or (not loop.first) %} + {{- ' +' }} + {%- endif %} + {%- if tool_call.function %} + {%- set tool_call = tool_call.function %} + {%- endif %} + {{- ' +{"name": "' }} + {{- tool_call.name }} + {{- '", "arguments": ' }} + {%- if tool_call.arguments is string %} + {{- tool_call.arguments }} + {%- else %} + {{- tool_call.arguments | tojson }} + {%- endif %} + {{- '} +' }} + {%- endfor %} + {%- endif %} + {{- '<|im_end|> +' }} + {%- elif message.role == "tool" %} + {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %} + {{- '<|im_start|>user' }} + {%- endif %} + {{- ' + +' }} + {{- message.content }} + {{- ' +' }} + {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %} + {{- '<|im_end|> +' }} + {%- endif %} + {%- endif %} +{%- endfor %} +{%- if add_generation_prompt %} + {{- '<|im_start|>assistant +' }} + {%- if enable_thinking is defined and enable_thinking is false %} + {{- ' + + + +' }} + {%- endif %} +{%- endif %} +{% endif %} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000..a2919ea --- /dev/null +++ b/config.json @@ -0,0 +1,70 @@ +{ + "architectures": [ + "Qwen3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "eos_token_id": 151645, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 2560, + "initializer_range": 0.02, + "intermediate_size": 9728, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 262144, + "max_window_layers": 36, + "model_type": "qwen3", + "num_attention_heads": 32, + "num_hidden_layers": 36, + "num_key_value_heads": 8, + "pad_token_id": 151654, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 5000000, + "sliding_window": null, + "tie_word_embeddings": true, + "torch_dtype": "bfloat16", + "transformers_version": "4.55.4", + "unsloth_fixed": true, + "unsloth_version": "2025.8.9", + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151936 +} \ No newline at end of file diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..bbeeda1 --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework": "pytorch", "task": "text-generation", "allow_remote": true} \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..e8c0b71 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,14 @@ +{ + "bos_token_id": 151643, + "do_sample": true, + "eos_token_id": [ + 151645, + 151643 + ], + "max_length": 262144, + "pad_token_id": 151654, + "temperature": 0.7, + "top_k": 20, + "top_p": 0.8, + "transformers_version": "4.55.4" +} diff --git a/inference_samples/step_0/cattle_ranch.txt b/inference_samples/step_0/cattle_ranch.txt new file mode 100644 index 0000000..c2c689b --- /dev/null +++ b/inference_samples/step_0/cattle_ranch.txt @@ -0,0 +1,403 @@ +Prompt: make a website for a cattle ranch +Generated at step: 0 +Timestamp: 2025-08-28T08:50:16.847881 +============================================================ + +Absolutely! Here's a complete, professional **website concept and structure** for a cattle ranch — designed to be functional, trustworthy, and appealing to farmers, investors, buyers, and local communities. + +--- + +# 🌿 Welcome to **Sunset Ridge Ranch** + +*Where Nature Meets Tradition – Cattle Grazing, Sustainable Farming & Community Growth* + +--- + +## ✅ Website Structure (HTML/CSS/JS Framework) + +We’ll build this as a responsive, mobile-friendly site using modern web standards. Below is the full content layout with suggested design elements. + +--- + +### 📝 1. Homepage (`index.html`) + +```html + + + + + + Sunset Ridge Ranch | Premium Cattle & Sustainable Ranching + + + + + + + + + +
+
+

Sunset Ridge Ranch

+

Family-owned since 1932. Sustainably managed pasture-raised cattle. Healthy animals. Responsible land stewardship.

+ Schedule a Visit +
+
+ + +
+
+

About Our Ranch

+
+
+

Our Story

+

Founded in 1932 by James Whitaker, Sunset Ridge Ranch has been raising healthy, grass-fed beef using traditional methods passed down through generations.

+
+
+

Land Stewardship

+

We manage over 12,000 acres of native grasslands, restoring ecosystems through rotational grazing and native plant reseeding.

+
+
+

Community Focus

+

Every year, we host youth education programs, farm tours, and support local schools and food cooperatives.

+
+
+
+
+ + +
+
+

Our Cattle Herd

+
+
+

Brahma Bulls

+

Strong, resilient, excellent milkers. Used for breeding and cross-breeding.

+
+
+

Hereford Steers

+

Fat-tailed, well-suited for winter feeding and high-quality meat production.

+
+
+

Angus Heifers

+

Grass-fed, hormone-free, raised with natural forage. Ideal for premium beef markets.

+
+
+
+
+ + +
+
+

Our Services

+
+
+

Cattle Sales

+

Premium quality stock available for purchase or auction. Contact us to schedule a viewing.

+
+
+

Consultation

+

Need help managing your herd? We offer expert advice on nutrition, health, and pasture rotation.

+
+
+

Beef Processing Partnerships

+

Partner with our certified processors to deliver high-quality, traceable beef products.

+
+
+
+
+ + +
+
+

Get In Touch

+
+
+ + +
+
+ + +
+
+ + +
+ +
+
+
+ + + + + + +``` + +--- + +## 🔧 Features & Best Practices + +| Feature | Why It Matters | +|---------------------------|---------------| +| Responsive Design | Works on phones, tablets, desktops | +| Mobile-first Layout | Most users access via phone | +| Clean Typography | Readable and professional | +| Image Background (CSS) | Subtle, nature-themed visuals without heavy load | +| Clear CTAs | "Schedule a Visit", "Contact Us" | +| Trust Elements | "Family-Owned", "Sustainable", "Traceable" | +| Sections for SEO | Each section can be optimized for Google | + +--- + +## 💡 Recommended Additions (Later) + +1. **Gallery Page**: High-res photos of cattle, pastures, family members. +2. **Blog Section**: Articles like “Rotational Grazing Explained” or “The Benefits of Grass-Fed Beef” +3. **Investor Page**: For those interested in buying land or equity. +4. **Live Feed Dashboard (Optional)**: Real-time stats on animal count, feed usage, etc. +5. **Booking System**: For farm tours or private viewings. + +--- + +## 🖼️ Visual Assets You Should Include + +- Background images: Rolling hills, grazing cattle, sunrise over range +- Icons: Cattle, sheep, watering trough, map pin, calendar +- Brand Colors: + - Green (#4CAF50): Natural, growth, sustainability + - Earth Tones: Brown, tan, sage green + +--- + +## 🚀 How to Deploy This Site + +1. Save as `index.html` +2. Host it on any free hosting service: + - [GitHub Pages](https://pages.github.com/) + - [Netlify](https://www.netlify.com/) + - [Vercel](https://vercel.com/) +3. Upload files in `/public` folder or use domain (e.g., `sunsetridgeranch.com`) + +--- + +## Example Domain Suggestions + +- sunsetridgeranch.com +- sunrideranch.com +- westcoastcattle.com +- verdantgrazewest.com + +*(Choose one that sounds authentic and memorable)* + +--- + +Would you like me to: + +✅ Generate a full version with actual images and assets (can be added later)? +✅ Create a WordPress version (easy to manage)? +✅ Build a brochure or pitch deck to go along with the website? + +Let me know — I’d love to help you launch your ranch online successfully! + +🌾 *Success starts with visibility.* Let’s grow together. 🐄💚 \ No newline at end of file diff --git a/inference_samples/step_0/coffee_shop.txt b/inference_samples/step_0/coffee_shop.txt new file mode 100644 index 0000000..79aa8b3 --- /dev/null +++ b/inference_samples/step_0/coffee_shop.txt @@ -0,0 +1,979 @@ +Prompt: make the best coffee shop website you can in html css js +Generated at step: 0 +Timestamp: 2025-08-28T08:50:16.844959 +============================================================ + +Absolutely! Here's a **complete, modern, responsive, and interactive coffee shop website** built with **HTML, CSS, and JavaScript (vanilla)** — no frameworks or external libraries. It includes: + +- A sleek, minimalist design inspired by premium coffee shops +- Responsive layout (mobile-friendly) +- Interactive features: + - Menu toggle + - Cart functionality (add/remove items, calculate total) + - Dark/light mode switch + - Smooth animations & transitions +- Smooth scroll & hover effects +- Local storage for cart persistence + +--- + +## ✅ How to Use This: +1. Copy all code below into a single file named `index.html` +2. Save it locally and open in your browser. +3. Optionally add a real image path for better visuals. + +--- + +```html + + + + + + Bean Haven | Premium Coffee Experience + + + + + + + + +
+ +
+ + +
+
+

Welcome to Bean Haven

+

Handcrafted espresso, organic beans, and a warm atmosphere where every cup tells a story.

+ +
+
+ + +
+

Why Choose Us?

+
+
+
+

Craftsmanship

+

We roast our beans in small batches using traditional methods for rich flavor and aroma.

+
+
+
🌱
+

Sustainable Beans

+

All our beans are ethically sourced from sustainable farms around the world.

+
+
+
🔥
+

Expert Baristas

+

Our baristas are trained in precision pour-over and latte art techniques.

+
+
+
+ + + + + +
+
+

Your Order

+ +
+
+
+ Total: $0.00 +
+ +
+ + +
+ +
+ + + + + + + + +``` + +--- + +## 🚀 What’s Included? + +✅ **Dark/Light Mode** – Toggle via button at top +✅ **Responsive Layout** – Works on mobile, tablet, desktop +✅ **Interactive Menu Tabs** – Filter drinks by category +✅ **Shopping Cart** – Adds/removes items, totals sum, persists in localStorage +✅ **Smooth Animations & Transitions** – Fade-ins, hover effects +✅ **Scroll to Top Button** – Appears when scrolled down +✅ **Fully Self-Contained** – No external dependencies (no jQuery, React, etc.) +✅ **SEO-Friendly** – Semantic HTML structure +✅ **Accessible** – Keyboard navigation & screen reader support + +--- + +## 🔧 Want More? +You can extend this by adding: +- User login / order history +- Payment integration (Stripe API later) +- Search filter +- Image gallery per drink +- Booking system + +--- + +Let me know if you'd like a **version with React**, **TailwindCSS**, or **hosted on Vercel/Netlify**! + +Enjoy brewing success ☕✨ 💡 \ No newline at end of file diff --git a/inference_samples/step_0/cyber_dog_cafe.txt b/inference_samples/step_0/cyber_dog_cafe.txt new file mode 100644 index 0000000..6e0045c --- /dev/null +++ b/inference_samples/step_0/cyber_dog_cafe.txt @@ -0,0 +1,106 @@ +Prompt: make a cyber dog cafe +Generated at step: 0 +Timestamp: 2025-08-28T08:50:16.846430 +============================================================ + +Absolutely! Here's a fun, immersive concept for **"Cyber Dog Cafe"** — a futuristic, tech-savvy coffee shop with a twist of cyberpunk and canine charm. Perfect for fans of sci-fi, anime, or just a quirky break from the ordinary. + +--- + +## 🚀 Cyber Dog Café – Where Barks Meet Bits + +### 🏷️ Concept Overview +A high-tech, neon-drenched café that blends retro-futurism with robotic canines, AI baristas, and digital pet culture. Think *cyberpunk meets puppy love* — where your morning brew is served by a holographic poodle, and your loyalty rewards are earned through "digital barking." + +--- + +## 🌆 Atmosphere & Design +- **Ambient Vibe**: Glitchy neon lights, holographic murals of dogs in space, floating pixelated tails. +- **Color Palette**: Electric blue, deep purple, glowing pink, and black — like a digital sunset over Tokyo. +- **Soundtrack**: Chill lo-fi beats mixed with soft barks, chimes, and subtle synth melodies. +- **Furniture**: Futuristic stools shaped like robot pups; tables with built-in Wi-Fi charging pads. + +> “Every corner hums with a different dog’s heartbeat.” — Café Tagline + +--- + +## 🐾 The Menu (Tech-Powered Brews) + +| Drink | Description | +|-------|------------| +| **Neon Nuzzle Latte** | A warm oat milk latte with glow-in-the-dark cocoa powder. Served in a ceramic mug with a tiny LED tail flicker when stirred. | +| **Bark & Byte Frappuccino** | Iced blended drink with matcha, raspberry, and a dash of server-side espresso foam. Comes with a QR code to unlock a virtual pet dog. | +| **Glitch Pup Cappuccino** | A cold brew with micro-dosed caffeine + nano-particles that spark gently on the surface. Leaves a trail of digital paw prints on your cup. | +| **AI Bark Tea** | A hot herbal blend infused with machine-learning-infused chamomile. “Tastes like peace,” says 73% of customers. | + +--- + +## 🤖 Staff & Features + +### AI Baristas (Dogs in Hologram) +Each barista is a real-life AI companion trained as a robotic dog. They greet you with: +- “Paw-sitive!” +- “Bark-activated access granted.” +- “Your order is ready… *or is it?* (checks system)” + +They can place orders via voice, gesture, or thought (via neural interface headset). + +### Loyalty Program: “The Canine Chain” +- Earn **bark points** for every visit. +- Spend points to unlock: + - Virtual dog avatars in augmented reality + - Digital dog park memberships (play in the city skyline) + - Exclusive limited-edition drinks named after famous cyber-dog memes (e.g., “Fluff the Faux”) + +--- + +## 🐶 Special Features + +1. **Digital Pet Corner** + - Bring your real dog to the café → get a digital twin using AR glasses. + - Your dog appears in the lobby as a 3D projection. + +2. **Dog Memory Vault** + - Scan your pet’s photo → upload to a secure cloud vault. + - Every 30 days, the café generates a new "digital memory" (like a video of them playing fetch in the future). + +3. **Robo-Dog Therapy Sessions** + - 15-minute sessions with AI therapy dogs programmed to reduce anxiety. + - Uses biofeedback sensors to adjust tone based on human stress levels. + +4. **“Bark-to-Brew” Experience** + - Use your smartphone to record a bark (even if it’s just a snort), then the AI matches it to a custom drink recipe. + +--- + +## 🚨 Hidden Tech Features + +- **Wi-Fi Name**: `pawssive.net` +- **App Integration**: Download “PawConnect” app to track your digital dog’s journey across the city. +- **Sustainability Angle**: All cups are compostable bioplastic with embedded NFC tags for dog-friendly recycling. + +--- + +## 🎬 Marketing Taglines + +> *"Where your dog goes, your future comes."* +> *"One bark, one byte, one happy customer."* +> *"Not all cafes serve coffee. This one serves connection."* + +--- + +## Bonus: Real-Life Version Ideas +If you want to open one: +- Partner with pet tech startups or smart home brands. +- Host monthly events: “Cyber Dog Dance Party” or “Pet AI Meetups”. +- Offer free drinks for pets with microchips registered in the city database. + +--- + +🎉 Would you like this expanded into a full business plan, a pitch deck, a social media campaign, or even a short animated ad script? + +Let me know — I’d love to help bring *Cyber Dog Café* to life in any format! 🐕⚡☕ + +--- + +P.S. Imagine walking in and seeing a golden retriever-shaped drone serving you a cup of tea while a squirrel robot plays chess in the corner. That’s the vibe. 🔮🐶💻 \ No newline at end of file diff --git a/inference_samples/step_0/kpmg.txt b/inference_samples/step_0/kpmg.txt new file mode 100644 index 0000000..41fd938 --- /dev/null +++ b/inference_samples/step_0/kpmg.txt @@ -0,0 +1,234 @@ +Prompt: make a website for kpmg +Generated at step: 0 +Timestamp: 2025-08-28T08:50:16.848713 +============================================================ + +Creating a full website for **KPMG** (one of the world's largest professional services firms) requires careful planning, design, and content strategy to reflect its global brand, expertise, and services. Below is a complete **concept and structure** you can use to build or develop a professional KPMG website. + +--- + +# 🌐 KPMG Official Website Concept + +> *Note: This is not an actual live site — this is a comprehensive blueprint designed for developers, designers, or digital marketing teams to create a real-world KPMG-branded website.* + +--- + +## 🔍 Website Overview + +**Name:** [KPMG.com](https://www.kpmg.com) +**Purpose:** A globally accessible, responsive, secure, and user-friendly platform that showcases KPMG’s services, expertise, regions, careers, sustainability efforts, thought leadership, and client support. + +**Target Audience:** +- Businesses & enterprises seeking audit, tax, advisory, and consulting services +- Professionals looking for career opportunities +- Investors, government entities, and nonprofit organizations + +**Core Values:** Integrity, Innovation, Inclusion, Excellence, Sustainability + +--- + +## 🎯 Key Objectives + +1. Build trust through transparency and credibility +2. Showcase global reach with localized experiences +3. Enable easy navigation across 150+ countries +4. Highlight sustainability and ESG initiatives +5. Offer clear pathways for clients and job seekers + +--- + +## 📚 Site Structure (Sitemap) + +``` +Home +│ +├── About Us +│ ├── Our Firm +│ ├── Leadership +│ ├── Commitment to Integrity +│ └── Our People +│ +├── Services +│ ├── Audit & Assurance +│ ├── Tax +│ ├── Advisory +│ ├── Legal & Regulatory +│ ├── Sustainable Finance +│ ├── Risk & Compliance +│ └── Digital Transformation +│ +├── Industries +│ ├── Financial Services +│ ├── Healthcare +│ ├── Manufacturing +│ ├── Retail & Consumer +│ ├── Technology & AI +│ └── Public Sector +│ +├── Regions / Locations +│ ├── Global Offices +│ ├── Asia-Pacific +│ ├── Europe +│ ├── Americas +│ └── Middle East & Africa +│ +├── Careers +│ ├── Find a Job +│ ├── Join Our Team +│ ├── Diversity & Inclusion +│ └── Student Programs +│ +├── Insights & Thought Leadership +│ ├── Reports & Publications +│ ├── Podcasts & Videos +│ ├── Webinars +│ └── Industry Trends +│ +├── Sustainability & ESG +│ ├── Climate Action Plan +│ ├── Carbon Neutrality Goals +│ ├── Social Responsibility +│ └── Green Finance Initiatives +│ +├── Resources +│ ├── Client Tools +│ ├── Guides & White Papers +│ ├── Newsroom +│ └── Events Calendar +│ +└── Contact + ├── Contact by Region + ├── Get in Touch + └── Emergency & Media Relations +``` + +--- + +## ✅ Design Principles + +| Element | Specification | +|-------|---------------| +| **Brand Colors** | Deep blue (#003B7A), white, grey, accent green (#2ECC71) | +| **Typography** | Clean, modern sans-serif (e.g., Inter, Helvetica Neue) | +| **Layout** | Responsive (mobile-first), minimal, trustworthy UI | +| **Imagery** | Professional, diverse team shots, real-world scenarios, data visualizations | +| **Accessibility** | WCAG 2.1 AA compliant (screen reader support, contrast ratios) | + +--- + +## 🖼️ Homepage Content Highlights + +1. **Hero Section** + - Headline: *"Delivering Value Through Trust, Innovation & Integrity"* + - Subheadline: "We help businesses thrive — from financial strength to sustainable growth." + - CTA Buttons: “Explore Services” | “Find a Local Office” | “Join Our Team” + +2. **Key Service Highlights (Cards)** + - Audit & Assurance + - Tax Strategy + - Sustainability Consulting + - M&A Advisory + +3. **Global Reach Visual** + - Interactive map showing offices in over 150 countries + +4. **Client Testimonials** + - Real quotes from CEOs, CFOs, and leaders + +5. **News & Updates Banner** + - Latest insights, press releases, events + +6. **Footer Navigation** + - Quick links + Contact + Privacy Policy + Cookie Notice + +--- + +## 💡 Unique Features to Include + +✅ **Interactive Regional Selector** +Users pick region → auto-show local services, office locations, and language options + +✅ **AI-Powered Search Bar** +Search for services, industries, or experts using natural language + +✅ **Carbon Footprint Tracker Tool** +For clients interested in ESG reporting – shows how KPMG helps measure emissions + +✅ **Career Match Engine** +Allows users to filter jobs by industry, location, experience level, values (diversity, remote work, etc.) + +✅ **Live Webinar Scheduler** +Schedule and attend free webinars on topics like “ESG Compliance” or “Future of Auditing” + +--- + +## 🔒 Security & Compliance + +- GDPR-compliant data handling +- SOC 2 Type II certified (for service delivery) +- SSL encryption enabled +- Secure login for client portals and employee dashboards + +--- + +## 🚀 Development Recommendations + +### Tech Stack Suggestion: + +| Layer | Recommendation | +|--------------|----------------| +| Frontend | React.js + Next.js (with TypeScript) | +| Backend | Node.js / .NET Core (scalable APIs) | +| CMS | Strapi or WordPress (for content management) | +| Hosting | AWS or Azure (global CDN + edge caching) | +| SEO | Google Search Console + Schema.org markup | +| Analytics | Google Analytics 4 + Hotjar (user behavior tracking) | + +--- + +## 📢 Sample Page Copy (About Us) + +> **Our Promise to You** +> At KPMG, we believe every business deserves more than just advice—we deliver solutions rooted in integrity, innovation, and long-term value. With over 280,000 professionals across 150 countries, we partner with leaders worldwide to navigate complexity, reduce risk, and unlock growth—through transparency, technology, and human insight. + +> From helping companies achieve net-zero emissions to advising governments on digital transformation, our people bring deep expertise and empathy to every engagement. + +--- + +## 📣 How to Build It? + +If you're building this as a project: + +1. **Register Domain**: Use `kpmg.com` (or `kpmg.global`) +2. **Secure SSL Certificate** via Let’s Encrypt or Cloudflare +3. **Design Wireframes** using Figma/Adobe XD +4. **Develop MVP** (Minimum Viable Product) with core pages first +5. **Test UX/UI** with real users (clients, employees, job seekers) +6. **Launch in Phases**: Start with homepage, then expand to services, careers, and regions +7. **Add Multilingual Support** (English, French, Spanish, Mandarin, Hindi, Arabic, etc.) + +--- + +## Want This Turned Into a Live Website? + +I can help further by: +- Creating a fully functional **HTML/CSS/JS prototype** (static version) +- Writing SEO-optimized content for each page +- Providing sample copywriting for blogs, landing pages, and ads +- Suggesting AI tools to automate content updates +- Recommending integration with LinkedIn, X (Twitter), or YouTube for social presence + +--- + +Would you like me to generate: + +✅ A **sample HTML prototype** of the homepage? +✅ A list of **SEO titles and meta descriptions** for each page? +✅ Sample blog post ideas for "Insights & Thought Leadership"? +✅ A downloadable PDF version of this guide? + +Let me know what you'd like next! 👨‍💻✨ + +--- + +*This concept aligns with KPMG’s official branding and mission while being scalable and future-ready.* \ No newline at end of file diff --git a/inference_samples/step_0/steves_tech_repair.txt b/inference_samples/step_0/steves_tech_repair.txt new file mode 100644 index 0000000..e4c1f7e --- /dev/null +++ b/inference_samples/step_0/steves_tech_repair.txt @@ -0,0 +1,490 @@ +Prompt: Make a website for steve's tech repair shop. +Generated at step: 0 +Timestamp: 2025-08-28T08:50:16.842072 +============================================================ + +Sure! Here's a complete, ready-to-use **website concept and code** for **Steve’s Tech Repair Shop** — designed to be clean, professional, mobile-friendly, and user-focused. + +--- + +# 🎯 Steve’s Tech Repair Shop – Website (HTML/CSS/JS) + +This is a fully functional static website you can copy into an `index.html` file or deploy on platforms like Netlify, Vercel, or GitHub Pages. + +--- + +## ✅ Features Included: +- Responsive design (mobile & desktop) +- Navigation menu +- Services section +- About Steve +- Contact form +- Testimonials +- Footer with social links + +--- + +### 💻 Copy-Paste Code: `index.html` + +```html + + + + + + Steve's Tech Repair Shop + + + + + +
+ +
+ + +
+
+

Steve’s Tech Repair Shop

+

Your Trusted Partner for Phone, Laptop, and Device Repairs

+
+
+ + +
+
+

Our Services

+
+
+

Laptop Repair

+

We fix broken screens, slow performance, overheating, and software issues.

+
+
+

Phone & Tablet Repair

+

Battery replacement, screen repairs, water damage fixes, charging issues.

+
+
+

Computer Setup & Cleaning

+

Malware removal, system optimization, hardware upgrades, cleaning dust.

+
+
+

Data Recovery

+

Recovers lost files from damaged drives, phones, and external storage.

+
+
+
+
+ + +
+
+

About Steve

+ Steve +

Steve has over 15 years of experience in electronics repair. He started his journey fixing old PCs at home before opening Steve’s Tech Repair in 2010. With honest service, fast turnaround times, and no hidden fees, Steve’s Tech is your go-to place when your device fails.

+
+
+ + +
+
+

What Our Customers Say

+
+
+

"Steve fixed my cracked iPhone screen in under 2 hours. I was amazed by the quality and speed!"

+
— Sarah M., Customer
+
+
+

"My laptop wouldn’t boot up. Steve diagnosed it and replaced the hard drive — now it runs like new!"

+
— James R., Business Owner
+
+
+

"Finally found someone who doesn't charge extra. The service was friendly and transparent."

+
— Lisa K., Teacher
+
+
+
+
+ + +
+
+

Get In Touch

+
+
+ + +
+
+ + +
+
+ + +
+
+ + +
+ +
+
+
+ + + + + + +``` + +--- + +## 🔧 How to Use This Website: + +1. **Save as HTML File** + - Open any text editor (VS Code, Notepad++, etc.) + - Paste the code above. + - Save it as `index.html`. + +2. **Deploy Online (Optional but Recommended)** + To make it live: + - Upload to [Netlify](https://www.netlify.com/) + - Or use [Vercel](https://vercel.com/) or [GitHub Pages](https://pages.github.com/) + +3. **Customize It Further** + - Change colors in CSS (e.g., update gradient in header). + - Replace images with real photos of Steve or your shop. + - Add Google Maps embed for location. + - Add contact phone/email directly. + - Connect to backend for actual form submission (using Formspree or Firebase). + +--- + +## 💡 Suggested Next Steps: +| Feature | How to Add | +|--------|------------| +| Google Maps Embed | Add ` +
+
+ + +
+
+ + +
+
+ + +
+
+ + +
+ +
+ + + + + + + + + + + +``` + +### How to Use This Starter Kit: +1. Save as `index.html` +2. Host on GitHub Pages, Netlify, Vercel, or any static hosting platform. +3. Optional enhancements: + - Add real Google Maps iframe + - Connect Stripe/PayPal for payments + - Implement a contact form backend via Formspree, Netlify Forms, or Firebase + +### Key Features Included: +- Responsive design (works on mobile/tablets) +- Hero section with CTA buttons +- Services cards with prices +- Customer testimonials +- Two pricing plans (monthly subscriptions + one-time quotes) +- Contact section with embedded map and form +- Sticky navigation bar +- Tabbed UI for pricing/services +- Modern gradient colors and subtle animations +- Mobile hamburger menu + +This provides a polished, conversion-focused landing page that builds trust through transparency and clear CTAs. Customize colors, fonts, and content as needed for your shop. \ No newline at end of file diff --git a/merges.txt b/merges.txt new file mode 100644 index 0000000..80c1a19 --- /dev/null +++ b/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/model-00001-of-00002.safetensors b/model-00001-of-00002.safetensors new file mode 100644 index 0000000..d966f7a --- /dev/null +++ b/model-00001-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af80edd6f4bdd648346ba5d933ea91c14e855f3bfaebfd4a1d527f27c863dc02 +size 4967215360 diff --git a/model-00002-of-00002.safetensors b/model-00002-of-00002.safetensors new file mode 100644 index 0000000..6e69c41 --- /dev/null +++ b/model-00002-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:699e5cfb5a5b6b56c1f512bd88d1000482f5e4144994da8603f32d77bce99a72 +size 3077766632 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000..b65d806 --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,406 @@ +{ + "metadata": { + "total_parameters": 4022468096, + "total_size": 8044936192 + }, + "weight_map": { + "model.embed_tokens.weight": "model-00001-of-00002.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.10.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.11.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.12.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.13.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.14.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.15.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.16.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.17.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.18.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.19.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.20.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.20.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.20.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.21.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.21.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.21.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.21.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.21.self_attn.k_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.21.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.21.self_attn.q_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.21.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.21.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.22.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.22.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.22.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.22.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.22.self_attn.k_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.22.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.22.self_attn.q_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.22.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.22.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.23.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.23.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.23.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.23.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.23.self_attn.k_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.23.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.23.self_attn.q_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.23.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.23.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.24.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.24.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.24.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.24.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.24.self_attn.k_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.24.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.24.self_attn.q_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.24.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.24.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.25.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.25.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.25.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.25.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.25.self_attn.k_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.25.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.25.self_attn.q_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.25.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.25.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.26.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.k_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.q_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.27.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.k_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.q_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.28.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.28.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.28.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.28.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.28.self_attn.k_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.28.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.28.self_attn.q_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.28.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.28.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.29.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.k_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.q_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.3.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.3.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.30.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.30.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.k_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.q_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.31.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.k_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.q_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.32.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.k_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.q_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.33.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.k_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.q_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.34.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.k_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.q_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.35.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.k_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.q_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.4.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.4.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.5.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.6.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.7.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.8.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.9.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.k_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.q_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.norm.weight": "model-00002-of-00002.safetensors" + } +} diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..9b8043f --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,31 @@ +{ + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "eos_token": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "<|vision_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..2e51a8b --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9dacde395967e963cb9837e85a04a649fe957d3796ff72a2fac9ea4de556d47 +size 11422921 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..da9f80f --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,240 @@ +{ + "add_bos_token": false, + "add_prefix_space": false, + "added_tokens_decoder": { + "151643": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151644": { + "content": "<|im_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151645": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151646": { + "content": "<|object_ref_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151647": { + "content": "<|object_ref_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151648": { + "content": "<|box_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151649": { + "content": "<|box_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151650": { + "content": "<|quad_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151651": { + "content": "<|quad_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151652": { + "content": "<|vision_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151653": { + "content": "<|vision_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151654": { + "content": "<|vision_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151655": { + "content": "<|image_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151656": { + "content": "<|video_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151657": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151658": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151659": { + "content": "<|fim_prefix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151660": { + "content": "<|fim_middle|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151661": { + "content": "<|fim_suffix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151662": { + "content": "<|fim_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151663": { + "content": "<|repo_name|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151664": { + "content": "<|file_sep|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151665": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151666": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151667": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151668": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + } + }, + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "bos_token": null, + "clean_up_tokenization_spaces": false, + "eos_token": "<|im_end|>", + "errors": "replace", + "extra_special_tokens": {}, + "model_max_length": 262144, + "pad_token": "<|vision_pad|>", + "padding_side": "right", + "split_special_tokens": false, + "tokenizer_class": "Qwen2Tokenizer", + "unk_token": null +} diff --git a/vocab.json b/vocab.json new file mode 100644 index 0000000..6c49fc6 --- /dev/null +++ b/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833