初始化项目，由ModelHub XC社区提供模型

Model: nguyenthanhthuan/Llama_3.2_1B_Intruct_Tool_Calling_V2 Source: Original Platform
2026-05-18 03:14:53 +08:00
commit 83c92a3dd4
10 changed files with 413059 additions and 0 deletions
--- a/.gitattributes
+++ b/.gitattributes
@@ -0,0 +1,37 @@
+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text
+unsloth.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
+Llama_3.2_1B_Intruct_Tool_Calling_V2.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
--- a/Llama_3.2_1B_Intruct_Tool_Calling_V2.Q8_0.gguf
+++ b/Llama_3.2_1B_Intruct_Tool_Calling_V2.Q8_0.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:46a1baf7ee886c001ad6d24a27eea7403bdacf2765237f24704ff955aec5ea78
+size 1321079552
--- a/46
+++ b/46
@@ -0,0 +1,46 @@
+FROM Llama_3.2_1B_Intruct_Tool_Calling_V2.Q8_0.gguf
+
+TEMPLATE """<|start_header_id|>system<|end_header_id|>
+
+Cutting Knowledge Date: December 2023
+
+{{ if .System }}{{ .System }}
+{{- end }}
+{{- if .Tools }}When you receive a tool call response, use the output to format an answer to the orginal user question.
+
+You are a helpful assistant with tool calling capabilities.
+{{- end }}<|eot_id|>
+{{- range $i, $_ := .Messages }}
+{{- $last := eq (len (slice $.Messages $i)) 1 }}
+{{- if eq .Role "user" }}<|start_header_id|>user<|end_header_id|>
+{{- if and $.Tools $last }}
+
+Given the following functions, please respond with a JSON for a function call with its proper arguments that best answers the given prompt.
+
+Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}. Do not use variables.
+
+{{ range $.Tools }}
+{{- . }}
+{{ end }}
+{{ .Content }}<|eot_id|>
+{{- else }}
+
+{{ .Content }}<|eot_id|>
+{{- end }}{{ if $last }}<|start_header_id|>assistant<|end_header_id|>
+
+{{ end }}
+{{- else if eq .Role "assistant" }}<|start_header_id|>assistant<|end_header_id|>
+{{- if .ToolCalls }}
+{{ range .ToolCalls }}
+{"name": "{{ .Function.Name }}", "parameters": {{ .Function.Arguments }}}{{ end }}
+{{- else }}
+
+{{ .Content }}
+{{- end }}{{ if not $last }}<|eot_id|>{{ end }}
+{{- else if eq .Role "tool" }}<|start_header_id|>ipython<|end_header_id|>
+
+{{ .Content }}<|eot_id|>{{ if $last }}<|start_header_id|>assistant<|end_header_id|>
+
+{{ end }}
+{{- end }}
+{{- end }}"""
--- a/README.md
+++ b/README.md
@@ -0,0 +1,264 @@
+---
+base_model:
+- meta-llama/Llama-3.2-1B-Instruct
+language:
+- en
+- vi
+license: apache-2.0
+tags:
+- text-generation-inference
+- transformers
+- unsloth
+- llama
+- trl
+- Ollama
+- Tool-Calling
+datasets:
+- nguyenthanhthuan/function-calling-sharegpt
+---
+# Function Calling Llama Model Version 2
+
+## Overview
+A specialized fine-tuned version of the **`meta-llama/Llama-3.2-1B-Instruct`** model enhanced with function/tool calling capabilities. The model leverages the **`nguyenthanhthuan/function-calling-sharegpt`** dataset for training.
+
+## Model Specifications
+
+* **Base Architecture**: meta-llama/Llama-3.2-1B-Instruct
+* **Primary Language**: English (Function/Tool Calling), Vietnamese
+* **Licensing**: Apache 2.0
+* **Primary Developer**: nguyenthanhthuan_banhmi
+* **Key Capabilities**: text-generation-inference, transformers, unsloth, llama, trl, Ollama, Tool-Calling
+
+## Getting Started
+
+### Prerequisites
+Method 1:
+1. Install [Ollama](https://ollama.com/)
+2. Install required Python packages:
+   ```bash
+   pip install langchain pydantic torch langchain-ollama langchain_core
+   ```
+Method 2:
+1. Click use this model
+2. Click Ollama
+
+### Installation Steps
+
+1. Clone the repository
+2. Navigate to the project directory
+3. Create the model in Ollama:
+   ```bash
+   ollama create <model_name> -f <path_to_modelfile>
+   ```
+
+## Implementation Guide
+
+### Model Initialization
+
+```python
+from langchain_ollama import ChatOllama 
+
+# Initialize model instance
+llm = ChatOllama(model="<model_name>")
+```
+
+### Basic Usage Example
+
+```python
+# Arithmetic computation example
+query = "What is 3 * 12? Also, what is 11 + 49?"
+response = llm.invoke(query)
+
+print(response.content)
+# Output:
+# 1. 3 times 12 is 36.
+# 2. 11 plus 49 is 60.
+```
+
+### Advanced Function Calling (English Recommended)
+
+#### Basic Arithmetic Tools (Different from the first version)
+```python
+from pydantic import BaseModel
+
+# Note that the docstrings here are crucial, as they will be passed along
+# to the model along with the class name.
+class add(BaseModel):
+    """Add two integers together."""
+
+    a: int = Field(..., description="First integer")
+    b: int = Field(..., description="Second integer")
+
+class multiply(BaseModel):
+    """Multiply two integers together."""
+
+    a: int = Field(..., description="First integer")
+    b: int = Field(..., description="Second integer")
+
+tools = [add, multiply]
+llm_with_tools = llm.bind_tools(tools)
+
+# Execute query and parser result (Different from the first version)
+from langchain_core.output_parsers.openai_tools import PydanticToolsParser
+
+query = "What is 3 * 12? Also, what is 11 + 49?"
+chain = llm_with_tools | PydanticToolsParser(tools=tools)
+result = chain.invoke(query)
+print(result)
+
+# Output:
+# [multiply(a=3, b=12), add(a=11, b=49)]
+```
+
+#### Complex Tool Integration (Different from the first version)
+
+```python
+from pydantic import BaseModel, Field
+from typing import List, Optional
+
+class SendEmail(BaseModel):
+    """Send an email to specified recipients."""
+
+    to: List[str] = Field(..., description="List of email recipients")
+    subject: str = Field(..., description="Email subject")
+    body: str = Field(..., description="Email content/body")
+    cc: Optional[List[str]] = Field(None, description="CC recipients")
+    attachments: Optional[List[str]] = Field(None, description="List of attachment file paths")
+
+class WeatherInfo(BaseModel):
+    """Get weather information for a specific location."""
+
+    city: str = Field(..., description="City name")
+    country: Optional[str] = Field(None, description="Country name")
+    units: str = Field("celsius", description="Temperature units (celsius/fahrenheit)")
+
+class SearchWeb(BaseModel):
+    """Search the web for given query."""
+
+    query: str = Field(..., description="Search query")
+    num_results: int = Field(5, description="Number of results to return")
+    language: str = Field("en", description="Search language")
+
+class CreateCalendarEvent(BaseModel):
+    """Create a calendar event."""
+
+    title: str = Field(..., description="Event title")
+    start_time: str = Field(..., description="Event start time (ISO format)")
+    end_time: str = Field(..., description="Event end time (ISO format)")
+    description: Optional[str] = Field(None, description="Event description")
+    attendees: Optional[List[str]] = Field(None, description="List of attendee emails")
+
+class TranslateText(BaseModel):
+    """Translate text between languages."""
+
+    text: str = Field(..., description="Text to translate")
+    source_lang: str = Field(..., description="Source language code (e.g., 'en', 'es')")
+    target_lang: str = Field(..., description="Target language code (e.g., 'fr', 'de')")
+
+class SetReminder(BaseModel):
+    """Set a reminder for a specific time."""
+
+    message: str = Field(..., description="Reminder message")
+    time: str = Field(..., description="Reminder time (ISO format)")
+    priority: str = Field("normal", description="Priority level (low/normal/high)")
+tools = [
+    SendEmail,
+    WeatherInfo,
+    SearchWeb,
+    CreateCalendarEvent,
+    TranslateText,
+    SetReminder
+]
+llm_tools = llm.bind_tools(tools)
+
+# # Execute query and parser result (Different from the first version)
+from langchain_core.output_parsers.openai_tools import PydanticToolsParser
+
+query = "Set a reminder to call John at 3 PM tomorrow. Also, translate 'Hello, how are you?' to Spanish."
+chain = llm_tools | PydanticToolsParser(tools=tools)
+result = chain.invoke(query)
+print(result)
+
+# Output:
+# [SetReminder(message='Set a reminder for a specific time.', time='3 PM tomorrow', priority='normal'),
+# TranslateText(text='Hello, how are you?', source_lang='en', target_lang='es')]
+```
+
+## Core Features
+
+* Arithmetic computation support
+* Advanced function/tool calling capabilities
+* Seamless Langchain integration
+* Full Ollama platform compatibility
+
+## Technical Details
+
+### Dataset Information
+Training utilized the **`nguyenthanhthuan/function-calling-sharegpt`** dataset, featuring comprehensive function calling interaction examples.
+
+### Known Limitations
+
+* Basic function/tool calling
+* English language support exclusively
+* Ollama installation dependency
+
+## Important Notes & Considerations
+
+### Potential Limitations and Edge Cases
+
+* **Function Parameter Sensitivity**: The model may occasionally misinterpret complex parameter combinations, especially when multiple optional parameters are involved. Double-check parameter values in critical applications.
+
+* **Response Format Variations**:
+  - In some cases, the function calling format might deviate from the expected JSON structure
+  - The model may generate additional explanatory text alongside the function call
+  - Multiple function calls in a single query might not always be processed in the expected order
+
+* **Error Handling Considerations**:
+  - Empty or null values might not be handled consistently across different function types
+  - Complex nested objects may sometimes be flattened unexpectedly
+  - Array inputs might occasionally be processed as single values
+
+### Best Practices for Reliability
+
+1. **Input Validation**:
+   - Always validate input parameters before processing
+   - Implement proper error handling for malformed function calls
+   - Consider adding default values for optional parameters
+
+2. **Testing Recommendations**:
+   - Test with various input combinations and edge cases
+   - Implement retry logic for inconsistent responses
+   - Log and monitor function call patterns for debugging
+
+3. **Performance Optimization**:
+   - Keep function descriptions concise and clear
+   - Limit the number of simultaneous function calls
+   - Cache frequently used function results when possible
+
+### Known Issues
+
+* Model may struggle with:
+  - Very long function descriptions
+  - Highly complex nested parameter structures
+  - Ambiguous or overlapping function purposes
+  - Non-English parameter values or descriptions
+
+## Development
+
+### Contributing Guidelines
+We welcome contributions through issues and pull requests for improvements and bug fixes.
+
+### License Information
+Released under Apache 2.0 license. See LICENSE file for complete terms.
+
+## Academic Citation
+
+```bibtex
+@misc{function-calling-llama,
+    author = {nguyenthanhthuan_banhmi},
+    title = {Function Calling Llama Model Version 2} ,
+    year = {2024},
+    publisher = {GitHub},
+    journal = {GitHub repository}
+}
+```
--- a/config.json
+++ b/config.json
@@ -0,0 +1,42 @@
+{
+  "_name_or_path": "unsloth/llama-3.2-1b-instruct-bnb-4bit",
+  "architectures": [
+    "LlamaForCausalLM"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "bos_token_id": 128000,
+  "eos_token_id": [
+    128001,
+    128008,
+    128009
+  ],
+  "head_dim": 64,
+  "hidden_act": "silu",
+  "hidden_size": 2048,
+  "initializer_range": 0.02,
+  "intermediate_size": 8192,
+  "max_position_embeddings": 131072,
+  "mlp_bias": false,
+  "model_type": "llama",
+  "num_attention_heads": 32,
+  "num_hidden_layers": 16,
+  "num_key_value_heads": 8,
+  "pad_token_id": 128004,
+  "pretraining_tp": 1,
+  "rms_norm_eps": 1e-05,
+  "rope_scaling": {
+    "factor": 32.0,
+    "high_freq_factor": 4.0,
+    "low_freq_factor": 1.0,
+    "original_max_position_embeddings": 8192,
+    "rope_type": "llama3"
+  },
+  "rope_theta": 500000.0,
+  "tie_word_embeddings": true,
+  "torch_dtype": "float16",
+  "transformers_version": "4.44.2",
+  "unsloth_version": "2024.10.7",
+  "use_cache": true,
+  "vocab_size": 128256
+}
--- a/generation_config.json
+++ b/generation_config.json
@@ -0,0 +1,14 @@
+{
+  "bos_token_id": 128000,
+  "do_sample": true,
+  "eos_token_id": [
+    128001,
+    128008,
+    128009
+  ],
+  "max_length": 131072,
+  "pad_token_id": 128004,
+  "temperature": 0.6,
+  "top_p": 0.9,
+  "transformers_version": "4.44.2"
+}
--- a/pytorch_model.bin
+++ b/pytorch_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8f9725bd0be2d6a4d1b05d5ed29383fcfa35b64d4bf987202358c89b78fa5e4b
+size 2471678098
--- a/special_tokens_map.json
+++ b/special_tokens_map.json
@@ -0,0 +1,23 @@
+{
+  "bos_token": {
+    "content": "<|begin_of_text|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "<|eot_id|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<|finetune_right_pad_id|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}
--- a/tokenizer.json
+++ b/tokenizer.json
--- a/tokenizer_config.json
+++ b/tokenizer_config.json