---
language:
- zh
- en
pipeline_tag: text-generation
license: other
datasets:
- HuggingFaceH4/ultrafeedback_binarized
library_name: transformers
---
## Examples
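The snippet below loads the model with the `transformers` library and runs a single-turn chat generation: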
```python
from transformers import AutoModelForCausalLM, AutoTokenizer

model_path = 'chinoll/Yi-6b-200k-dpo'

tokenizer = AutoTokenizer.from_pretrained(model_path, use_fast=False)

# Since transformers 4.35.0, GPT-Q/AWQ models can also be loaded with AutoModelForCausalLM.
model = AutoModelForCausalLM.from_pretrained(
    model_path,
    device_map="auto",
    torch_dtype='auto'
).eval()

# Prompt content: "hi"
messages = [
    {"role": "user", "content": "hi"}
]

input_ids = tokenizer.apply_chat_template(conversation=messages, tokenize=True, add_generation_prompt=True, return_tensors='pt')
# Use model.device so the input lands wherever device_map placed the model.
output_ids = model.generate(input_ids.to(model.device))
response = tokenizer.decode(output_ids[0][input_ids.shape[1]:], skip_special_tokens=True)

# Model response: "Hello! How can I assist you today?"
print(response)
```
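Without explicit arguments, `model.generate` falls back to the model's default generation settings, which can truncate longer replies. The sketch below passes common decoding parameters; the values are illustrative assumptions, not tuned settings for this model.

```python
# Continuing from the example above. The parameter values here are
# illustrative assumptions, not recommended settings for this model.
output_ids = model.generate(
    input_ids.to(model.device),
    max_new_tokens=256,   # upper bound on the length of the reply
    do_sample=True,       # sample instead of greedy decoding
    temperature=0.7,
    top_p=0.9,
)
response = tokenizer.decode(output_ids[0][input_ids.shape[1]:], skip_special_tokens=True)
print(response)
```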