Format code (#118)
This commit is contained in:
@@ -324,7 +324,7 @@ python -m sglang.launch_server --model-path meta-llama/Llama-2-7b-chat-hf --port
|
|||||||
- Mixtral
|
- Mixtral
|
||||||
- LLaVA
|
- LLaVA
|
||||||
- `python3 -m sglang.launch_server --model-path liuhaotian/llava-v1.5-7b --tokenizer-path llava-hf/llava-1.5-7b-hf --port 30000`
|
- `python3 -m sglang.launch_server --model-path liuhaotian/llava-v1.5-7b --tokenizer-path llava-hf/llava-1.5-7b-hf --port 30000`
|
||||||
- Qwen
|
- Qwen / Qwen 2
|
||||||
- AWQ quantization
|
- AWQ quantization
|
||||||
|
|
||||||
## Benchmark And Performance
|
## Benchmark And Performance
|
||||||
|
|||||||
@@ -319,4 +319,5 @@ class LlamaForCausalLM(nn.Module):
|
|||||||
weight_loader = getattr(param, "weight_loader", default_weight_loader)
|
weight_loader = getattr(param, "weight_loader", default_weight_loader)
|
||||||
weight_loader(param, loaded_weight)
|
weight_loader(param, loaded_weight)
|
||||||
|
|
||||||
|
|
||||||
EntryClass = LlamaForCausalLM
|
EntryClass = LlamaForCausalLM
|
||||||
|
|||||||
@@ -331,4 +331,5 @@ def monkey_path_clip_vision_embed_forward():
|
|||||||
clip_vision_embed_forward,
|
clip_vision_embed_forward,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
EntryClass = LlavaLlamaForCausalLM
|
EntryClass = LlavaLlamaForCausalLM
|
||||||
|
|||||||
@@ -377,4 +377,5 @@ class MixtralForCausalLM(nn.Module):
|
|||||||
weight_loader = getattr(param, "weight_loader", default_weight_loader)
|
weight_loader = getattr(param, "weight_loader", default_weight_loader)
|
||||||
weight_loader(param, loaded_weight)
|
weight_loader(param, loaded_weight)
|
||||||
|
|
||||||
|
|
||||||
EntryClass = MixtralForCausalLM
|
EntryClass = MixtralForCausalLM
|
||||||
|
|||||||
@@ -259,4 +259,5 @@ class QWenLMHeadModel(nn.Module):
|
|||||||
weight_loader = getattr(param, "weight_loader", default_weight_loader)
|
weight_loader = getattr(param, "weight_loader", default_weight_loader)
|
||||||
weight_loader(param, loaded_weight)
|
weight_loader(param, loaded_weight)
|
||||||
|
|
||||||
|
|
||||||
EntryClass = QWenLMHeadModel
|
EntryClass = QWenLMHeadModel
|
||||||
|
|||||||
@@ -315,4 +315,5 @@ class Qwen2ForCausalLM(nn.Module):
|
|||||||
weight_loader = getattr(param, "weight_loader", default_weight_loader)
|
weight_loader = getattr(param, "weight_loader", default_weight_loader)
|
||||||
weight_loader(param, loaded_weight)
|
weight_loader(param, loaded_weight)
|
||||||
|
|
||||||
|
|
||||||
EntryClass = Qwen2ForCausalLM
|
EntryClass = Qwen2ForCausalLM
|
||||||
|
|||||||
Reference in New Issue
Block a user