Fix the chat template for llava-v1.6-34b & format code (#177)

2024-02-11 05:50:13 -08:00
parent 50afed4eaa
commit c51020cf0c
23 changed files with 101 additions and 44 deletions
--- a/python/sglang/srt/models/llava.py
+++ b/python/sglang/srt/models/llava.py
@@ -1,4 +1,5 @@
 """Inference-only LLaVa model compatible with HuggingFace weights."""
+
 from typing import List, Optional

 import numpy as np
@@ -269,7 +270,6 @@ class LlavaLlamaForCausalLM(nn.Module):
            raise ValueError(f"Unexpected select feature: {self.select_feature}")

        # load mm_projector
-        # TODO: support TP?
        projector_weights = {
            "model.mm_projector.0": "multi_modal_projector.linear_1",
            "model.mm_projector.2": "multi_modal_projector.linear_2",
--- a/python/sglang/srt/models/mistral.py
+++ b/python/sglang/srt/models/mistral.py
@@ -1,4 +1,5 @@
 """Inference-only Mistral model."""
+
 from sglang.srt.models.llama2 import LlamaForCausalLM


--- a/python/sglang/srt/models/mixtral.py
+++ b/python/sglang/srt/models/mixtral.py
@@ -97,14 +97,16 @@ class MixtralMoE(nn.Module):

        self.experts = nn.ModuleList(
            [
-                MixtralMLP(
-                    self.num_total_experts,
-                    config.hidden_size,
-                    config.intermediate_size,
-                    linear_method=linear_method,
+                (
+                    MixtralMLP(
+                        self.num_total_experts,
+                        config.hidden_size,
+                        config.intermediate_size,
+                        linear_method=linear_method,
+                    )
+                    if idx in self.expert_indicies
+                    else None
                )
-                if idx in self.expert_indicies
-                else None
                for idx in range(self.num_total_experts)
            ]
        )
--- a/python/sglang/srt/models/yivl.py
+++ b/python/sglang/srt/models/yivl.py
@@ -1,4 +1,5 @@
 """Inference-only Yi-VL model."""
+
 import os
 from typing import List, Optional