[model] DBRX-instruct support (#337)

This commit is contained in:
Liangsheng Yin
2024-03-29 01:05:19 +08:00
committed by GitHub
parent 3842eba5fa
commit 2af565b3bb
5 changed files with 726 additions and 4 deletions

View File

@@ -5,12 +5,11 @@ model compatible with HuggingFace weights."""
from typing import Optional, Tuple
import torch
from torch import nn
from transformers import PretrainedConfig
from sglang.srt.layers.logits_processor import LogitsProcessor
from sglang.srt.layers.radix_attention import RadixAttention
from sglang.srt.managers.router.model_runner import InputMetadata
from torch import nn
from transformers import PretrainedConfig
from vllm.model_executor.layers.activation import SiluAndMul
from vllm.model_executor.layers.linear import (
LinearMethodBase,
@@ -20,8 +19,8 @@ from vllm.model_executor.layers.linear import (
)
from vllm.model_executor.layers.rotary_embedding import get_rope
from vllm.model_executor.layers.vocab_parallel_embedding import (
VocabParallelEmbedding,
ParallelLMHead,
VocabParallelEmbedding,
)
from vllm.model_executor.parallel_utils.parallel_state import (
get_tensor_model_parallel_world_size,