# Forked from EngineX-Cambricon/enginex-mlu370-vllm (22 lines, 340 B, Python).
from dataclasses import dataclass
|
|
from typing import Dict
|
|
|
|
import torch
|
|
|
|
|
|
@dataclass
class SamplingMetadata:
    """Plain data record holding sampling settings.

    ``@dataclass`` generates ``__init__``, ``__repr__`` and ``__eq__`` from
    the annotated fields below.  The declaration order is also the positional
    argument order of the generated ``__init__``, so fields must not be
    reordered.  No field has a default; all nine must be supplied.

    NOTE(review): the per-field descriptions are inferred from the field
    names alone.  Tensor shapes/dtypes and the exact meaning of the boolean
    flags are not established anywhere in this file -- confirm against the
    code that builds and consumes this object.
    """

    # Temperature values -- presumably one entry per request; TODO confirm.
    temperature: torch.Tensor
    # Presumably True when every request samples greedily; TODO confirm.
    all_greedy: bool
    # Presumably True when every request samples randomly; TODO confirm.
    all_random: bool

    # Top-p (nucleus) values -- layout assumed to match `temperature`.
    top_p: torch.Tensor
    # Top-k values -- layout assumed to match `temperature`.
    top_k: torch.Tensor
    # Presumably True when no request applies top-p filtering; TODO confirm.
    no_top_p: bool
    # Presumably True when no request applies top-k filtering; TODO confirm.
    no_top_k: bool

    # Random generators keyed by an int -- key meaning (request index?) is
    # not visible here; verify against the caller.
    generators: Dict[int, torch.Generator]

    # Presumably the largest number of logprobs requested; TODO confirm.
    max_num_logprobs: int