Update to new version of base image
This commit is contained in:
@@ -4,6 +4,7 @@ from typing import List, Optional, Tuple
|
||||
import torch
|
||||
|
||||
from vllm import _custom_ops as ops
|
||||
|
||||
from vllm.attention.ops.prefix_prefill import context_attention_fwd
|
||||
|
||||
# Should be the same as PARTITION_SIZE in `paged_attention_v2_launcher`.
|
||||
|
||||
Reference in New Issue
Block a user