update base image
This commit is contained in:
@@ -1,4 +1,4 @@
|
||||
FROM wjie520/vllm_kunlun:base_v0.0.2
|
||||
FROM vllm_kunlun:custom_base_v0.0.3
|
||||
|
||||
WORKDIR /workspace
|
||||
|
||||
|
||||
@@ -11,11 +11,12 @@ One of the key features of this project is efficient memory coordination, enabli
|
||||
|
||||
### Build from Dockerfile
|
||||
|
||||
Clone this repository:
|
||||
1. Get or build base image (base with customized xpytorch, ops, etc.). Ref: [installation](https://vllm-kunlun.readthedocs.io/en/latest/installation.html).
|
||||
|
||||
```bash
|
||||
docker build -t $build_image -f ./Dockerfile .
|
||||
```
|
||||
2. Clone this repository and build
|
||||
```bash
|
||||
docker build -t $build_image -f ./Dockerfile .
|
||||
```
|
||||
|
||||
## Usage
|
||||
|
||||
|
||||
@@ -8,9 +8,6 @@ import vllm.envs as envs
|
||||
from vllm.logger import init_logger
|
||||
|
||||
|
||||
# fix bfloat16 double size issue
|
||||
torch.backends.cuda.matmul.allow_bf16_reduced_precision_reduction = False
|
||||
|
||||
logger = init_logger(__name__)
|
||||
|
||||
class KunlunPlatform(Platform):
|
||||
|
||||
Reference in New Issue
Block a user