update base image
This commit is contained in:
@@ -1,4 +1,4 @@
|
|||||||
FROM wjie520/vllm_kunlun:base_v0.0.2
|
FROM vllm_kunlun:custom_base_v0.0.3
|
||||||
|
|
||||||
WORKDIR /workspace
|
WORKDIR /workspace
|
||||||
|
|
||||||
|
|||||||
@@ -11,8 +11,9 @@ One of the key features of this project is efficient memory coordination, enabli
|
|||||||
|
|
||||||
### Build from Dockerfile
|
### Build from Dockerfile
|
||||||
|
|
||||||
Clone this repository:
|
1. Get or build the base image (a base image with customized xpytorch, ops, etc.). See the [installation guide](https://vllm-kunlun.readthedocs.io/en/latest/installation.html).
|
||||||
|
|
||||||
|
2. Clone this repository and build the image:
|
||||||
```bash
|
```bash
|
||||||
docker build -t $build_image -f ./Dockerfile .
|
docker build -t $build_image -f ./Dockerfile .
|
||||||
```
|
```
|
||||||
|
|||||||
@@ -8,9 +8,6 @@ import vllm.envs as envs
|
|||||||
from vllm.logger import init_logger
|
from vllm.logger import init_logger
|
||||||
|
|
||||||
|
|
||||||
# fix bfloat16 double size issue
|
|
||||||
torch.backends.cuda.matmul.allow_bf16_reduced_precision_reduction = False
|
|
||||||
|
|
||||||
logger = init_logger(__name__)
|
logger = init_logger(__name__)
|
||||||
|
|
||||||
class KunlunPlatform(Platform):
|
class KunlunPlatform(Platform):
|
||||||
|
|||||||
Reference in New Issue
Block a user