[Misc] Clean up useless print and logger calls (#5220)

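1. Remove useless print statements.
2. Use the vLLM logger (`vllm.logger.logger`) instead of the standard `logging` module.
3. Downgrade unnecessary INFO-level messages to DEBUG level.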

- vLLM version: release/v0.13.0
- vLLM main: ad32e3e19c

Signed-off-by: wangxiyuan <wangxiyuan1007@gmail.com>
This commit is contained in:
wangxiyuan
2025-12-22 11:28:26 +08:00
committed by GitHub
parent e117b3d693
commit 492173cf89
6 changed files with 10 additions and 23 deletions

View File

@@ -15,13 +15,12 @@
# See the License for the specific language governing permissions and
# limitations under the License.
#
import logging
import torch
import torch._inductor.pattern_matcher as pm
from torch._inductor.pattern_matcher import PatternMatcherPass
from vllm.compilation.vllm_inductor_pass import VllmInductorPass
from vllm.config import VllmConfig
from vllm.logger import logger
class AddRMSNormQuantPattern:
@@ -288,7 +287,7 @@ class AddRMSNormQuantFusionPass(VllmInductorPass):
dtype = vllm_config.model_config.dtype
if dtype not in (torch.bfloat16, torch.float16):
logging.info("Quant fusion not enabled: unsupported dtype %s",
logger.debug("Quant fusion not enabled: unsupported dtype %s",
dtype)
return
@@ -306,7 +305,7 @@ class AddRMSNormQuantFusionPass(VllmInductorPass):
def __call__(self, graph: torch.fx.Graph):
self.begin()
self.matched_count = self.pattern_match_passes.apply(graph)
logging.debug("Replaced %s patterns", self.matched_count)
logger.debug("Replaced %s patterns", self.matched_count)
self.end_and_log()
def is_applicable(self, runtime_shape: int | None = None) -> bool: