Bug: Fix google gemma3n-mm audio input not working bug (#8365)
This commit is contained in:
@@ -192,7 +192,12 @@ class BaseMultimodalProcessor(ABC):
|
|||||||
|
|
||||||
# name of the feature field
|
# name of the feature field
|
||||||
# TODO: pass from processors
|
# TODO: pass from processors
|
||||||
self.FEATURE_NAMES = ["pixel_values", "pixel_values_videos", "audio_features"]
|
self.FEATURE_NAMES = [
|
||||||
|
"pixel_values",
|
||||||
|
"pixel_values_videos",
|
||||||
|
"audio_features",
|
||||||
|
"input_features",
|
||||||
|
]
|
||||||
|
|
||||||
def process_mm_data(
|
def process_mm_data(
|
||||||
self, input_text, images=None, videos=None, audios=None, **kwargs
|
self, input_text, images=None, videos=None, audios=None, **kwargs
|
||||||
|
|||||||
@@ -171,6 +171,11 @@ class TestGemma3nServer(TestOpenAIVisionServer):
|
|||||||
)
|
)
|
||||||
cls.base_url += "/v1"
|
cls.base_url += "/v1"
|
||||||
|
|
||||||
|
def test_audio_chat_completion(self):
|
||||||
|
self._test_audio_speech_completion()
|
||||||
|
# This _test_audio_ambient_completion test is way too complicated to pass for a small LLM
|
||||||
|
# self._test_audio_ambient_completion()
|
||||||
|
|
||||||
|
|
||||||
class TestKimiVLServer(TestOpenAIVisionServer):
|
class TestKimiVLServer(TestOpenAIVisionServer):
|
||||||
@classmethod
|
@classmethod
|
||||||
@@ -252,9 +257,7 @@ class TestPhi4MMServer(TestOpenAIVisionServer):
|
|||||||
|
|
||||||
def test_audio_chat_completion(self):
|
def test_audio_chat_completion(self):
|
||||||
self._test_audio_speech_completion()
|
self._test_audio_speech_completion()
|
||||||
# TODO: currently phi4-mm cannot pass this test.
|
# This _test_audio_ambient_completion test is way too complicated to pass for a small LLM
|
||||||
# We are investigating this issue.
|
|
||||||
# Response: La ciudad está situada en la costa este de la isla, en la desembocadura del río St. Lawrence.
|
|
||||||
# self._test_audio_ambient_completion()
|
# self._test_audio_ambient_completion()
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user