18 lines
611 B
Python
18 lines
611 B
Python
from vllm.inputs.registry import InputContext
|
|
from vllm.multimodal.base import MultiModalInputs, MultiModalPlugin
|
|
|
|
|
|
class AudioPlugin(MultiModalPlugin):
    """Multimodal plugin for the audio modality.

    The plugin identifies its data under the key ``"audio"``. It supplies
    neither a default input mapper nor a default maximum token count: both
    default hooks raise ``NotImplementedError`` unconditionally.
    """

    def get_data_key(self) -> str:
        """Return the key identifying this plugin's data: ``"audio"``."""
        return "audio"

    def _default_input_mapper(
        self,
        ctx: InputContext,
        data: object,
    ) -> MultiModalInputs:
        """Default input-mapper hook; not available for audio.

        Args:
            ctx: Input context (unused here).
            data: Audio data to map (unused here).

        Raises:
            NotImplementedError: Always.
        """
        message = "There is no default audio input mapper"
        raise NotImplementedError(message)

    def _default_max_multimodal_tokens(
        self,
        ctx: InputContext,
    ) -> int:
        """Default maximum-token hook; not available for audio.

        Args:
            ctx: Input context (unused here).

        Raises:
            NotImplementedError: Always.
        """
        message = "There is no default maximum multimodal tokens"
        raise NotImplementedError(message)
|