vllm.model_executor.models.smolvlm

SmolVLMForConditionalGeneration ¶

Bases: Idefics3ForConditionalGeneration

Source code in vllm/model_executor/models/smolvlm.py

@MULTIMODAL_REGISTRY.register_processor(SmolVLMMultiModalProcessor,
                                        info=SmolVLMProcessingInfo,
                                        dummy_inputs=SmolVLMDummyInputsBuilder)
class SmolVLMForConditionalGeneration(Idefics3ForConditionalGeneration):

    def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
        super().__init__(
            vllm_config=vllm_config,
            prefix=prefix,
        )

init ¶

__init__(*, vllm_config: VllmConfig, prefix: str = '')

Source code in vllm/model_executor/models/smolvlm.py

def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
    super().__init__(
        vllm_config=vllm_config,
        prefix=prefix,
    )

SmolVLMProcessingInfo ¶

Bases: Idefics3ProcessingInfo

Source code in vllm/model_executor/models/smolvlm.py

class SmolVLMProcessingInfo(Idefics3ProcessingInfo):

    def get_hf_processor(
        self,
        *,
        max_image_size: Optional[dict[str, int]] = None,
        **kwargs: object,
    ) -> SmolVLMProcessor:
        if max_image_size is not None:
            kwargs["max_image_size"] = max_image_size

        return self.ctx.get_hf_processor(SmolVLMProcessor, **kwargs)

    def _get_image_token(
            self, processor: Optional[SmolVLMProcessor]) -> tuple[str, str]:
        if processor is None:
            processor = self.get_hf_processor()
        image_token = processor.image_token
        fake_image_token = processor.fake_image_token
        global_image_token = processor.global_image_token
        return image_token, fake_image_token, global_image_token

_get_image_token ¶

_get_image_token(
    processor: Optional[SmolVLMProcessor],
) -> tuple[str, str]

Source code in vllm/model_executor/models/smolvlm.py

def _get_image_token(
        self, processor: Optional[SmolVLMProcessor]) -> tuple[str, str]:
    if processor is None:
        processor = self.get_hf_processor()
    image_token = processor.image_token
    fake_image_token = processor.fake_image_token
    global_image_token = processor.global_image_token
    return image_token, fake_image_token, global_image_token

get_hf_processor ¶

get_hf_processor(
    *,
    max_image_size: Optional[dict[str, int]] = None,
    **kwargs: object,
) -> SmolVLMProcessor

Source code in vllm/model_executor/models/smolvlm.py

def get_hf_processor(
    self,
    *,
    max_image_size: Optional[dict[str, int]] = None,
    **kwargs: object,
) -> SmolVLMProcessor:
    if max_image_size is not None:
        kwargs["max_image_size"] = max_image_size

    return self.ctx.get_hf_processor(SmolVLMProcessor, **kwargs)

vllm.model_executor.models.smolvlm

SmolVLMForConditionalGeneration ¶

__init__ ¶

SmolVLMProcessingInfo ¶

_get_image_token ¶

get_hf_processor ¶

init ¶