from transformers import (
    AutoConfig,
    AutoModelForCausalLM,
    PreTrainedModel,
    Qwen2_5OmniThinkerForConditionalGeneration,
)
from transformers.utils import logging
logger = logging.get_logger(__name__) | |
class AudioOnlyThinker(Qwen2_5OmniThinkerForConditionalGeneration):
    """Variant of the Qwen2.5-Omni thinker with its vision inputs disabled.

    After the parent constructor runs, the ``visual`` attribute is replaced
    with ``None`` and ``vision_config`` is removed from the model config.
    ``forward`` always hands ``None`` to the parent for both pixel inputs.
    """

    def __init__(self, config):
        """Build the parent model, then drop its ``visual`` attribute.

        Args:
            config: Configuration object forwarded unchanged to the parent
                constructor.
        """
        super().__init__(config)
        # Discard whatever the parent stored under ``visual``.
        self.visual = None
        # NOTE(review): this mutates the config object the caller passed in
        # (presumably the same object as ``self.config``); code that later
        # expects ``config.vision_config`` to exist will fail - confirm that
        # this is intended.
        if hasattr(self.config, "vision_config"):
            del self.config.vision_config

    def forward(self, *args, pixel_values=None, pixel_values_videos=None, **kwargs):
        """Run the parent forward pass with image and video inputs forced off.

        Args:
            *args: Positional arguments passed through to the parent.
            pixel_values: Accepted for signature compatibility; ignored.
            pixel_values_videos: Accepted for signature compatibility; ignored.
            **kwargs: Keyword arguments passed through to the parent.

        Returns:
            Whatever the parent ``forward`` returns.
        """
        if pixel_values is not None or pixel_values_videos is not None:
            # Tell the caller once, instead of silently dropping their input.
            logger.warning_once(
                "AudioOnlyThinker ignores `pixel_values` and `pixel_values_videos`; "
                "the supplied vision inputs were discarded."
            )
        return super().forward(*args, pixel_values=None, pixel_values_videos=None, **kwargs)