from typing import List, Dict, Union, Optional from abc import ABC, abstractmethod from transformers import PretrainedConfig, AutoConfig, AutoModel # Model Constants IGNORE_ID = -100 IMAGE_TOKEN_ID = -200 VIDEO_TOKEN_ID = -201 IMAGE_TOKEN = "" VIDEO_TOKEN = "