import transformers from torch.cuda.amp import autocast, GradScaler from datasets import REFAVS from configs import args from torch.utils.data import DataLoader from functools import partial from models.llava import conversation as conversation_lib # from models.avs_model import VISAForCausalLM from models.avs_model import Simtoken_ForCausalLM import torch from torch.cuda import amp from transformers import AutoConfig from peft import LoraConfig, get_peft_model from torch import optim from torch.optim import AdamW from transformers import get_cosine_schedule_with_warmup from tqdm import tqdm from utils import utility import random import numpy as np import re import time import os from PIL import Image import warnings from utils.metric.utility import mask_iou warnings.filterwarnings("ignore") from transformers import logging logging.set_verbosity_error() IGNORE_INDEX = -100 IMAGE_TOKEN_INDEX = -200 DEFAULT_IMAGE_TOKEN = "" DEFAULT_IMAGE_PATCH_TOKEN = "" DEFAULT_IM_START_TOKEN = "" DEFAULT_IM_END_TOKEN = "" DEFAULT_VIDEO_TOKEN = "