import json import random import logging import re import time import itertools from dataclasses import dataclass, field from typing import Dict, Optional, Sequence, List, Tuple, Any from collections.abc import Sequence from pathlib import Path import numpy as np import torch from torch.utils.data import Dataset import transformers from . import data_list from .rope2d import get_rope_index_25, get_rope_index_2, get_rope_index_3 IGNORE_INDEX = -100 IMAGE_TOKEN_INDEX = 151655 VIDEO_TOKEN_INDEX = 151656 DEFAULT_IMAGE_TOKEN = "" DEFAULT_VIDEO_TOKEN = "