[model] support MiniCPM-o-4.5 (#10163)

Co-authored-by: Yaowei Zheng <hiyouga@buaa.edu.cn>
This commit is contained in:
Hertz
2026-02-04 23:21:27 +08:00
committed by GitHub
parent 1a02717fa8
commit 8bedfafa4e
7 changed files with 22 additions and 18 deletions

View File

@@ -27,7 +27,7 @@ Including:
import os
from collections.abc import Callable
from contextlib import contextmanager
from enum import Enum, unique
from enum import StrEnum, unique
from functools import lru_cache, wraps
from typing import Optional
@@ -39,7 +39,7 @@ from ..utils.types import ProcessGroup, Tensor, TensorLike
@unique
class DeviceType(str, Enum):
class DeviceType(StrEnum):
CPU = "cpu"
CUDA = "cuda"
META = "meta"
@@ -49,7 +49,7 @@ class DeviceType(str, Enum):
@unique
class ReduceOp(str, Enum):
class ReduceOp(StrEnum):
SUM = "sum"
MEAN = "mean"
MAX = "max"

View File

@@ -28,7 +28,7 @@ And data parallelism types:
from dataclasses import dataclass
from datetime import timedelta
from enum import Enum
from enum import StrEnum
from typing import Any, Optional
from torch.distributed import barrier, destroy_process_group, init_process_group
@@ -42,7 +42,7 @@ from . import helper
logger = logging.get_logger(__name__)
class Dim(str, Enum):
class Dim(StrEnum):
"""Dimension names."""
MP_REPLICATE = "mp_replicate"