Skip to content

vllm_omni.transformers_utils.configs.mammoth_moda2

Mammothmoda2Config

Bases: PretrainedConfig

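Top-level composition configuration for MammothModa2. It combines the LLM sub-configuration (`llm_config`) with the generation-side settings (the `gen_*` attributes listed below).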

architectures instance-attribute

architectures = ['Mammothmoda2Model']

gen_axes_dim_rope instance-attribute

gen_axes_dim_rope = gen_axes_dim_rope or [40, 40, 40]

gen_axes_lens instance-attribute

gen_axes_lens = gen_axes_lens or [10000, 10000, 10000]

gen_condition_mode instance-attribute

gen_condition_mode = gen_condition_mode

gen_dit_config instance-attribute

gen_dit_config = gen_dit_config

gen_image_condition_refiner_config instance-attribute

gen_image_condition_refiner_config = (
    gen_image_condition_refiner_config
)

gen_transport_config instance-attribute

gen_transport_config = gen_transport_config or {}

gen_vae_config instance-attribute

gen_vae_config = gen_vae_config

image_token_id property

image_token_id: int

initializer_range instance-attribute

initializer_range = initializer_range

is_composition class-attribute instance-attribute

is_composition = True

llm_config instance-attribute

llm_config = (
    for_model(**llm_config)
    if llm_config is not None
    else None
)

model_type class-attribute instance-attribute

model_type = 'mammothmoda2'

sub_configs class-attribute instance-attribute

sub_configs: ClassVar = {'llm_config': AutoConfig}

tokenizer_class instance-attribute

tokenizer_class = 'MammothUTokenizer'

video_token_id property

video_token_id: int

vision_config property

vision_config

vision_end_token_id property

vision_end_token_id: int

vision_start_token_id property

vision_start_token_id: int

get_text_config

get_text_config(decoder: bool = False) -> PretrainedConfig

Mammothmoda2Qwen2_5_VLConfig

Bases: Qwen2_5_VLConfig

Combined configuration: text_config + vision_config.

extra_gen_vocab instance-attribute

extra_gen_vocab = getattr(
    text_config, "extra_gen_vocab", extra_gen_vocab
)

gen_vocab_size instance-attribute

gen_vocab_size = getattr(
    text_config, "gen_vocab_size", gen_vocab_size
)

gen_vocab_start_index instance-attribute

gen_vocab_start_index = getattr(
    text_config,
    "gen_vocab_start_index",
    gen_vocab_start_index,
)

image_token_id instance-attribute

image_token_id = image_token_id

keys_to_ignore_at_inference class-attribute instance-attribute

keys_to_ignore_at_inference = ['past_key_values']

model_type class-attribute instance-attribute

model_type = 'mammothmoda2_qwen2_5_vl'

moe_type instance-attribute

moe_type = getattr(text_config, 'moe_type', moe_type)

sub_configs class-attribute instance-attribute

sub_configs = {
    "vision_config": Mammothmoda2Qwen2_5_VLVisionConfig,
    "text_config": Mammothmoda2Qwen2_5_VLTextConfig,
}

text_config instance-attribute

text_config = text_config

tokenizer_class instance-attribute

tokenizer_class = 'MammothUTokenizer'

video_token_id instance-attribute

video_token_id = video_token_id

vision_config instance-attribute

vision_config = vision_config

Mammothmoda2Qwen2_5_VLTextConfig

Bases: Qwen2_5_VLTextConfig

base_config_key class-attribute instance-attribute

base_config_key = 'text_config'

base_model_pp_plan class-attribute instance-attribute

base_model_pp_plan = base_model_pp_plan

base_model_tp_plan class-attribute instance-attribute

base_model_tp_plan = base_model_tp_plan

extra_gen_vocab instance-attribute

extra_gen_vocab = extra_gen_vocab

gen_vocab_size instance-attribute

gen_vocab_size = gen_vocab_size

gen_vocab_start_index instance-attribute

gen_vocab_start_index = (
    vocab_size
    if extra_gen_vocab
    else vocab_size - gen_vocab_size
)

image_token_id instance-attribute

image_token_id = image_token_id

keys_to_ignore_at_inference class-attribute instance-attribute

keys_to_ignore_at_inference = ['past_key_values']

model_type class-attribute instance-attribute

model_type = 'mammothmoda2_qwen2_5_vl_text'

moe_type instance-attribute

moe_type = moe_type

video_token_id instance-attribute

video_token_id = video_token_id

vocab_size instance-attribute

vocab_size = int(gen_vocab_start_index) + int(
    gen_vocab_size
)

Mammothmoda2Qwen2_5_VLVisionConfig

Bases: Qwen2_5_VLVisionConfig

base_config_key class-attribute instance-attribute

base_config_key = 'vision_config'

model_type class-attribute instance-attribute

model_type = 'mammothmoda2_qwen2_5_vl_vision'