{
  "architectures": [
    "DreamLLMForCausalMLM"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "bos_token_id": 151643,
  "diffusion_bs": 0,
  "eos_token_id": 151645,
  "hidden_act": "silu",
  "hidden_size": 3584,
  "initializer_range": 0.02,
  "intermediate_size": 18944,
  "log_attentions": false,
  "log_hidden_states": false,
  "loss_scale_schedule": "none",
  "loss_weight_lm": 1.0,
  "loss_weight_vm": 10.0,
  "max_position_embeddings": 4096,
  "max_window_layers": 28,
  "model_type": "dreamllm",
  "num_attention_heads": 28,
  "num_hidden_layers": 28,
  "num_key_value_heads": 4,
  "plugins_init_kwargs": {
    "dream_embedding": {
      "_target_": "omni.models.dreamllm_qwen2.modeling_plugins.DreamEmbedding",
      "embed_hidden_size": 3584,
      "freeze_dream_queries": false,
      "num_dream_queries": 256,
      "pretrained_model_name_or_path": "none"
    },
    "stable_diffusion_head": {
      "_target_": "omni.models.dreamllm_qwen2.modeling_plugins.StableDiffusion3Head",
      "diffusion_name_or_path": "stabilityai/stable-diffusion-3.5-medium",
      "embed_hidden_size": 3584,
      "freeze_projector": false,
      "freeze_transformer": true,
      "freeze_vae": true,
      "local_files_only": false,
      "pretrained_model_name_or_path": "none",
      "projector_depth": 1,
      "projector_type": "linear",
      "random_flip": false,
      "resolution": 512
    },
    "vision_encoder": {
      "_target_": "omni.models.dreamllm_qwen2.modeling_plugins.InternViTEmbedding",
      "embed_hidden_size": 3584,
      "freeze_embedding_layers": true,
      "freeze_intern_vit_model": true,
      "freeze_projector": false,
      "intern_vit_model_name_or_path": "OpenGVLab/InternViT-300M-448px-V2_5",
      "local_files_only": false,
      "pretrained_model_name_or_path": "none",
      "projector_depth": 2,
      "projector_type": "mlp",
      "select_layer": -1
    }
  },
  "plugins_type": {
    "dream_embedding": "embedding",
    "stable_diffusion_head": "head",
    "vision_encoder": "embedding"
  },
  "pretraining_tp": 1,
  "rms_norm_eps": 1e-06,
  "rope_scaling": null,
  "rope_theta": 1000000.0,
  "sliding_window": null,
  "special_tokens2ids_dict": {
    "<|endoftext|>": 151643,
    "<|im_end|>": 151645,
    "<|im_start|>": 151644,
    "additional_special_tokens": {
      "<dream>": 151666,
      "<dream_end>": 151668,
      "<dream_start>": 151667,
      "<image>": 151665,
      "<|image_pad|>": 151655,
      "<|vision_end|>": 151653,
      "<|vision_start|>": 151652
    }
  },
  "tie_word_embeddings": false,
  "torch_dtype": "bfloat16",
  "transformers_version": "4.46.1",
  "use_cache": true,
  "use_sliding_window": false,
  "vocab_size": 152064
}