{ "_name_or_path": "/home/yutianyu/Zephyr_checkpoints/SFT_exp/zephyr_mm_12b_SFT-knowledge_v0-caterpillar-stage2_mix#caterpillar-stage3_lvis#caterpillar-stage3_svit#caterpillar-stage3_sharegpt4v#llava#unimm-chat#mme_art500k#google_landmark-train#places_365-train#wit-en-13#22#60#10#16#12#15#10#2#20/checkpionts/checkpoint-4000", "architectures": [ "ZephyrMMForCausalLM" ], "bos_token_id": 1, "eos_token_id": 2, "fully_tune": true, "hidden_act": "silu", "hidden_size": 4096, "image_size": 448, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "mm_use_im_start_end": true, "mm_vision_tower": "eva02_enormous_patch14_clip_224.laion2b_plus", "model_type": "zephyr_mm", "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "num_query": 256, "pad_token_id": 2, "rms_norm_eps": 1e-05, "rope_theta": 10000.0, "sliding_window": 4096, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "transformers_version": "4.35.0", "tune_CLIP": true, "tune_mm_mlp_adapter": false, "use_cache": false, "use_mm_proj": true, "vocab_size": 32009 }