{ "architectures": [ "UltravoxModel" ], "audio_model_id": "kotoba-tech/kotoba-whisper-v2.2", "audio_model_lora_config": { "lora_alpha": 8, "r": 0, "target_modules": [ "k_proj", "q_proj", "linear_k", "linear_q" ] }, "auto_map": { "AutoConfig": "ultravox_config.UltravoxConfig", "AutoModel": "ultravox_model.UltravoxModel", "AutoProcessor": "ultravox_processing.UltravoxProcessor" }, "hidden_size": 4096, "ignore_index": -100, "initializer_range": 0.02, "model_type": "ultravox", "norm_init": 0.4, "pad_token_id": 1, "projector_act": "swiglu", "stack_factor": 8, "text_model_id": "google/gemma-2-2b-jpn-it", "text_model_lora_config": { "lora_alpha": 8, "r": 0, "target_modules": [ "k_proj", "q_proj", "linear_k", "linear_q" ] }, "torch_dtype": "bfloat16", "transformers_version": "4.44.0", "vocab_size": 256000 }