{ "_name_or_path": "openai/whisper-large-v2", "activation_dropout": 0.0, "activation_function": "gelu", "adaptor_activation": "relu", "adaptor_init": "constant", "adaptor_layernorm": true, "apply_spec_augment": false, "architectures": [ "WhisperSLU" ], "attention_dropout": 0.0, "begin_suppress_tokens": [ 220, 50257 ], "bos_token_id": 50257, "classifier_proj_size": 256, "crf_transition_matrix": null, "d_model": 1280, "decoder_attention_heads": 20, "decoder_ffn_dim": 5120, "decoder_layerdrop": 0.0, "decoder_layers": 32, "decoder_start_token_id": 50258, "dropout": 0.0, "encoder_attention_heads": 20, "encoder_ffn_dim": 5120, "encoder_layerdrop": 0.0, "encoder_layers": 32, "eos_token_id": 50257, "forced_decoder_ids": [ [ 1, 50259 ], [ 2, 50359 ], [ 3, 50363 ] ], "init_std": 0.02, "is_encoder_decoder": true, "mask_feature_length": 10, "mask_feature_min_masks": 0, "mask_feature_prob": 0.0, "mask_time_length": 10, "mask_time_min_masks": 2, "mask_time_prob": 0.05, "max_length": 448, "max_source_positions": 1500, "max_target_positions": 448, "median_filter_width": 7, "model_type": "whisper_for_slu", "num_hidden_layers": 32, "num_mel_bins": 80, "pad_token_id": 50257, "scale_embedding": false, "slu_attention_heads": 12, "slu_dropout": 0.0, "slu_embed_dim": 768, "slu_ffn_dim": 2048, "slu_focus": 1.0, "slu_input_from": "decoder", "slu_input_layers": [ 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31 ], "slu_labels": [ "O", "B-cardinal number", "B-date", "I-date", "B-person", "I-person", "B-group", "B-geopolitical area", "I-geopolitical area", "B-law", "I-law", "B-organization", "I-organization", "B-percent", "I-percent", "B-ordinal number", "B-money", "I-money", "B-work of art", "I-work of art", "B-facility", "B-time", "I-cardinal number", "B-location", "B-quantity", "I-quantity", "I-group", "I-location", "B-product", "I-time", "B-event", "I-event", "I-facility", "B-language", "I-product", "I-ordinal number", "I-language" ], "slu_layers": 2, "slu_max_positions": null, "slu_output_dim": 37, "slu_pad_token_id": 1, "slu_start_token_id": 36, "slu_task": "named_entity_recognition", "slu_weight": 0.1, "special_token_ids": [ 50257, 50258, 50259, 50260, 50261, 50262, 50263, 50264, 50265, 50266, 50267, 50268, 50269, 50270, 50271, 50272, 50273, 50274, 50275, 50276, 50277, 50278, 50279, 50280, 50281, 50282, 50283, 50284, 50285, 50286, 50287, 50288, 50289, 50290, 50291, 50292, 50293, 50294, 50295, 50296, 50297, 50298, 50299, 50300, 50301, 50302, 50303, 50304, 50305, 50306, 50307, 50308, 50309, 50310, 50311, 50312, 50313, 50314, 50315, 50316, 50317, 50318, 50319, 50320, 50321, 50322, 50323, 50324, 50325, 50326, 50327, 50328, 50329, 50330, 50331, 50332, 50333, 50334, 50335, 50336, 50337, 50338, 50339, 50340, 50341, 50342, 50343, 50344, 50345, 50346, 50347, 50348, 50349, 50350, 50351, 50352, 50353, 50354, 50355, 50356, 50357, 50358, 50359, 50360, 50361, 50362, 50363 ], "task": "token_classification", "teacher": null, "torch_dtype": "float32", "transformers_version": "4.37.0.dev0", "use_cache": true, "use_crf": false, "use_weighted_layer_sum": false, "vocab_size": 51865 }