{
  "emb_size": 768,
  "feedforward_size": 3072,
  "hidden_size": 768,
  "hidden_act": "relu",
  "heads_num": 12,
  "layers_num": 12,
  "decoder_layers_num": 12,
  "dropout": 0.1,
  "data_processor": "t5",
  "embedding": ["word"],
  "relative_position_embedding": true,
  "remove_embedding_layernorm": true,
  "tgt_embedding": ["word"],
  "share_embedding": true,
  "encoder": "transformer",
  "mask": "fully_visible",
  "layernorm_positioning": "pre",
  "remove_attention_scale": true,
  "layernorm": "t5",
  "remove_transformer_bias": true,
  "decoder": "transformer",
  "target": ["lm"],
  "tie_weights": true
}