ghatgetanuj
/

funnel-transformer-xlarge_cls_SentEval-CR

Text Classification

Generated from Trainer

Inference Endpoints

Model card Files Files and versions Metrics Training metrics Community

funnel-transformer-xlarge_cls_SentEval-CR / config.json

ghatgetanuj's picture

Training in progress, epoch 1

f87d580 almost 2 years ago

885 Bytes

	{
	"_name_or_path": "funnel-transformer/xlarge",
	"activation_dropout": 0.0,
	"architectures": [
	"FunnelForSequenceClassification"
	],
	"attention_dropout": 0.1,
	"attention_type": "relative_shift",
	"block_repeats": [
	1,
	1,
	1
	],
	"block_sizes": [
	10,
	10,
	10
	],
	"d_head": 64,
	"d_inner": 4096,
	"d_model": 1024,
	"hidden_act": "gelu_new",
	"hidden_dropout": 0.1,
	"initializer_range": 0.1,
	"initializer_std": null,
	"layer_norm_eps": 1e-09,
	"max_position_embeddings": 512,
	"model_type": "funnel",
	"n_head": 16,
	"num_decoder_layers": 2,
	"pool_q_only": true,
	"pooling_type": "mean",
	"problem_type": "single_label_classification",
	"rel_attn_type": "factorized",
	"separate_cls": true,
	"torch_dtype": "float32",
	"transformers_version": "4.25.1",
	"truncate_seq": true,
	"type_vocab_size": 3,
	"vocab_size": 30522
	}