mahimairaja/tweet-summarization-llama-2-finetuned

Text Generation

Generated from Trainer

text-generation-inference

Inference Endpoints

Model card | Files and versions | Community

mahimairaja committed on Sep 7, 2023

Commit

1625e80

·

1 Parent(s): 9391d28

Update config.json

Files changed (1) hide show

config.json +9 -23

config.json CHANGED Viewed

@@ -1,21 +1,6 @@
-{'vocab_size': 32000,
- 'max_position_embeddings': 4096,
- 'hidden_size': 4096,
- 'intermediate_size': 11008,
- 'num_hidden_layers': 32,
- 'num_attention_heads': 32,
- 'num_key_value_heads': 32,
- 'hidden_act': 'silu',
- 'initializer_range': 0.02,
- 'rms_norm_eps': 1e-05,
- 'pretraining_tp': 1,
- 'use_cache': False,
- 'rope_scaling': None,
- 'return_dict': True,
- 'output_hidden_states': False,
- 'output_attentions': False,
  'torchscript': False,
- 'torch_dtype': 'float16',
  'use_bfloat16': False,
  'tf_legacy_loss': False,
  'pruned_heads': {},
@@ -51,10 +36,10 @@
  'exponential_decay_length_penalty': None,
  'suppress_tokens': None,
  'begin_suppress_tokens': None,
- 'architectures': ['LlamaForCausalLM'],
  'finetuning_task': None,
- 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'},
- 'label2id': {'LABEL_0': 0, 'LABEL_1': 1},
  'tokenizer_class': None,
  'prefix': None,
  'bos_token_id': 1,
@@ -64,9 +49,9 @@
  'decoder_start_token_id': None,
  'task_specific_params': None,
  'problem_type': None,
- '_name_or_path': 'mahimairaja/tweet-summarization-llama-2-finetuned',
  'transformers_version': '4.32.1',
- 'model_type': 'llama',
  'quantization_config': {'quant_method': <QuantizationMethod.BITS_AND_BYTES: 'bitsandbytes'>,
   'load_in_8bit': False,
   'load_in_4bit': True,
@@ -76,4 +61,5 @@
   'llm_int8_has_fp16_weight': False,
   'bnb_4bit_quant_type': 'nf4',
   'bnb_4bit_use_double_quant': False,
-  'bnb_4bit_compute_dtype': 'float16'}}

+{
  'torchscript': False,
+ 'torch_dtype': "float16",
  'use_bfloat16': False,
  'tf_legacy_loss': False,
  'pruned_heads': {},
  'exponential_decay_length_penalty': None,
  'suppress_tokens': None,
  'begin_suppress_tokens': None,
+ 'architectures': ["LlamaForCausalLM"],
  'finetuning_task': None,
+ 'id2label': {0: "LABEL_0", 1: "LABEL_1"},
+ 'label2id': {"LABEL_0": 0, "LABEL_1": 1},
  'tokenizer_class': None,
  'prefix': None,
  'bos_token_id': 1,
  'decoder_start_token_id': None,
  'task_specific_params': None,
  'problem_type': None,
+ '_name_or_path': "mahimairaja/tweet-summarization-llama-2-finetuned",
  'transformers_version': '4.32.1',
+ 'model_type': "llama",
  'quantization_config': {'quant_method': <QuantizationMethod.BITS_AND_BYTES: 'bitsandbytes'>,
   'load_in_8bit': False,
   'load_in_4bit': True,
   'llm_int8_has_fp16_weight': False,
   'bnb_4bit_quant_type': 'nf4',
   'bnb_4bit_use_double_quant': False,
+  'bnb_4bit_compute_dtype': 'float16'}}
+}