Upload folder using huggingface_hub (#1)

- 74f06ce4d28f33f7ff5734a62782fb3d252bb8282c61c21e43b366ee2e13287e (7af55dab05cf8a00c778e9ed9305f9069183fe3d)
- a3eaa8383591407c7a8e2526dc497b72b0a04cc47db30c683e33ba12c5f3a59b (41722a0d3e4558c4c7b7c20fb88d1158dbabb5aa)
- 41dc4850fdcdb408ec02a57a49956ad29c9f975a58ad2b31889675df3a6f4351 (e39b3ba7cc27e581a7cf80738b80b38ee055c8e7)
- 7c7049194f4b33b759ac63132321453ab058494044f4bd5700bfcd4fd8b99893 (2c04dcb71924b5c1cd4645e3ac1c39503e91318d)
- b248dae40a37523d369d2d7ac728f989902e1c48ef46a8832e815b21dc7eb26a (fb97cc26c15631b1fbb5186908bee13c60f43435)
- 4c410ac06199807ff1591397a08bb5dc8c9f21ed00d6ad6020aa9b8364570675 (fb8aeb0b9642a450dbaddb11db24772d7e0a591c)
- 7a63921612d63e57be9fe3786424c3513c1b63bfbb4f115632a199d672a9d5f4 (5ac117216c4ce1d079815512c2d2731e1b512fd2)
- 2e1b9784ba5d6632ade68239420a0fe426e841d93f9adf7fb070ddc715939b91 (9c58e46f7acdbfbfb48d186f98681917ad1f2d03)

Files changed (15) hide show

README.md +102 -0
config.json +32 -0
merges.txt +0 -0
model-00001-of-00007.safetensors +3 -0
model-00002-of-00007.safetensors +3 -0
model-00003-of-00007.safetensors +3 -0
model-00004-of-00007.safetensors +3 -0
model-00005-of-00007.safetensors +3 -0
model-00006-of-00007.safetensors +3 -0
model-00007-of-00007.safetensors +3 -0
model.safetensors.index.json +0 -0
special_tokens_map.json +51 -0
tokenizer.json +0 -0
tokenizer_config.json +188 -0
vocab.json +0 -0

README.md ADDED Viewed

	@@ -0,0 +1,102 @@

+---
+license: apache-2.0
+library_name: transformers
+tags:
+- code
+- granite
+- mlx
+base_model: ibm-granite/granite-34b-code-base
+datasets:
+- bigcode/commitpackft
+- TIGER-Lab/MathInstruct
+- meta-math/MetaMathQA
+- glaiveai/glaive-code-assistant-v3
+- glaiveai/glaive-function-calling-v2
+- bugdaryan/sql-create-context-instruction
+- garage-bAInd/Open-Platypus
+- nvidia/HelpSteer
+metrics:
+- code_eval
+pipeline_tag: text-generation
+inference: true
+model-index:
+- name: granite-34b-code-instruct
+  results:
+  - task:
+      type: text-generation
+    dataset:
+      name: HumanEvalSynthesis(Python)
+      type: bigcode/humanevalpack
+    metrics:
+    - type: pass@1
+      value: 62.2
+      name: pass@1
+    - type: pass@1
+      value: 56.7
+      name: pass@1
+    - type: pass@1
+      value: 62.8
+      name: pass@1
+    - type: pass@1
+      value: 47.6
+      name: pass@1
+    - type: pass@1
+      value: 57.9
+      name: pass@1
+    - type: pass@1
+      value: 41.5
+      name: pass@1
+    - type: pass@1
+      value: 53.0
+      name: pass@1
+    - type: pass@1
+      value: 45.1
+      name: pass@1
+    - type: pass@1
+      value: 50.6
+      name: pass@1
+    - type: pass@1
+      value: 36.0
+      name: pass@1
+    - type: pass@1
+      value: 42.7
+      name: pass@1
+    - type: pass@1
+      value: 23.8
+      name: pass@1
+    - type: pass@1
+      value: 54.9
+      name: pass@1
+    - type: pass@1
+      value: 47.6
+      name: pass@1
+    - type: pass@1
+      value: 55.5
+      name: pass@1
+    - type: pass@1
+      value: 51.2
+      name: pass@1
+    - type: pass@1
+      value: 47.0
+      name: pass@1
+    - type: pass@1
+      value: 45.1
+      name: pass@1
+---
+# mlx-community/granite-34b-code-instruct-8bit
+The model [mlx-community/granite-34b-code-instruct-8bit](https://huggingface.co/mlx-community/granite-34b-code-instruct-8bit) was converted to MLX format from [ibm-granite/granite-34b-code-instruct](https://huggingface.co/ibm-granite/granite-34b-code-instruct) using mlx-lm version **0.13.0**.
+## Use with mlx
+```bash
+pip install mlx-lm
+```
+```python
+from mlx_lm import load, generate
+model, tokenizer = load("mlx-community/granite-34b-code-instruct-8bit")
+response = generate(model, tokenizer, prompt="hello", verbose=True)
+```

config.json ADDED Viewed

	@@ -0,0 +1,32 @@

+{
+    "activation_function": "gelu_pytorch_tanh",
+    "architectures": [
+        "GPTBigCodeForCausalLM"
+    ],
+    "attention_softmax_in_fp32": true,
+    "attn_pdrop": 0.1,
+    "bos_token_id": 0,
+    "embd_pdrop": 0.1,
+    "eos_token_id": 0,
+    "initializer_range": 0.02,
+    "layer_norm_epsilon": 1e-05,
+    "model_type": "gpt_bigcode",
+    "multi_query": true,
+    "n_embd": 6144,
+    "n_head": 48,
+    "n_inner": 24576,
+    "n_layer": 88,
+    "n_positions": 8192,
+    "pad_token_id": 0,
+    "quantization": {
+        "group_size": 64,
+        "bits": 8
+    },
+    "resid_pdrop": 0.1,
+    "scale_attention_softmax_in_fp32": true,
+    "scale_attn_weights": true,
+    "torch_dtype": "bfloat16",
+    "transformers_version": "4.41.0.dev0",
+    "use_cache": true,
+    "vocab_size": 49152
+}

merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

model-00001-of-00007.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a095cd0844cd528542404318e9555417a0e09c022714e67f7de88233f66bdd3b
+size 5290926981

model-00002-of-00007.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d898b7cc6a54b87563f8fa8fde4dfc0ba9d3597a5deff4978e8c632bd0eeeeb2
+size 5237561094

model-00003-of-00007.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5491498cfda12fc9415b1d4938518ad46ce0c07a4916f133b60b644033fb727c
+size 5237561096

model-00004-of-00007.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e025e55ff46ad16a3c983df37e9214d8f65ed082d32fab5d3bcce04d09b46160
+size 5237561110

model-00005-of-00007.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cb5702004b8cc1cd134c9b889599544a6fb666f8ef893bb4c5924bef1317b06a
+size 5237561094

model-00006-of-00007.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3f50fcfb036cb22ca279fe36c2a22c9dfcbd30027d61406c7bc2205cd37a7dc9
+size 5237561032

model-00007-of-00007.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:03932f6dfe82a8e6813243c3a7ab975d176c9be2f1d34aa197ef23c79704d519
+size 4349894014

model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,51 @@

+{
+  "additional_special_tokens": [
+    "<|endoftext|>",
+    "<fim_prefix>",
+    "<fim_middle>",
+    "<fim_suffix>",
+    "<fim_pad>",
+    "<filename>",
+    "<gh_stars>",
+    "<issue_start>",
+    "<issue_comment>",
+    "<issue_closed>",
+    "<jupyter_start>",
+    "<jupyter_text>",
+    "<jupyter_code>",
+    "<jupyter_output>",
+    "<empty_output>",
+    "<commit_before>",
+    "<commit_msg>",
+    "<commit_after>",
+    "<reponame>"
+  ],
+  "bos_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,188 @@

+{
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<fim_prefix>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "<fim_middle>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "<fim_suffix>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "4": {
+      "content": "<fim_pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "5": {
+      "content": "<filename>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "6": {
+      "content": "<gh_stars>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "7": {
+      "content": "<issue_start>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "8": {
+      "content": "<issue_comment>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "9": {
+      "content": "<issue_closed>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "10": {
+      "content": "<jupyter_start>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "11": {
+      "content": "<jupyter_text>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "12": {
+      "content": "<jupyter_code>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "13": {
+      "content": "<jupyter_output>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "14": {
+      "content": "<empty_output>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "15": {
+      "content": "<commit_before>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "16": {
+      "content": "<commit_msg>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "17": {
+      "content": "<commit_after>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "18": {
+      "content": "<reponame>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "additional_special_tokens": [
+    "<|endoftext|>",
+    "<fim_prefix>",
+    "<fim_middle>",
+    "<fim_suffix>",
+    "<fim_pad>",
+    "<filename>",
+    "<gh_stars>",
+    "<issue_start>",
+    "<issue_comment>",
+    "<issue_closed>",
+    "<jupyter_start>",
+    "<jupyter_text>",
+    "<jupyter_code>",
+    "<jupyter_output>",
+    "<empty_output>",
+    "<commit_before>",
+    "<commit_msg>",
+    "<commit_after>",
+    "<reponame>"
+  ],
+  "bos_token": "<|endoftext|>",
+  "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n{{ 'Question:\n' + message['content'] + '\n\n' }}{% elif message['role'] == 'system' %}\n{{ 'System:\n' + message['content'] + '\n\n' }}{% elif message['role'] == 'assistant' %}{{ 'Answer:\n'  + message['content'] + '\n\n' }}{% endif %}\n{% if loop.last and add_generation_prompt %}\n{{ 'Answer:\n' }}{% endif %}{% endfor %}",
+  "clean_up_tokenization_spaces": true,
+  "eos_token": "<|endoftext|>",
+  "model_max_length": 9223372036854775807,
+  "pad_token": "<|endoftext|>",
+  "padding_side": "left",
+  "tokenizer_class": "GPT2Tokenizer",
+  "unk_token": "<|endoftext|>",
+  "vocab_size": 49152
+}

vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff