End of training

Files changed (6) hide show

README.md CHANGED Viewed

@@ -27,17 +27,17 @@ print(output["generated_text"])
 ## Training procedure
-[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/yvonnehe499-northeastern-university/huggingface/runs/impjt14h)
 This model was trained with DPO, a method introduced in [Direct Preference Optimization: Your Language Model is Secretly a Reward Model](https://huggingface.co/papers/2305.18290).
 ### Framework versions
-- TRL: 0.13.0.dev0
-- Transformers: 4.47.0
 - Pytorch: 2.5.1+cu121
 - Datasets: 3.1.0
-- Tokenizers: 0.21.0
 ## Citations

 ## Training procedure
+[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/yvonnehe499-northeastern-university/huggingface/runs/8mbpb626)
 This model was trained with DPO, a method introduced in [Direct Preference Optimization: Your Language Model is Secretly a Reward Model](https://huggingface.co/papers/2305.18290).
 ### Framework versions
+- TRL: 0.12.1
+- Transformers: 4.46.3
 - Pytorch: 2.5.1+cu121
 - Datasets: 3.1.0
+- Tokenizers: 0.20.3
 ## Citations

adapter_config.json CHANGED Viewed

@@ -20,8 +20,8 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "q_proj",
-    "v_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "v_proj",
+    "q_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ae315c9fb313b4e3151fd83a20a10e3434ec0aea85575941f88e1058a3943af7
 size 6824216

 version https://git-lfs.github.com/spec/v1
+oid sha256:4a896621a21eb9b27db486ea609e28c7968ab287d04930bfed20d951be6cfc49
 size 6824216

runs/Dec06_04-43-54_83b1d48b5f83/events.out.tfevents.1733460235.83b1d48b5f83.1849.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:e100ce4df6923c4fdb5e532771b2b96ffa2553de4d7bcf4534f8bf9bb5c54895
+size 6448

tokenizer_config.json CHANGED Viewed

@@ -2052,7 +2052,6 @@
   "bos_token": "<|begin_of_text|>",
   "clean_up_tokenization_spaces": true,
   "eos_token": "<|end_of_text|>",
-  "extra_special_tokens": {},
   "model_input_names": [
     "input_ids",
     "attention_mask"

   "bos_token": "<|begin_of_text|>",
   "clean_up_tokenization_spaces": true,
   "eos_token": "<|end_of_text|>",
   "model_input_names": [
     "input_ids",
     "attention_mask"

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2fbdcf3984e519c8dc1390c2cf674818daba5ea7821e3e1acfe51acc5adad7c2
-size 6200

 version https://git-lfs.github.com/spec/v1
+oid sha256:34a23d8d192ab938a92f27c4916e0ce8e9f392d36a021b5d94063fd39e045159
+size 6072