llm-human-feedback-collector-chat-interface-dpo

Sleeping

App Files Files Community

davidberenstein1957 HF staff committed on Jul 25

Commit

2c31d1f

•

1 Parent(s): a2a6071

Update human feedback collector interface

Browse files

Files changed (3) hide show

README.md +3 -0
app.py +10 -2
chat_interface_preference.py +4 -5

README.md CHANGED Viewed

@@ -13,3 +13,6 @@ short_description: LLM, chatbot, human-feedback
 ---
 Check out the configuration reference at <https://huggingface.co/docs/hub/spaces-config-reference>

 ---
 Check out the configuration reference at <https://huggingface.co/docs/hub/spaces-config-reference>
+> [!WARNING]
+> This is a warning message. Be cautious when proceeding.

app.py CHANGED Viewed

@@ -120,8 +120,16 @@ chat_interface = ChatInterface(
         ["What are great things cook when getting started with Asian cooking?"],
         ["Who was Anthony Bourdain?"],
     ],
-    title="💪🏽🦾 LLM human-feedback collector ChatInterface (DPO) 🦾💪🏽",
-    description="""This is an adaptation of the gr.ChatInferface which allows for human feedback collection for SFT, DPO and KTO.""",
 )
 with gr.Blocks(css="style.css") as demo:

         ["What are great things cook when getting started with Asian cooking?"],
         ["Who was Anthony Bourdain?"],
     ],
+    title="💪🏽🦾 Human Feedback Collector | Meta-Llama-3.1-8B-Instruct | (DPO) 🦾💪🏽",
+    description="".join(
+        [
+            "This is an adaptation of the [`gr.ChatInferface`](https://www.gradio.app/docs/gradio/chatinterface) and [`huggingface_hub.CommitScheduler`](https://huggingface.co/docs/huggingface_hub/main/en/package_reference/hf_api#huggingface_hub.CommitScheduler) which allows for human feedback collection. ",
+            "Another cool tool for capturing Gradio interactions is the [`gr.HuggingFaceDatasetSaver`](https://www.gradio.app/guides/using-flagging#the-hugging-face-dataset-saver-callback). ",
+            "This demo shows how you might capture human feedback directly from applications within Gradio. ",
+            "The captured feedback can directly be used for fine-tuning LLMs within framework like [transformers](https://github.com/huggingface/transformers), [TRL](https://github.com/huggingface/trl) or [AutoTrain](https://huggingface.co/autotrain), ",
+            "however, it might benefit from additional data curation with something like [Argilla](https://github.com/argilla-io/argilla/) for human feedback and/or [distilabel](https://github.com/argilla-io/distilabel/) for AI feedback. Argilla can even be [deployed for free on Hugging Face Spaces](https://argilla-io.github.io/argilla/latest/getting_started/huggingface-spaces/).",
+        ]
+    ),
 )
 with gr.Blocks(css="style.css") as demo:

chat_interface_preference.py CHANGED Viewed

@@ -219,14 +219,13 @@ class ChatInterface(Blocks):
         with self:
             if title:
                 Markdown(f"<h1 style='text-align: center; margin-bottom: 1rem'>{self.title}</h1>")
-            if description:
-                Markdown(description)
             if self.commit_scheduler:
                 Markdown(
-                    f"## Data is being logged to a datset on the hub: [{self.commit_scheduler.repo_id}](https://huggingface.co/datasets/{self.commit_scheduler.repo_id})"
                 )
-                Markdown(f"### Techniques: {self.prefence_techniques}")
-                Markdown(f"### MIN TURNS: {self.min_turns} - MAX TURN: {self.max_turns}")
             if chatbot:
                 self.chatbot = chatbot.render()
             else:

         with self:
             if title:
                 Markdown(f"<h1 style='text-align: center; margin-bottom: 1rem'>{self.title}</h1>")
             if self.commit_scheduler:
                 Markdown(
+                    f'<center><h2>Data is being logged to <a href="https://huggingface.co/datasets/{self.commit_scheduler.repo_id}">a dataset on the Hugging Face Hub</a></h2></center>'
                 )
+            if description:
+                Markdown(description)
             if chatbot:
                 self.chatbot = chatbot.render()
             else: