Spaces:

mimifuel2018
/

Qwen2.5-72B

Running

App Files Community

mimifuel2018 committed 11 days ago

Commit

c126a1f

•

1 Parent(s): 6436fcc

Update app.py

Browse files

Files changed (1) hide show

app.py +33 -15

app.py CHANGED Viewed

@@ -1,26 +1,36 @@
 import os
 import gradio as gr
 from http import HTTPStatus
 import dashscope
 from dashscope import Generation
 from dashscope.api_entities.dashscope_response import Role
-from typing import List, Optional, Tuple, Dict
 default_system = 'You are Qwen, created by Alibaba Cloud. You are a helpful assistant.'
-dashscope.api_key = os.getenv('YOUR_API_TOKEN')  # Ensure this token is managed securely
 History = List[Tuple[str, str]]
 Messages = List[Dict[str, str]]
 def clear_session() -> History:
     return '', []
 def modify_system_session(system: str) -> str:
-    if system is None or len(system) == 0:
         system = default_system
     return system, system, []
 def history_to_messages(history: History, system: str) -> Messages:
     messages = [{'role': Role.SYSTEM, 'content': system}]
     for h in history:
@@ -28,20 +38,22 @@ def history_to_messages(history: History, system: str) -> Messages:
         messages.append({'role': Role.ASSISTANT, 'content': h[1]})
     return messages
 def messages_to_history(messages: Messages) -> Tuple[str, History]:
     assert messages[0]['role'] == Role.SYSTEM
     system = messages[0]['content']
     history = []
     for q, r in zip(messages[1::2], messages[2::2]):
-        history.append([q['content'], r['content']])
     return system, history
-def model_chat(query: Optional[str], history: Optional[History], system: str
-) -> Tuple[str, str, History]:
     if query is None:
         query = ''
     if history is None:
         history = []
     messages = history_to_messages(history, system)
     messages.append({'role': Role.USER, 'content': query})
@@ -51,14 +63,18 @@ def model_chat(query: Optional[str], history: Optional[History], system: str
         messages=messages,
         result_format='message',
         stream=True,
-        max_new_tokens=150  # Set response length limit
     )
     for response in gen:
         if response.status_code == HTTPStatus.OK:
             role = response.output.choices[0].message.role
-            response = response.output.choices[0].message.content
-            system, history = messages_to_history(messages + [{'role': role, 'content': response}])
             yield '', history, system
         else:
             raise ValueError('Request id: %s, Status code: %s, error code: %s, error message: %s' % (
@@ -68,7 +84,7 @@ def model_chat(query: Optional[str], history: Optional[History], system: str
 # Gradio Interface Setup
 with gr.Blocks() as demo:
-    gr.Markdown("""<center><font size=8>Qwen2.5-72B-Instruct👾</center>""")
     with gr.Row():
         with gr.Column(scale=3):
@@ -76,6 +92,7 @@ with gr.Blocks() as demo:
         with gr.Column(scale=1):
             modify_system = gr.Button("🛠️ Set system prompt and clear history", scale=2)
         system_state = gr.Textbox(value=default_system, visible=False)
     chatbot = gr.Chatbot(label='Qwen2.5-72B-Instruct')
     textbox = gr.Textbox(lines=1, label='Input')
@@ -83,26 +100,27 @@ with gr.Blocks() as demo:
         clear_history = gr.Button("🧹 Clear history")
         submit = gr.Button("🚀 Send")
     textbox.submit(model_chat,
                    inputs=[textbox, chatbot, system_state],
                    outputs=[textbox, chatbot, system_input],
-                   concurrency_limit=5)  # Reduced for free plan
     submit.click(model_chat,
                  inputs=[textbox, chatbot, system_state],
                  outputs=[textbox, chatbot, system_input],
                  concurrency_limit=5)
     clear_history.click(fn=clear_session,
                         inputs=[],
                         outputs=[textbox, chatbot],
                         concurrency_limit=5)
     modify_system.click(fn=modify_system_session,
                         inputs=[system_input],
                         outputs=[system_state, system_input, chatbot],
                         concurrency_limit=5)
-# Launching with reduced threads for free plan
 demo.queue(api_open=False)
 demo.launch(max_threads=10)

 import os
 import gradio as gr
 from http import HTTPStatus
+from typing import List, Optional, Tuple, Dict
 import dashscope
 from dashscope import Generation
 from dashscope.api_entities.dashscope_response import Role
+# Configuration
 default_system = 'You are Qwen, created by Alibaba Cloud. You are a helpful assistant.'
+dashscope.api_key = os.getenv('HF_TOKEN')  # API key is read from the HF_TOKEN environment variable.
+# Typing definitions
 History = List[Tuple[str, str]]
 Messages = List[Dict[str, str]]
+# Function to log chat history to logs.txt
+def log_history_to_file(query: str, response: str, file_path="logs.txt"):
+    with open(file_path, "a") as f:
+        f.write(f"User: {query}\n")
+        f.write(f"Assistant: {response}\n\n")
+# Function to clear session history
 def clear_session() -> History:
     return '', []
+# Function to modify system session prompt
 def modify_system_session(system: str) -> str:
+    if not system:
         system = default_system
     return system, system, []
+# Convert history to messages format
 def history_to_messages(history: History, system: str) -> Messages:
     messages = [{'role': Role.SYSTEM, 'content': system}]
     for h in history:
         messages.append({'role': Role.ASSISTANT, 'content': h[1]})
     return messages
+# Convert messages back to history format
 def messages_to_history(messages: Messages) -> Tuple[str, History]:
     assert messages[0]['role'] == Role.SYSTEM
     system = messages[0]['content']
     history = []
     for q, r in zip(messages[1::2], messages[2::2]):
+        history.append((q['content'], r['content']))
     return system, history
+# Main function for chat
+def model_chat(query: Optional[str], history: Optional[History], system: str) -> Tuple[str, str, History]:
     if query is None:
         query = ''
     if history is None:
         history = []
     messages = history_to_messages(history, system)
     messages.append({'role': Role.USER, 'content': query})
         messages=messages,
         result_format='message',
         stream=True,
+        max_new_tokens=150  # Limit response length to save resources
     )
     for response in gen:
         if response.status_code == HTTPStatus.OK:
             role = response.output.choices[0].message.role
+            response_text = response.output.choices[0].message.content
+            # Log chat to file
+            log_history_to_file(query, response_text)
+            system, history = messages_to_history(messages + [{'role': role, 'content': response_text}])
             yield '', history, system
         else:
             raise ValueError('Request id: %s, Status code: %s, error code: %s, error message: %s' % (
 # Gradio Interface Setup
 with gr.Blocks() as demo:
+    gr.Markdown("<center><font size=8>Qwen2.5-72B-Instruct👾</center>")
     with gr.Row():
         with gr.Column(scale=3):
         with gr.Column(scale=1):
             modify_system = gr.Button("🛠️ Set system prompt and clear history", scale=2)
         system_state = gr.Textbox(value=default_system, visible=False)
     chatbot = gr.Chatbot(label='Qwen2.5-72B-Instruct')
     textbox = gr.Textbox(lines=1, label='Input')
         clear_history = gr.Button("🧹 Clear history")
         submit = gr.Button("🚀 Send")
+    # Link buttons to functions
     textbox.submit(model_chat,
                    inputs=[textbox, chatbot, system_state],
                    outputs=[textbox, chatbot, system_input],
+                   concurrency_limit=5)
     submit.click(model_chat,
                  inputs=[textbox, chatbot, system_state],
                  outputs=[textbox, chatbot, system_input],
                  concurrency_limit=5)
     clear_history.click(fn=clear_session,
                         inputs=[],
                         outputs=[textbox, chatbot],
                         concurrency_limit=5)
     modify_system.click(fn=modify_system_session,
                         inputs=[system_input],
                         outputs=[system_state, system_input, chatbot],
                         concurrency_limit=5)
+# Launching Gradio Interface with reduced threads for free plan
 demo.queue(api_open=False)
 demo.launch(max_threads=10)