YangWu001 committed on
Commit
d5b26cf
·
1 Parent(s): c9aa76d
Files changed (2) hide show
  1. app.py +45 -20
  2. app_update_title.py +104 -0
app.py CHANGED
@@ -1,9 +1,15 @@
1
  import gradio as gr
2
  from huggingface_hub import InferenceClient
 
 
3
 
4
  # Inference client setup
5
  client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
6
 
 
 
 
 
7
  def respond(
8
  message,
9
  history: list[tuple[str, str]],
@@ -11,28 +17,45 @@ def respond(
11
  max_tokens,
12
  temperature,
13
  top_p,
 
14
  ):
15
- messages = [{"role": "system", "content": system_message}]
16
-
17
- for val in history:
18
- if val[0]:
19
- messages.append({"role": "user", "content": val[0]})
20
- if val[1]:
21
- messages.append({"role": "assistant", "content": val[1]})
22
-
23
- messages.append({"role": "user", "content": message})
24
-
25
- response = ""
26
- for message in client.chat_completion(
27
- messages,
28
- max_tokens=max_tokens,
29
- stream=True,
30
- temperature=temperature,
31
- top_p=top_p,
32
- ):
33
- token = message.choices[0].delta.content
34
- response += token
35
  yield response
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
36
 
37
  # Custom CSS for a fancy look
38
  custom_css = """
@@ -94,6 +117,8 @@ demo = gr.ChatInterface(
94
  step=0.05,
95
  label="Top-p (nucleus sampling)",
96
  ),
 
 
97
  ],
98
  css=custom_css,
99
  title="🌟 Fancy AI Chatbot 🌟",
 
1
  import gradio as gr
2
  from huggingface_hub import InferenceClient
3
+ import time
4
+ import threading
5
 
6
  # Inference client setup
7
  client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
8
 
9
+ # Global flags: one selects local vs. API inference, the other signals cancellation
10
+ use_local = False
11
+ stop_inference = False
12
+
13
  def respond(
14
  message,
15
  history: list[tuple[str, str]],
 
17
  max_tokens,
18
  temperature,
19
  top_p,
20
+ use_local_model,
21
  ):
22
+ global use_local, stop_inference
23
+ use_local = use_local_model
24
+ stop_inference = False # Reset cancellation flag
25
+
26
+ if use_local:
27
+ # Simulate local inference
28
+ time.sleep(2) # simulate a delay
29
+ response = "This is a response from the local model."
 
 
 
 
 
 
 
 
 
 
 
 
30
  yield response
31
+ else:
32
+ # API-based inference
33
+ messages = [{"role": "system", "content": system_message}]
34
+ for val in history:
35
+ if val[0]:
36
+ messages.append({"role": "user", "content": val[0]})
37
+ if val[1]:
38
+ messages.append({"role": "assistant", "content": val[1]})
39
+ messages.append({"role": "user", "content": message})
40
+
41
+ response = ""
42
+ for message in client.chat_completion(
43
+ messages,
44
+ max_tokens=max_tokens,
45
+ stream=True,
46
+ temperature=temperature,
47
+ top_p=top_p,
48
+ ):
49
+ if stop_inference:
50
+ yield "Inference cancelled."
51
+ break
52
+ token = message.choices[0].delta.content
53
+ response += token
54
+ yield response
55
+
56
def cancel_inference():
    """Ask the in-flight streaming response to stop.

    Raises the module-level ``stop_inference`` flag; nothing is returned.
    """
    global stop_inference
    stop_inference = True
59
 
60
  # Custom CSS for a fancy look
61
  custom_css = """
 
117
  step=0.05,
118
  label="Top-p (nucleus sampling)",
119
  ),
120
+ gr.Checkbox(label="Use Local Model", value=False),
121
+ gr.Button("Cancel Inference", variant="danger", on_click=cancel_inference),
122
  ],
123
  css=custom_css,
124
  title="🌟 Fancy AI Chatbot 🌟",
app_update_title.py ADDED
@@ -0,0 +1,104 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ from huggingface_hub import InferenceClient
3
+
4
+ # Inference client setup
5
+ client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
6
+
7
def respond(
    message,
    history: list[tuple[str, str]],
    system_message,
    max_tokens,
    temperature,
    top_p,
):
    """Stream the assistant's reply to ``message``.

    Builds a role/content message list (system prompt, the prior turns from
    ``history``, then the new user message), sends it to the module-level
    ``client`` with streaming enabled, and yields the reply accumulated so
    far each time a chunk adds text.

    Args:
        message: The new user message.
        history: Prior ``(user, assistant)`` turns; empty entries in a pair
            are skipped.
        system_message: Content of the leading system message.
        max_tokens: Forwarded to ``client.chat_completion``.
        temperature: Forwarded to ``client.chat_completion``.
        top_p: Forwarded to ``client.chat_completion``.

    Yields:
        The reply text accumulated so far (a growing string).
    """
    messages = [{"role": "system", "content": system_message}]

    for turn in history:
        if turn[0]:
            messages.append({"role": "user", "content": turn[0]})
        if turn[1]:
            messages.append({"role": "assistant", "content": turn[1]})

    messages.append({"role": "user", "content": message})

    response = ""
    # The loop variable is deliberately not called `message`, so the
    # parameter of that name is not rebound while streaming.
    for chunk in client.chat_completion(
        messages,
        max_tokens=max_tokens,
        stream=True,
        temperature=temperature,
        top_p=top_p,
    ):
        token = chunk.choices[0].delta.content
        if token is None:
            # A streamed chunk may carry no text; concatenating None would
            # raise TypeError, so skip it.
            continue
        response += token
        yield response
36
+
37
+ # Custom CSS for a fancy look
38
+ custom_css = """
39
+ #main-container {
40
+ background-color: #f0f0f0;
41
+ font-family: 'Arial', sans-serif;
42
+ }
43
+
44
+ .gradio-container {
45
+ max-width: 700px;
46
+ margin: 0 auto;
47
+ padding: 20px;
48
+ background: white;
49
+ box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1);
50
+ border-radius: 10px;
51
+ }
52
+
53
+ .gr-button {
54
+ background-color: #4CAF50;
55
+ color: white;
56
+ border: none;
57
+ border-radius: 5px;
58
+ padding: 10px 20px;
59
+ cursor: pointer;
60
+ transition: background-color 0.3s ease;
61
+ }
62
+
63
+ .gr-button:hover {
64
+ background-color: #45a049;
65
+ }
66
+
67
+ .gr-slider input {
68
+ color: #4CAF50;
69
+ }
70
+
71
+ .gr-chat {
72
+ font-size: 16px;
73
+ }
74
+
75
+ #title {
76
+ text-align: center;
77
+ font-size: 2em;
78
+ margin-bottom: 20px;
79
+ color: #333;
80
+ }
81
+ """
82
+
83
# Assemble the chat UI. The additional inputs are listed in the same order as
# the trailing parameters of `respond`: system message, max tokens,
# temperature, top-p.
demo = gr.ChatInterface(
    respond,
    additional_inputs=[
        gr.Textbox(
            value="You are a friendly Chatbot.",
            label="System message",
            interactive=True,
        ),
        gr.Slider(
            minimum=1,
            maximum=2048,
            value=512,
            step=1,
            label="Max new tokens",
        ),
        gr.Slider(
            minimum=0.1,
            maximum=4.0,
            value=0.7,
            step=0.1,
            label="Temperature",
        ),
        gr.Slider(
            minimum=0.1,
            maximum=1.0,
            value=0.95,
            step=0.05,
            label="Top-p (nucleus sampling)",
        ),
    ],
    css=custom_css,
    title="🌟 Fancy AI Chatbot 🌟",
    description="Interact with the AI chatbot using customizable settings below.",
)

# Launch the app only when this file is run as a script.
if __name__ == "__main__":
    demo.launch()