kwabs22
committed on
Commit
•
a30ec9b
1
Parent(s):
b781202
deepseek coder lite reminder
Browse files
app.py
CHANGED
@@ -298,12 +298,12 @@ AllWorkflows = {
|
|
298 |
|
299 |
with gr.Blocks() as iface:
|
300 |
with gr.Tab("Single prompt"):
|
301 |
-
gr.HTML("<a href='https://huggingface.co/spaces/stabilityai/stablelm-2-1_6b-zephyr'> -- Original StabilityAI demo -- </a> | To be tested later
|
302 |
gr.Interface(
|
303 |
fn=generate_response,
|
304 |
inputs=gr.Textbox(lines=2, placeholder="Type your message here..."),
|
305 |
outputs="text",
|
306 |
-
title="Stable LM 2 Zephyr (1.6b) LLama.cpp Interface Test (Inconsistent Performance - 100 tokens in 50 secs (when this HF space is updated) or 800+ secs(HF space open for long))",
|
307 |
description="No Prompt template used yet (Essentially autocomplete). No Message History for now - Enter your message and get a response.",
|
308 |
flagging_dir="/usr/src/app/flagged",
|
309 |
)
|
|
|
298 |
|
299 |
with gr.Blocks() as iface:
|
300 |
with gr.Tab("Single prompt"):
|
301 |
+
gr.HTML("<a href='https://huggingface.co/spaces/stabilityai/stablelm-2-1_6b-zephyr'> -- Original StabilityAI demo -- </a> | To be tested later - <a href='https://huggingface.co/spaces/Qwen/Qwen2-0.5B-Instruct'> -- Qwen2 0.5B Instruct -- </a> | DeepSeek-Coder-V2-Lite-Instruct-Q3_K_M.gguf += 8gb so test for how big the context can be and how speed is affected ")
|
302 |
gr.Interface(
|
303 |
fn=generate_response,
|
304 |
inputs=gr.Textbox(lines=2, placeholder="Type your message here..."),
|
305 |
outputs="text",
|
306 |
+
title="Stable LM 2 Zephyr (1.6b) LLama.cpp Interface Test (Inconsistent Performance - 100 tokens in 50 secs (when this HF space is updated can even go 6tokens a second for non formatted text) or 800+ secs(HF space open for long))",
|
307 |
description="No Prompt template used yet (Essentially autocomplete). No Message History for now - Enter your message and get a response.",
|
308 |
flagging_dir="/usr/src/app/flagged",
|
309 |
)
|