Spaces:

KwabsHug
/

FrontEndasPromptEngineeringTest

Sleeping

kwabs22 committed on Jun 24

Commit

a30ec9b

•

1 Parent(s): b781202

deepseek coder lite reminder

Files changed (1) hide show

app.py CHANGED Viewed

@@ -298,12 +298,12 @@ AllWorkflows = {
 with gr.Blocks() as iface:
     with gr.Tab("Single prompt"):
-        gr.HTML("<a href='https://huggingface.co/spaces/stabilityai/stablelm-2-1_6b-zephyr'> -- Original StabilityAI demo -- </a> | To be tested later (can q4 work on small size?) - <a href='https://huggingface.co/spaces/Qwen/Qwen2-0.5B-Instruct'> -- Qwen2 0.5B Instruct -- </a> |  ")
         gr.Interface(
             fn=generate_response,
             inputs=gr.Textbox(lines=2, placeholder="Type your message here..."),
             outputs="text",
-            title="Stable LM 2 Zephyr (1.6b) LLama.cpp Interface Test (Inconsistent Performance - 100 tokens in 50 secs (when this HF space is updated) or 800+ secs(HF space open for long))",
             description="No Prompt template used yet (Essentially autocomplete). No Message History for now - Enter your message and get a response.",
             flagging_dir="/usr/src/app/flagged",
         )

 with gr.Blocks() as iface:
     with gr.Tab("Single prompt"):
+        gr.HTML("<a href='https://huggingface.co/spaces/stabilityai/stablelm-2-1_6b-zephyr'> -- Original StabilityAI demo -- </a> | To be tested later - <a href='https://huggingface.co/spaces/Qwen/Qwen2-0.5B-Instruct'> -- Qwen2 0.5B Instruct -- </a> | DeepSeek-Coder-V2-Lite-Instruct-Q3_K_M.gguf  += 8gb so test for how big the context can be and how speed is affected  ")
         gr.Interface(
             fn=generate_response,
             inputs=gr.Textbox(lines=2, placeholder="Type your message here..."),
             outputs="text",
+            title="Stable LM 2 Zephyr (1.6b) LLama.cpp Interface Test (Inconsistent Performance - 100 tokens in 50 secs (when this HF space is updated can even go 6tokens a second for non formatted text) or 800+ secs(HF space open for long))",
             description="No Prompt template used yet (Essentially autocomplete). No Message History for now - Enter your message and get a response.",
             flagging_dir="/usr/src/app/flagged",
         )