Bacchus-Chat

Sleeping

App Files Community

gmonsoon committed on Feb 3

Commit

76ca409

•

1 Parent(s): cbf15f8

Upload 4 files

Browse files

Files changed (4) hide show

Dockerfile +24 -0
README.md +5 -8
app.py +54 -0
requirements.txt +2 -0

Dockerfile ADDED Viewed

	@@ -0,0 +1,24 @@

+# Use an alias for the base image for easier updates
+FROM python:3.10 as base
+# Set model
+# MODEL is the Hugging Face repository id, QUANT is the quantization tag that
+# appears in the GGUF file name, and CHAT_TEMPLATE is the chat format name.
+# app.py reads all three from the environment at start-up.
+ENV MODEL=indischepartij/MiaLatte-Indo-Mistral-7b-GGUF
+ENV QUANT=Q5_K_M
+ENV CHAT_TEMPLATE=chatml
+# Set the working directory
+WORKDIR /app
+# Install Python requirements
+COPY ./requirements.txt /app/
+RUN pip install --no-cache-dir --upgrade -r requirements.txt
+# Download model
+# The file name is derived from MODEL: drop everything up to the first "/",
+# lowercase the rest, and strip a trailing "-gguf". The file fetched is then
+# <name>.<QUANT>.gguf, saved as model.gguf in the working directory, which is
+# the relative path app.py loads.
+RUN MODEL_NAME_FILE=$(echo ${MODEL#*/} | tr '[:upper:]' '[:lower:]' | sed 's/-gguf$//') && \
+    wget https://huggingface.co/${MODEL}/resolve/main/${MODEL_NAME_FILE}.${QUANT}.gguf -O model.gguf
+# Copy the rest of your application
+COPY . .
+# Command to run the application
+CMD ["python", "app.py"]

README.md CHANGED Viewed

@@ -1,13 +1,10 @@
 ---
-title: MiaLatte Chat
-emoji: 🏃
-colorFrom: purple
-colorTo: gray
-sdk: gradio
-sdk_version: 4.16.0
-app_file: app.py
 pinned: false
-license: cc-by-nc-4.0
 ---
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

 ---
+title: test
+emoji: 😻
+colorFrom: red
+colorTo: green
+sdk: docker
 pinned: false
 ---
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

app.py ADDED Viewed

	@@ -0,0 +1,54 @@

+import os
+import json
+import gradio as gr
+from llama_cpp import Llama
+# Get environment variables
+# MODEL, QUANT and CHAT_TEMPLATE are set with ENV in the Dockerfile.
+# os.getenv returns None for a variable that is not set, in which case the
+# split on model_id below raises AttributeError.
+model_id = os.getenv('MODEL')
+quant = os.getenv('QUANT')
+chat_template = os.getenv('CHAT_TEMPLATE')
+# Interface variables
+# model_name is the part of model_id after the first "/", cut at "-GGUF".
+model_name = model_id.split('/')[1].split('-GGUF')[0]
+title = f"😻 {model_name}"
+description = f"Chat with <a href=\"https://huggingface.co/{model_id}\">{model_name}</a> in GGUF format ({quant})!"
+# Initialize the LLM
+# model.gguf is a relative path; the Dockerfile downloads the model to that
+# name in the working directory. This runs at import time, before the UI
+# is created.
+llm = Llama(model_path="model.gguf",
+            n_ctx=32768,
+            n_threads=2,
+            chat_format=chat_template)
+# Function for streaming chat completions
+# Builds the message list in this order: the system prompt, each past
+# (user, assistant) turn from history, then the new user message. It requests
+# a streamed chat completion from llm and yields the reply accumulated so far
+# after every chunk.
+def chat_stream_completion(message, history, system_prompt):
+    messages_prompts = [{"role": "system", "content": system_prompt}]
+    # history is iterated as (user text, assistant text) pairs.
+    for human, assistant in history:
+        messages_prompts.append({"role": "user", "content": human})
+        messages_prompts.append({"role": "assistant", "content": assistant})
+    messages_prompts.append({"role": "user", "content": message})
+    response = llm.create_chat_completion(
+        messages=messages_prompts,
+        stream=True
+    )
+    message_repl = ""
+    for chunk in response:
+        # Only chunks whose delta carries a "content" key add text to the reply.
+        if len(chunk['choices'][0]["delta"]) != 0 and "content" in chunk['choices'][0]["delta"]:
+            message_repl = message_repl + chunk['choices'][0]["delta"]["content"]
+        # Yield the whole reply so far, not just the newest piece. This runs
+        # for every chunk, including chunks that added no text.
+        yield message_repl
+# Gradio chat interface
+# chat_stream_completion is the handler. The single Textbox in
+# additional_inputs lines up with its system_prompt parameter, and the string
+# passed to the Textbox is the default system prompt shown to the user.
+# Each example is a one-element list holding only the message text.
+# launch(server_name="0.0.0.0") listens on all network interfaces rather than
+# only on localhost.
+gr.ChatInterface(
+    fn=chat_stream_completion,
+    title=title,
+    description=description,
+    additional_inputs=[gr.Textbox("Kamu adalah Mia, asisten AI yang pintar dan ceria.")],
+    additional_inputs_accordion="📝 System prompt",
+    examples=[
+        ["sebutkan sumber daya alam yang termasuk energi fosil?"],
+        ["Apa jenis skincare yang cocok untuk kulit sensitif?"],
+        ["berapa hasil penghitungan dari 4^2+5"],
+        ["jelaskan mengenai deret fibonacci"],
+        ["Tolong berikan saya tutorial cara memasak Nasi Goreng"]
+    ]
+).queue().launch(server_name="0.0.0.0")

requirements.txt ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ llama-cpp-python
2	+ gradio