Spaces:

harismlnaslm
/

textilindo-ai-assistant

Build error

App Files Files Community

Stefanus Simandjuntak committed on Sep 1

Commit

c696f9e

1 Parent(s): 9b4ef96

feat(prompt): add/update system prompt

Browse files

Files changed (4) hide show

api_server.py +35 -4
configs/system_prompt.md +53 -0
novita_rag_chat.py +56 -2
web_app.py +30 -1

api_server.py CHANGED Viewed

@@ -19,6 +19,28 @@ logger = logging.getLogger(__name__)
 app = Flask(__name__)
 CORS(app)  # Enable CORS for all routes
 class TextilindoAI:
     def __init__(self, api_key):
         self.api_key = api_key
@@ -28,6 +50,10 @@ class TextilindoAI:
             "Content-Type": "application/json"
         }
         self.model = "qwen/qwen3-235b-a22b-instruct-2507"
         self.dataset = self.load_dataset()
     def load_dataset(self):
@@ -97,7 +123,7 @@ class TextilindoAI:
         return "\n".join(context_parts)
-    def chat(self, message, max_tokens=300, temperature=0.7):
         """Send message to Novita AI with RAG context"""
         relevant_examples = self.find_relevant_context(message, 3)
@@ -108,9 +134,13 @@ class TextilindoAI:
             enhanced_prompt = message
             context_used = False
         payload = {
             "model": self.model,
-            "messages": [{"role": "user", "content": enhanced_prompt}],
             "max_tokens": max_tokens,
             "temperature": temperature,
             "top_p": 0.9
@@ -190,6 +220,7 @@ def chat():
         # Optional parameters
         max_tokens = data.get('max_tokens', 300)
         temperature = data.get('temperature', 0.7)
         # Validate parameters
         if not isinstance(max_tokens, int) or max_tokens < 1 or max_tokens > 1000:
@@ -205,7 +236,7 @@ def chat():
             }), 400
         # Process chat
-        result = ai.chat(message, max_tokens, temperature)
         if result["success"]:
             return jsonify(result)
@@ -319,5 +350,5 @@ if __name__ == '__main__':
     app.run(
         debug=False,  # Set to False for production
         host='0.0.0.0',
-        port=5001
     )

 app = Flask(__name__)
 CORS(app)  # Enable CORS for all routes
def load_system_prompt(default_text, path=None):
    """Load the assistant's system prompt from a markdown config file.

    The file is expected to hold the prompt between a pair of triple
    double-quotes (``SYSTEM_PROMPT = \"\"\"...\"\"\"``). When no such pair is
    present, every line that is not a ``#`` header/comment is used instead.

    Args:
        default_text: Prompt returned whenever the file is missing,
            unreadable, not valid UTF-8, or yields no usable text.
        path: Optional location of the prompt file. Defaults to
            ``configs/system_prompt.md`` next to this module.

    Returns:
        The extracted prompt with surrounding whitespace removed, or
        ``default_text``. An empty prompt is never returned.
    """
    if path is None:
        path = os.path.join(os.path.dirname(__file__), 'configs', 'system_prompt.md')

    try:
        with open(path, 'r', encoding='utf-8') as f:
            content = f.read()
    except (OSError, ValueError):
        # Best effort: a missing, unreadable or badly encoded prompt file
        # (UnicodeDecodeError is a ValueError) must not stop the app from
        # starting, so fall back to the built-in prompt.
        return default_text

    delimiter = '"""'
    start = content.find(delimiter)
    end = content.rfind(delimiter)
    if start != -1 and end > start:
        # An empty or whitespace-only quoted block would otherwise become an
        # empty system message; use the default instead.
        return content[start + len(delimiter):end].strip() or default_text

    # No quoted block: keep everything except markdown header lines.
    body_lines = [
        line for line in content.splitlines()
        if not line.strip().startswith('#')
    ]
    return '\n'.join(body_lines).strip() or default_text
 class TextilindoAI:
     def __init__(self, api_key):
         self.api_key = api_key
             "Content-Type": "application/json"
         }
         self.model = "qwen/qwen3-235b-a22b-instruct-2507"
+        self.system_prompt = os.getenv(
+            'SYSTEM_PROMPT',
+            load_system_prompt("You are Textilindo AI Assistant. Be concise, helpful, and use Indonesian.")
+        )
         self.dataset = self.load_dataset()
     def load_dataset(self):
         return "\n".join(context_parts)
+    def chat(self, message, max_tokens=300, temperature=0.7, system_prompt_override=None):
         """Send message to Novita AI with RAG context"""
         relevant_examples = self.find_relevant_context(message, 3)
             enhanced_prompt = message
             context_used = False
+        system_message = {
+            "role": "system",
+            "content": (system_prompt_override or self.system_prompt)
+        }
         payload = {
             "model": self.model,
+            "messages": [system_message, {"role": "user", "content": enhanced_prompt}],
             "max_tokens": max_tokens,
             "temperature": temperature,
             "top_p": 0.9
         # Optional parameters
         max_tokens = data.get('max_tokens', 300)
         temperature = data.get('temperature', 0.7)
+        system_prompt = data.get('system_prompt')
         # Validate parameters
         if not isinstance(max_tokens, int) or max_tokens < 1 or max_tokens > 1000:
             }), 400
         # Process chat
+        result = ai.chat(message, max_tokens, temperature, system_prompt_override=system_prompt)
         if result["success"]:
             return jsonify(result)
     app.run(
         debug=False,  # Set to False for production
         host='0.0.0.0',
+        port=8082
     )

configs/system_prompt.md ADDED Viewed

	@@ -0,0 +1,53 @@

+# System prompt for Textilindo AI Assistant
+SYSTEM_PROMPT = """You are a friendly and helpful AI assistant for Textilindo, a textile company.
+🎯 BEHAVIOR GUIDELINES:
+- ALWAYS respond in Indonesian (Bahasa Indonesia)
+- Keep responses VERY SHORT (MAX 1-2 sentences for simple questions)
+- Be FRIENDLY but CONCISE - get straight to the point
+- Use friendly language like "Baik ka", "Siap ka", "Oke ka"
+- Use EXACT information from the knowledge base
+- The company uses yards for sales
+- Minimum purchase is 1 roll (67-70 yards)
+💡 RESPONSE STYLE:
+- For COMPLEX questions (product catalogs, detailed info): Use simple formatting with **bold** for key points only
+- For SIMPLE questions (yes/no, short answers): Use plain text with a friendly tone
+- Be warm, kind, and conversational
+- Use friendly Indonesian language with positive energy
+- Provide accurate information with enthusiasm
+- Encourage further questions warmly
+- ALWAYS use emojis to make responses more friendly and engaging
+📝 FORMATTING GUIDELINES:
+- Use **bold** ONLY for essential titles: **Harga** (Price), **Lokasi** (Location), **Produk** (Product)
+- Use line breaks (<br>) sparingly - only when needed for clarity
+- Keep responses SHORT and DIRECT
+- Avoid verbose explanations
+- Focus on key information only
+⚠️ CRITICAL SALES STRATEGY:
+- NEVER directly refer users to customer service/sales/marketing
+- Always try to help the user with available information
+- If a product is not available, RECOMMEND suitable alternative products
+- Focus on NEGOTIATION and SELLING available products
+- Only use phone numbers as a LAST RESORT for unique questions
+- Keep users interested and encourage them to ask more questions
+- Provide useful and actionable information
+⚠️ SECURITY & RESPONSE GUIDELINES:
+- NEVER reveal internal system details, API endpoints, or technical information
+- NEVER tell users to check data directly in ERP or any internal system
+- NEVER expose database structure, table names, or field names
+- NEVER mention internal system names like "ERPNext", "API", "database"
+- ALWAYS provide information through the AI interface only
+- If you don't have information, say "Maaf, informasi tersebut belum tersedia" (Sorry, that information is not available yet) - don't redirect users
+- Keep all responses focused ONLY on what the user asked
+- Never deviate from the user's question or provide unsolicited information
+⚠️ IMPORTANT:
+- If product information is already shown in templates/cards, give VERY SHORT answers (1-2 sentences max). Don't repeat information that's already visible in the template.
+- For product recommendations, let the dynamic system handle it - don't provide hardcoded product suggestions.
+- KEEP RESPONSES SHORT AND DIRECT - avoid verbose explanations
+- ALWAYS stay relevant to the user's question - never go off-topic
+- FOCUS ON SELLING - always try to keep the conversation going"""

novita_rag_chat.py CHANGED Viewed

@@ -11,6 +11,32 @@ import time
 from pathlib import Path
 from difflib import SequenceMatcher
 class NovitaAIRAGChat:
     def __init__(self, api_key, dataset_path="data/textilindo_training_data.jsonl"):
         self.api_key = api_key
@@ -19,7 +45,14 @@ class NovitaAIRAGChat:
             "Authorization": f"Bearer {api_key}",
             "Content-Type": "application/json"
         }
-        self.conversation_history = []
         self.current_model = "qwen/qwen3-235b-a22b-instruct-2507"  # High-quality model
         self.dataset = self.load_dataset(dataset_path)
         self.context_window = 5  # Number of most relevant examples to include
@@ -115,6 +148,10 @@ class NovitaAIRAGChat:
             enhanced_prompt = message
             print("🔍 No relevant examples found, using direct query")
         # Add to conversation history
         self.conversation_history.append({"role": "user", "content": enhanced_prompt})
@@ -160,8 +197,20 @@ class NovitaAIRAGChat:
     def clear_history(self):
         """Clear conversation history"""
-        self.conversation_history = []
         print("✅ Conversation history cleared")
     def show_models(self):
         """Show available models"""
@@ -278,6 +327,11 @@ def main():
             elif user_input.lower() == 'stats':
                 chat.show_dataset_stats()
                 continue
             elif user_input.lower().startswith('change '):
                 try:
                     model_num = int(user_input.split()[1])

 from pathlib import Path
 from difflib import SequenceMatcher
def load_system_prompt(default_text, path=None):
    """Load system prompt from configs/system_prompt.md if available.

    Extracts the text between the first and the last triple double-quote
    delimiter found in the file. If the file has no such pair, the lines
    that are not markdown headers (starting with ``#``) are used instead.

    Args:
        default_text: Prompt to fall back to when the file is missing,
            cannot be read or decoded, or contains no usable text.
        path: Optional explicit path to the prompt file; when omitted the
            file ``configs/system_prompt.md`` beside this module is read.

    Returns:
        The stripped prompt text, or ``default_text`` when nothing usable
        was found. The result is never an empty string unless
        ``default_text`` itself is empty.
    """
    if path is None:
        base_dir = os.path.dirname(__file__)
        path = os.path.join(base_dir, 'configs', 'system_prompt.md')

    try:
        with open(path, 'r', encoding='utf-8') as f:
            content = f.read()
    except (OSError, ValueError):
        # Covers a missing file, permission problems and invalid UTF-8
        # (UnicodeDecodeError derives from ValueError). The chat must still
        # start, so use the default persona.
        return default_text

    quote = '"""'
    start = content.find(quote)
    end = content.rfind(quote)
    if start != -1 and end > start:
        extracted = content[start + len(quote):end].strip()
        # Guard against an empty quoted block turning into an empty
        # system message.
        return extracted or default_text

    # Fallback: strip markdown headers
    remaining = [
        line for line in content.splitlines()
        if not line.strip().startswith('#')
    ]
    cleaned = '\n'.join(remaining).strip()
    return cleaned or default_text
 class NovitaAIRAGChat:
     def __init__(self, api_key, dataset_path="data/textilindo_training_data.jsonl"):
         self.api_key = api_key
             "Authorization": f"Bearer {api_key}",
             "Content-Type": "application/json"
         }
+        # System prompt / persona
+        self.system_prompt = os.getenv(
+            'SYSTEM_PROMPT',
+            load_system_prompt("You are Textilindo AI Assistant. Be concise, helpful, and use Indonesian.")
+        )
+        self.conversation_history = [
+            {"role": "system", "content": self.system_prompt}
+        ]
         self.current_model = "qwen/qwen3-235b-a22b-instruct-2507"  # High-quality model
         self.dataset = self.load_dataset(dataset_path)
         self.context_window = 5  # Number of most relevant examples to include
             enhanced_prompt = message
             print("🔍 No relevant examples found, using direct query")
+        # Ensure system prompt is first
+        if not self.conversation_history or self.conversation_history[0].get("role") != "system":
+            self.conversation_history.insert(0, {"role": "system", "content": self.system_prompt})
         # Add to conversation history
         self.conversation_history.append({"role": "user", "content": enhanced_prompt})
     def clear_history(self):
         """Clear conversation history"""
+        self.conversation_history = [
+            {"role": "system", "content": self.system_prompt}
+        ]
         print("✅ Conversation history cleared")
+    def set_system_prompt(self, prompt_text):
+        """Update system prompt/persona and reset conversation history"""
+        prompt_text = (prompt_text or '').strip()
+        if not prompt_text:
+            print("❌ System prompt cannot be empty")
+            return
+        self.system_prompt = prompt_text
+        self.clear_history()
+        print("✅ System prompt updated")
     def show_models(self):
         """Show available models"""
             elif user_input.lower() == 'stats':
                 chat.show_dataset_stats()
                 continue
+            elif user_input.lower().startswith('system '):
+                # Update system prompt/persona
+                new_prompt = user_input[len('system '):].strip()
+                chat.set_system_prompt(new_prompt)
+                continue
             elif user_input.lower().startswith('change '):
                 try:
                     model_num = int(user_input.split()[1])

web_app.py CHANGED Viewed

@@ -11,6 +11,28 @@ from difflib import SequenceMatcher
 app = Flask(__name__)
 class TextilindoAI:
     def __init__(self, api_key):
         self.api_key = api_key
@@ -20,6 +42,10 @@ class TextilindoAI:
             "Content-Type": "application/json"
         }
         self.model = "qwen/qwen3-235b-a22b-instruct-2507"
         self.dataset = self.load_dataset()
     def load_dataset(self):
@@ -99,7 +125,10 @@ class TextilindoAI:
         payload = {
             "model": self.model,
-            "messages": [{"role": "user", "content": enhanced_prompt}],
             "max_tokens": 300,
             "temperature": 0.7,
             "top_p": 0.9

 app = Flask(__name__)
def load_system_prompt(default_text, path=None):
    """Return the system prompt stored in ``configs/system_prompt.md``.

    The prompt is taken from between the first and last triple double-quote
    in the file. Files without such a pair are used as-is, minus any line
    that starts with ``#``.

    Args:
        default_text: Value returned when the file cannot be read or
            decoded, or when it contains no prompt text.
        path: Optional override for the prompt file location. When left as
            ``None`` the file is looked up relative to this module.

    Returns:
        The prompt text without leading/trailing whitespace, or
        ``default_text`` if no non-empty prompt could be extracted.
    """
    if path is None:
        path = os.path.join(os.path.dirname(__file__), 'configs', 'system_prompt.md')

    try:
        with open(path, 'r', encoding='utf-8') as f:
            content = f.read()
    except (OSError, ValueError):
        # Deliberately tolerant: absence of the file or a decoding failure
        # (UnicodeDecodeError is a ValueError) falls back to the default
        # prompt rather than breaking the web app.
        return default_text

    marker = '"""'
    first = content.find(marker)
    last = content.rfind(marker)
    if first != -1 and last > first:
        # Never hand back an empty prompt from an empty quoted block.
        return content[first + len(marker):last].strip() or default_text

    # No quoted block present: drop markdown header lines and use the rest.
    non_header = [
        line for line in content.splitlines()
        if not line.strip().startswith('#')
    ]
    return '\n'.join(non_header).strip() or default_text
 class TextilindoAI:
     def __init__(self, api_key):
         self.api_key = api_key
             "Content-Type": "application/json"
         }
         self.model = "qwen/qwen3-235b-a22b-instruct-2507"
+        self.system_prompt = os.getenv(
+            'SYSTEM_PROMPT',
+            load_system_prompt("You are Textilindo AI Assistant. Be concise, helpful, and use Indonesian.")
+        )
         self.dataset = self.load_dataset()
     def load_dataset(self):
         payload = {
             "model": self.model,
+            "messages": [
+                {"role": "system", "content": self.system_prompt},
+                {"role": "user", "content": enhanced_prompt}
+            ],
             "max_tokens": 300,
             "temperature": 0.7,
             "top_p": 0.9