Spaces:

JustKiddo
/

IOTraining

Sleeping

App Files Community

JustKiddo committed 10 days ago

Commit

289913c

•

1 Parent(s): 80eee0f

Update app.py

Browse files

Files changed (1) hide show

app.py +30 -7

app.py CHANGED Viewed

@@ -33,7 +33,7 @@ class VietnameseChatbot:
         # Pre-compute embeddings for faster response generation
         print("Pre-computing conversation embeddings...")
-        self.conversation_embeddings = self._precompute_embeddings()
     def _load_conversation_data(self):
         """
@@ -50,7 +50,7 @@ class VietnameseChatbot:
             {"query": "Bạn từ đâu đến?", "response": "Tôi được phát triển bởi một nhóm kỹ sư AI, và tôn chỉ của tôi là hỗ trợ con người."},
             # Small talk
-            {"query": "Bạn thích gì?", "response": "Tôi thích học hỏi và giú đỡ mọi người. Mỗi cuộc trò chuyện là một cơ hội để tôi phát triển."},
             {"query": "Bạn có thể làm gì?", "response": "Tôi có thể trò chuyện, trả lời câu hỏi, và hỗ trợ bạn trong nhiều tình huống khác nhau."},
             # Weather and time
@@ -67,16 +67,39 @@ class VietnameseChatbot:
         ]
     @st.cache_data
-    def _precompute_embeddings(self):
         """
-        Pre-compute embeddings for all conversation queries
         Cached to avoid recomputing on every run
         """
         embeddings = []
-        for item in self.conversation_data:
-            embedding = self.embed_text(item['query'])
             if embedding is not None:
-                embeddings.append(embedding[0])
         return np.array(embeddings)
     def embed_text(self, text):

         # Pre-compute embeddings for faster response generation
         print("Pre-computing conversation embeddings...")
+        self.conversation_embeddings = self._compute_embeddings()
     def _load_conversation_data(self):
         """
             {"query": "Bạn từ đâu đến?", "response": "Tôi được phát triển bởi một nhóm kỹ sư AI, và tôn chỉ của tôi là hỗ trợ con người."},
             # Small talk
+            {"query": "Bạn thích gì?", "response": "Tôi thích học hỏi và giúp đỡ mọi người. Mỗi cuộc trò chuyện là một cơ hội để tôi phát triển."},
             {"query": "Bạn có thể làm gì?", "response": "Tôi có thể trò chuyện, trả lời câu hỏi, và hỗ trợ bạn trong nhiều tình huống khác nhau."},
             # Weather and time
         ]
     @st.cache_data
+    def _compute_embeddings(queries):
         """
+        Pre-compute embeddings for conversation queries
         Cached to avoid recomputing on every run
         """
+        def embed_single_text(text, tokenizer, model):
+            try:
+                # Tokenize and generate embeddings
+                inputs = tokenizer(text, return_tensors='pt', padding=True, truncation=True)
+                with torch.no_grad():
+                    model_output = model(**inputs)
+                # Mean pooling
+                token_embeddings = model_output[0]
+                input_mask_expanded = inputs['attention_mask'].unsqueeze(-1).expand(token_embeddings.size()).float()
+                embeddings = torch.sum(token_embeddings * input_mask_expanded, 1) / torch.clamp(input_mask_expanded.sum(1), min=1e-9)
+                return embeddings.numpy()[0]
+            except Exception as e:
+                print(f"Embedding error: {e}")
+                return None
+        # Import these arguments to make the function self-contained
+        from transformers import AutoTokenizer, AutoModel
+        tokenizer = AutoTokenizer.from_pretrained('intfloat/multilingual-e5-small')
+        model = AutoModel.from_pretrained('intfloat/multilingual-e5-small', torch_dtype=torch.float16)
         embeddings = []
+        for query in queries:
+            embedding = embed_single_text(query['query'], tokenizer, model)
             if embedding is not None:
+                embeddings.append(embedding)
         return np.array(embeddings)
     def embed_text(self, text):