Update interface.py
interface.py  CHANGED  +11 -2
@@ -22,20 +22,27 @@ tokenizer = AutoTokenizer.from_pretrained(model_path)
 model = AutoModelForCausalLM.from_pretrained(model_path)
 # We do not move the model to the device here
 
+from decorators import spaces
+
 @spaces.GPU(duration=100)
-def generate_analysis(prompt, max_length=MAX_LENGTH, device=None):
+def generate_analysis(prompt, max_length=1024, device=None):
     try:
         if device is None:
             device = torch.device('cpu')
+
+        # Move the model to the appropriate device (GPU or CPU)
         if next(model.parameters()).device != device:
             model.to(device)
+
+        # Prepare the input data on the correct device
         input_ids = tokenizer.encode(prompt, return_tensors='pt').to(device)
         max_gen_length = min(max_length + input_ids.size(1), model.config.max_position_embeddings)
 
+        # Generate the text
         generated_ids = model.generate(
             input_ids=input_ids,
             max_length=max_gen_length,
-            temperature=
+            temperature=0.7,
             num_return_sequences=1,
             no_repeat_ngram_size=2,
             early_stopping=True
@@ -44,6 +51,8 @@ def generate_analysis(prompt, max_length=MAX_LENGTH, device=None):
         output_text = tokenizer.decode(generated_ids[0], skip_special_tokens=True)
         analysis = output_text[len(prompt):].strip()
         return analysis
+    except RuntimeError as e:
+        return f"Error during execution: {str(e)}"
     except Exception as e:
         return f"An error occurred during the analysis: {e}"
 
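For reference, a minimal way to exercise the patched function; this is a sketch, not part of the commit, and it assumes interface.py is importable from the Space's working directory and that the prompt shown is a hypothetical stand-in:

import torch

from interface import generate_analysis  # importing interface.py also loads the model and tokenizer

# Prefer GPU when available; generate_analysis itself falls back to CPU when device is None.
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

prompt = "Summarize the following report: ..."  # hypothetical prompt for a smoke test
analysis = generate_analysis(prompt, max_length=256, device=device)
print(analysis)

One caveat on the generation settings in the diff: in transformers, temperature only takes effect when do_sample=True is also passed, so with the arguments shown decoding remains greedy.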