Update app.py
app.py
CHANGED
@@ -1,5 +1,4 @@
 from fastapi import FastAPI, HTTPException, Request
-from pydantic import BaseModel
 import uvicorn
 import requests
 import os
@@ -8,7 +7,7 @@ import time
 import asyncio
 from typing import List, Dict, Any
 from tqdm import tqdm
-from llama_cpp import Llama
+from llama_cpp import Llama
 
 app = FastAPI()
 
@@ -69,11 +68,10 @@ class ModelManager:
         temp_filename = await self.save_model_to_temp_file(model_config)
         start_time = time.time()
         print(f"Cargando modelo desde {temp_filename}")
-        # Asegúrate de usar el método correcto para cargar el modelo
         llama = Llama.load(temp_filename)
         end_time = time.time()
         load_duration = end_time - start_time
-        if load_duration > 0:
+        if load_duration > 0.5:
             print(f"Modelo {model_config['name']} tardó {load_duration:.2f} segundos en cargar, dividiendo automáticamente")
             await self.handle_large_model(temp_filename, model_config)
         else:
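
The last hunk times Llama.load(temp_filename) and, with this change, only routes models that take more than 0.5 seconds to load into handle_large_model. Note that stock llama-cpp-python exposes the Llama(model_path=...) constructor rather than a Llama.load() classmethod, so the call in app.py is presumably a project-specific wrapper. A minimal sketch of the same load-and-time pattern, assuming the standard constructor and a hypothetical threshold constant:

# Sketch only: assumes the standard llama-cpp-python constructor instead of the
# Llama.load() helper referenced in the diff. The 0.5 s threshold mirrors the
# new `load_duration > 0.5` check.
import time
from llama_cpp import Llama

LOAD_THRESHOLD_SECONDS = 0.5  # hypothetical constant for the split decision

def load_and_measure(model_path: str):
    """Load a GGUF model and return it along with the load time in seconds."""
    start = time.time()
    llama = Llama(model_path=model_path)  # the constructor itself loads the weights
    duration = time.time() - start
    return llama, duration

# Usage: route slow-loading models to a "large model" path, as app.py does with
# handle_large_model() when the load exceeds the threshold.
# llama, duration = load_and_measure("/tmp/model.gguf")
# if duration > LOAD_THRESHOLD_SECONDS:
#     ...  # split or offload the model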