jdgalvan
/

Phi-3-mini-4k-instruct

Text Generation

text-generation-inference

Inference Endpoints

Model card Files Files and versions Community

jdgalvan committed on Jul 9, 2024

Commit

e06a121

·

verified ·

1 Parent(s): f98e8e2

Delete handler.py

Files changed (1) hide show

handler.py +0 -32

handler.py DELETED Viewed

@@ -1,32 +0,0 @@
-from typing import Dict, List, Any
-from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
-class EndpointHandler():
-    def __init__(self, path=""):
-      # Load model directly
-        model = AutoModelForCausalLM.from_pretrained(
-            "jdgalvan/Phi-3-mini-4k-instruct",
-            device_map="cuda",
-            torch_dtype="auto",
-            trust_remote_code=True,
-        )
-        tokenizer = AutoTokenizer.from_pretrained("jdgalvan/Phi-3-mini-4k-instruct")
-        self.pipe = pipeline(
-            "text-generation",
-            model=model,
-            tokenizer=tokenizer,
-        )
-    def __call__(self, data: Dict[str, Any]) -> List[Dict[str, Any]]:
-        inputs = data.pop("inputs", data)
-        parameters = data.pop("parameters", None)
-        # pass inputs with all kwargs in data
-        if parameters is not None:
-            prediction = self.pipe(inputs, **parameters)
-        else:
-            prediction = self.pipe(inputs)
-        return prediction