Update handler.py
Browse files
- handler.py +1 -1
handler.py
CHANGED
@@ -5,7 +5,7 @@ MAX_TOKENS=8192
|
|
5 |
|
6 |
class EndpointHandler():
|
7 |
def __init__(self, data):
|
8 |
-
self.model = Llama.from_pretrained("
|
9 |
|
10 |
def __call__(self, data: Dict[str, Any]) -> List[Dict[str, Any]]:
|
11 |
inputs = data.pop("inputs", "")
|
|
|
5 |
|
6 |
class EndpointHandler():
|
7 |
def __init__(self, data):
|
8 |
+
self.model = Llama.from_pretrained("lmstudio-ai/gemma-2b-it-GGUF", filename="gemma-2b.q8_0.gguf", n_ctx=8192, cache_dir="./", n_gpu_layers=99)
|
9 |
|
10 |
def __call__(self, data: Dict[str, Any]) -> List[Dict[str, Any]]:
|
11 |
inputs = data.pop("inputs", "")
|