MrOvkill committed on
Commit
4405341
·
verified ·
1 Parent(s): 02bec62

Update handler.py

Browse files
Files changed (1) hide show
  1. handler.py +1 -1
handler.py CHANGED
@@ -5,7 +5,7 @@ MAX_TOKENS=8192
5
 
6
  class EndpointHandler():
7
  def __init__(self, data):
8
- self.model = Llama.from_pretrained("MrOvkill/gemma-2-inference-endpoint-GGUF", filename="gemma-2b.q8_0.gguf")
9
 
10
  def __call__(self, data: Dict[str, Any]) -> List[Dict[str, Any]]:
11
  inputs = data.pop("inputs", "")
 
5
 
6
  class EndpointHandler():
7
  def __init__(self, data):
8
+ self.model = Llama.from_pretrained("lmstudio-ai/gemma-2b-it-GGUF", filename="gemma-2b.q8_0.gguf", n_ctx=8192, cache_dir="./", n_gpu_layers=99)
9
 
10
  def __call__(self, data: Dict[str, Any]) -> List[Dict[str, Any]]:
11
  inputs = data.pop("inputs", "")