jpohhhh committed on
Commit
26a30ca
·
1 Parent(s): 6e21725

Try passing model repo [deploy failing]

Browse files

It's really strange: the philschmid fork loads fine, but a duplicate of
the philschmid fork in this repo doesn't.

Files changed (1) hide show
  1. handler.py +1 -1
handler.py CHANGED
@@ -14,7 +14,7 @@ def mean_pooling(model_output, attention_mask):
14
  class EndpointHandler():
15
  def __init__(self, path=""):
16
  # load the optimized model
17
- self.model = ORTModelForFeatureExtraction.from_pretrained(path, file_name="model-quantized.onnx")
18
  self.tokenizer = AutoTokenizer.from_pretrained(path)
19
 
20
  def __call__(self, data: Any) -> List[List[float]]:
 
14
  class EndpointHandler():
15
  def __init__(self, path=""):
16
  # load the optimized model
17
+ self.model = ORTModelForFeatureExtraction.from_pretrained("jpohhhh/MiniLM-L6-v2-optimum-embeddings", file_name="model-quantized.onnx")
18
  self.tokenizer = AutoTokenizer.from_pretrained(path)
19
 
20
  def __call__(self, data: Any) -> List[List[float]]: