Try passing model repo [deploy failing]
Browse files
It's really strange: the philschmid fork loads fine, but a duplicate of the philschmid fork in this repo doesn't.
- handler.py +1 -1
handler.py
CHANGED
@@ -14,7 +14,7 @@ def mean_pooling(model_output, attention_mask):
|
|
14 |
class EndpointHandler():
|
15 |
def __init__(self, path=""):
|
16 |
# load the optimized model
|
17 |
-
self.model = ORTModelForFeatureExtraction.from_pretrained(
|
18 |
self.tokenizer = AutoTokenizer.from_pretrained(path)
|
19 |
|
20 |
def __call__(self, data: Any) -> List[List[float]]:
|
|
|
14 |
class EndpointHandler():
|
15 |
def __init__(self, path=""):
|
16 |
# load the optimized model
|
17 |
+
self.model = ORTModelForFeatureExtraction.from_pretrained("jpohhhh/MiniLM-L6-v2-optimum-embeddings", file_name="model-quantized.onnx")
|
18 |
self.tokenizer = AutoTokenizer.from_pretrained(path)
|
19 |
|
20 |
def __call__(self, data: Any) -> List[List[float]]:
|