jpohhhh
/

msmarco-MiniLM-L-6-v3_onnx

sentence-embeddings

endpoints-template

Inference Endpoints

Model card Files and versions Community

jpohhhh committed on Jun 21, 2023

Commit

df00d4a

·

1 Parent(s): dbdba21

Update handler.py

Files changed (1) hide show

handler.py +4 -2

handler.py CHANGED Viewed

@@ -4,7 +4,7 @@ from optimum.pipelines import pipeline
 from optimum.onnxruntime import ORTModelForFeatureExtraction
 from pathlib import Path
 import torch
 #Mean Pooling - Take attention mask into account for correct averaging
@@ -15,10 +15,12 @@ def mean_pooling(model_output, attention_mask):
 class EndpointHandler():
     def __init__(self, path=""):
         # self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
         task = "feature-extraction"
         tokenizer = AutoTokenizer.from_pretrained('sentence-transformers/msmarco-MiniLM-L-6-v3')
-        model_regular = ORTModelForFeatureExtraction.from_pretrained(Path("onnx"), file_name="model.onnx", from_transformers=False)
         self.onnx_extractor = pipeline(task, model=model_regular, tokenizer=tokenizer)
         # self.model.to(self.device)
         # print("model will run on ", self.device)

 from optimum.onnxruntime import ORTModelForFeatureExtraction
 from pathlib import Path
+import os
 import torch
 #Mean Pooling - Take attention mask into account for correct averaging
 class EndpointHandler():
     def __init__(self, path=""):
+        print("HELLO THIS IS THE CWD:", os.getcwd())
+        print("HELLO THIS IS THE PATH ARG:", path)
         # self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
         task = "feature-extraction"
         tokenizer = AutoTokenizer.from_pretrained('sentence-transformers/msmarco-MiniLM-L-6-v3')
+        model_regular = ORTModelForFeatureExtraction.from_pretrained(Path(path / "onnx"), file_name="model.onnx", from_transformers=False)
         self.onnx_extractor = pipeline(task, model=model_regular, tokenizer=tokenizer)
         # self.model.to(self.device)
         # print("model will run on ", self.device)