jpohhhh
/

msmarco-MiniLM-L-6-v3_onnx

sentence-embeddings

endpoints-template

Inference Endpoints

Model card Files and versions Community

jpohhhh committed on Jun 21, 2023

Commit

dbdba21

·

1 Parent(s): 2758b9b

Try using path...

Files changed (1) hide show

handler.py +3 -1

handler.py CHANGED Viewed

@@ -2,6 +2,8 @@ from typing import Dict, List, Any
 from transformers import AutoTokenizer, AutoModel
 from optimum.pipelines import pipeline
 from optimum.onnxruntime import ORTModelForFeatureExtraction
 import torch
@@ -16,7 +18,7 @@ class EndpointHandler():
         # self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
         task = "feature-extraction"
         tokenizer = AutoTokenizer.from_pretrained('sentence-transformers/msmarco-MiniLM-L-6-v3')
-        model_regular = ORTModelForFeatureExtraction.from_pretrained("onnx", file_name="model.onnx", from_transformers=False)
         self.onnx_extractor = pipeline(task, model=model_regular, tokenizer=tokenizer)
         # self.model.to(self.device)
         # print("model will run on ", self.device)

 from transformers import AutoTokenizer, AutoModel
 from optimum.pipelines import pipeline
 from optimum.onnxruntime import ORTModelForFeatureExtraction
+from pathlib import Path
 import torch
         # self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
         task = "feature-extraction"
         tokenizer = AutoTokenizer.from_pretrained('sentence-transformers/msmarco-MiniLM-L-6-v3')
+        model_regular = ORTModelForFeatureExtraction.from_pretrained(Path("onnx"), file_name="model.onnx", from_transformers=False)
         self.onnx_extractor = pipeline(task, model=model_regular, tokenizer=tokenizer)
         # self.model.to(self.device)
         # print("model will run on ", self.device)