Lord-Raven committed on
Commit
2d12eef
·
1 Parent(s): 33cbc37

Trying ONNX models on CPU.

Browse files
Files changed (2) hide show
  1. app.py +3 -3
  2. requirements.txt +1 -1
app.py CHANGED
@@ -31,10 +31,10 @@ file_name = "onnx/model.onnx"
31
 
32
  model_name_cpu = "MoritzLaurer/ModernBERT-large-zeroshot-v2.0"
33
 
34
- model_cpu = ORTModelForSequenceClassification.from_pretrained(model_id=model_name_cpu, file_name=file_name)
35
- tokenizer_cpu = AutoTokenizer.from_pretrained(model_name_cpu)
36
 
37
- classifier_cpu = pipeline(task="zero-shot-classification", model=model_cpu, tokenizer=tokenizer_cpu)
38
  classifier_gpu = pipeline(task="zero-shot-classification", model=model_name, tokenizer=tokenizer_name, device="cuda:0")
39
 
40
  def classify(data_string, request: gradio.Request):
 
31
 
32
  model_name_cpu = "MoritzLaurer/ModernBERT-large-zeroshot-v2.0"
33
 
34
+ # model_cpu = ORTModelForSequenceClassification.from_pretrained(model_id=model_name_cpu, file_name=file_name)
35
+ # tokenizer_cpu = AutoTokenizer.from_pretrained(model_name_cpu)
36
 
37
+ classifier_cpu = pipeline(task="zero-shot-classification", model=model_name_cpu, tokenizer=model_name_cpu)
38
  classifier_gpu = pipeline(task="zero-shot-classification", model=model_name, tokenizer=tokenizer_name, device="cuda:0")
39
 
40
  def classify(data_string, request: gradio.Request):
requirements.txt CHANGED
@@ -4,5 +4,5 @@ huggingface_hub==0.32.4
4
  json5==0.9.25
5
  numpy
6
  uvicorn
7
- optimum[onnxruntime]==1.25.3
8
  transformers==4.51.3
 
4
  json5==0.9.25
5
  numpy
6
  uvicorn
7
+ optimum[onnxruntime-gpu]==1.25.3
8
  transformers==4.51.3