Lord-Raven committed on
Commit
3e5a168
·
1 Parent(s): 30d670a

Playing with models.

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -11,7 +11,7 @@ from optimum.onnxruntime import ORTModelForSequenceClassification
11
  # "Xenova/distilbert-base-uncased-mnli" "typeform/distilbert-base-uncased-mnli" Bad answers
12
  # "Xenova/deBERTa-v3-base-mnli" "MoritzLaurer/DeBERTa-v3-base-mnli" Still a bit slow and not great answers
13
  model_name = "xenova/nli-deberta-v3-small"
14
- file_name = "onnx/model_fp16.onnx"
15
  tokenizer_name = "cross-encoder/nli-deberta-v3-small"
16
  model = ORTModelForSequenceClassification.from_pretrained(model_name, file_name=file_name)
17
  tokenizer = AutoTokenizer.from_pretrained(tokenizer_name, model_max_length=512)
 
11
  # "Xenova/distilbert-base-uncased-mnli" "typeform/distilbert-base-uncased-mnli" Bad answers
12
  # "Xenova/deBERTa-v3-base-mnli" "MoritzLaurer/DeBERTa-v3-base-mnli" Still a bit slow and not great answers
13
  model_name = "xenova/nli-deberta-v3-small"
14
+ file_name = "onnx/model_quantized.onnx"
15
  tokenizer_name = "cross-encoder/nli-deberta-v3-small"
16
  model = ORTModelForSequenceClassification.from_pretrained(model_name, file_name=file_name)
17
  tokenizer = AutoTokenizer.from_pretrained(tokenizer_name, model_max_length=512)