File size: 2,089 Bytes
93643d5
040c521
b0d2a02
e83c60c
3554a8b
d54f118
6b9e813
bd9482b
b0d2a02
 
31fb3f9
 
 
6b9e813
d184de8
31fb3f9
6b9e813
 
 
dc02763
6c40a85
dc02763
cfd4b0d
6b9e813
cfd4b0d
fd25b82
cfd4b0d
cc8b299
fd25b82
b0d2a02
8a243e5
 
 
 
b0d2a02
a822923
 
 
f3bcef9
 
fd25b82
47a0109
daac94f
9704577
0686401
 
5071704
93643d5
 
daac94f
0686401
93643d5
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
import gradio
import json
import torch
from transformers import AutoTokenizer
from transformers import pipeline
from fastapi import FastAPI
from fastapi.middleware.cors import CORSMiddleware
from optimum.onnxruntime import ORTModelForSequenceClassification

# CORS configuration: a FastAPI application whose CORS middleware accepts
# credentialed cross-origin requests, with any method and any header, from the
# single origin listed below.
# NOTE(review): `app` is not referenced again in the visible part of this file,
# so this middleware may not apply to the server Gradio starts -- confirm.
app = FastAPI()

app.add_middleware(
    CORSMiddleware,
    allow_credentials=True,
    allow_headers=["*"],
    allow_methods=["*"],
    # Previously: ["https://statosphere-3704059fdd7e.c5v4v4jx6pq5.win"]
    allow_origins=["https://jhuhman.com"],
)
# "xenova/mobilebert-uncased-mnli" "typeform/mobilebert-uncased-mnli" Fast but small
# "xenova/deberta-v3-base-tasksource-nli" Not impressed
# "Xenova/bart-large-mnli" A bit slow
# "Xenova/distilbert-base-uncased-mnli" "typeform/distilbert-base-uncased-mnli" Bad answers

# Hub identifiers for the selected checkpoint. The ONNX weights and the
# tokenizer are loaded from two different repositories.
model_name = "Xenova/deBERTa-v3-base-mnli"
file_name = "onnx/model_quantized.onnx"
tokenizer_name = "MoritzLaurer/DeBERTa-v3-base-mnli"

# Load the ONNX sequence-classification model and its tokenizer
# (the tokenizer's maximum input length is set to 512).
model = ORTModelForSequenceClassification.from_pretrained(
    model_name,
    file_name=file_name,
)
tokenizer = AutoTokenizer.from_pretrained(
    tokenizer_name,
    model_max_length=512,
)

# Unused alternative, left for reference:
# file = cached_download("https://huggingface.co/" + model_name + "")
# sess = InferenceSession(file)

# Zero-shot classification pipeline shared by every request.
classifier = pipeline(
    task="zero-shot-classification",
    model=model,
    tokenizer=tokenizer,
)

def zero_shot_classification(data_string, request: gradio.Request):
    """Run zero-shot classification on a JSON-encoded request.

    ``data_string`` must decode to a JSON object with the keys ``sequence``,
    ``candidate_labels``, ``hypothesis_template`` and ``multi_label``; these
    are forwarded to the module-level ``classifier`` pipeline.

    Args:
        data_string: JSON text describing the classification request.
        request: The Gradio request for this call. When present, its
            ``origin`` header must be one of the allowed origins.

    Returns:
        The classifier output serialized as a JSON string, or ``"{}"`` when
        the request's origin is missing or not allowed.

    Raises:
        json.JSONDecodeError: If ``data_string`` is not valid JSON.
        KeyError: If a required key is missing from the decoded object.
    """
    # NOTE(review): the CORS middleware configured in this file allows
    # "https://jhuhman.com", which is not in this list -- confirm which set of
    # origins is intended.
    allowed_origins = (
        "https://statosphere-3704059fdd7e.c5v4v4jx6pq5.win",
        "https://jhuhman-statosphere-backend.hf.space",
    )
    if request:
        # NOTE(review): this logs every request header, which can include
        # cookies or authorization values.
        print("Request headers dictionary:", request.headers)
        # Requests without an Origin header (e.g. non-browser clients) used to
        # raise KeyError here; treat them like any other disallowed origin.
        try:
            origin = request.headers["origin"]
        except KeyError:
            origin = None
        if origin not in allowed_origins:
            return "{}"
    print(data_string)
    data = json.loads(data_string)
    print(data)
    results = classifier(
        data['sequence'],
        candidate_labels=data['candidate_labels'],
        hypothesis_template=data['hypothesis_template'],
        multi_label=data['multi_label'],
    )
    return json.dumps(results)

# Gradio front end: one textbox takes the JSON request, one textbox shows the
# JSON response produced by `zero_shot_classification`.
gradio_interface = gradio.Interface(
    fn=zero_shot_classification,
    inputs=gradio.Textbox(label="JSON Input"),
    outputs=gradio.Textbox(),
)

# Start serving the interface as soon as the module is executed.
gradio_interface.launch()