CwAnkit07's picture
Update app.py
36765fa verified
raw
history blame
713 Bytes
from fastapi import FastAPI
from pydantic import BaseModel
from transformers import pipeline
# Text-classification pipeline backed by the model files in the local
# ./model directory. Built once at import time and reused by the endpoint.
question_extractor = pipeline(task="text-classification", model="./model")

# FastAPI application object that the route decorator below registers on.
app = FastAPI()
class OCRText(BaseModel):
    """Request body accepted by the ``/extract_question`` endpoint."""

    # Text to analyse; the endpoint processes it line by line.
    text: str
@app.post("/extract_question")
def extract_question(data: OCRText):
    """Return the lines of the submitted text that the classifier scores highest.

    The text is split into lines, each line is stripped of surrounding
    whitespace, and lines of 10 characters or fewer are discarded. The
    remaining lines are scored with ``question_extractor`` and the three
    highest-scoring ones are joined with single spaces, best first.

    Args:
        data: Request body whose ``text`` field holds the text to analyse.

    Returns:
        A dict of the form ``{"extracted_question": <str>}``. The string is
        empty when no line is longer than 10 characters.
    """
    min_length = 10  # a line must be strictly longer than this to qualify
    max_sentences = 3

    # Filter BEFORE ranking: otherwise blank/short lines cost an inference
    # each and can occupy top slots, only to be thrown away afterwards,
    # yielding fewer than ``max_sentences`` results. ``splitlines()`` also
    # copes with "\r\n" line endings, which ``split("\n")`` does not.
    candidates = [
        stripped
        for stripped in (line.strip() for line in data.text.splitlines())
        if len(stripped) > min_length
    ]

    def confidence(line):
        # NOTE(review): this is the score of the top predicted label,
        # whichever label that is -- confirm against the model's label set
        # that a high score really means "looks like a question".
        return question_extractor(line)[0]["score"]

    # ``sorted`` evaluates the key once per element and is stable, so ties
    # keep their order of appearance in the text.
    ranked = sorted(candidates, key=confidence, reverse=True)

    return {"extracted_question": " ".join(ranked[:max_sentences])}