Spaces:

CwAnkit07
/

Question-textractor

Running

CwAnkit07 committed on Feb 8

Commit

7737855

verified ·

1 Parent(s): 42adfb3

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

+from fastapi import FastAPI
+from pydantic import BaseModel
+from transformers import pipeline
+# Build the Hugging Face text-classification pipeline once at import time; the request handler reuses this single instance.
+question_extractor = pipeline("text-classification", model="textattack/bert-base-uncased-MRPC")  # NOTE(review): checkpoint name indicates an MRPC (paraphrase) fine-tune, not a question detector -- confirm this is the intended model
+app = FastAPI()  # application object that the @app.post route below registers on
+# Request body schema for POST /extract_question: a JSON object with one required string field.
+class OCRText(BaseModel):
+    text: str  # newline-separated text to analyse (presumably OCR output, going by the class name)
+@app.post("/extract_question")
+def extract_question(data: OCRText):
+    text = data.text
+    lines = text.split("\n")
+    # Use AI Model to Identify Question Parts
+    ranked_lines = sorted(lines, key=lambda line: question_extractor(line)[0]['score'], reverse=True)
+    top_sentences = [line for line in ranked_lines[:3] if len(line) > 10]  # Keep Top 3 Sentences
+    question_text = " ".join(top_sentences)
+    return {"extracted_question": question_text}