Spaces:

Noureddinesa
/

Layoutlmv3_v2_space

Running

App Files Files Community

ITSAIDI committed on Apr 17, 2024

Commit

0de3957

1 Parent(s): 8b164b3

sd

Browse files

Files changed (1) hide show

utilitis.py +9 -11

utilitis.py CHANGED Viewed

@@ -7,7 +7,11 @@ import numpy as np
 import time
 model_Hugging_path = "Noureddinesa/Output_LayoutLMv3_v7"
 #############################################################################
 #############################################################################
@@ -16,10 +20,6 @@ def Labels():
     id2label = {v: k for v, k in enumerate(labels)}
     label2id = {k: v for v, k in enumerate(labels)}
     return id2label, label2id
-#############################################################################
-#############################################################################
-ocr = PaddleOCR(use_angle_cls=False,lang='fr',rec=False)
 def processbbox(BBOX, width, height):
@@ -39,10 +39,9 @@ def processbbox(BBOX, width, height):
 def Preprocess(image):
-    ocr = PaddleOCR(use_angle_cls=False,lang='fr',rec=False)
     image_array = np.array(image)
     width, height = image.size
-    results = ocr.ocr(image_array, cls=True)
     results = results[0]
     test_dict = {'image': image ,'tokens':[], "bboxes":[]}
     for item in results :
@@ -77,12 +76,11 @@ def unnormalize_box(bbox, width, height):
 def get_word(bboxes,image):
     x_min, y_min, x_max, y_max = bboxes
     roi = image.crop((x_min, y_min, x_max, y_max)) # Region of interest
-    #roi = enhance_image(roi,1,1.5)
     roi_np = np.array(roi) # To array
-    result = ocr.ocr(roi_np, cls=True) # Apply OCR to ROI
     if result != [None]:
-        return result[0][0][1][0]
-    else:
         return ""
 #############################################################################
 #############################################################################

 import time
 model_Hugging_path = "Noureddinesa/Output_LayoutLMv3_v7"
+ocr = PaddleOCR(use_angle_cls=False,
+                lang='fr',
+                  rec=False,
+                  use_tensorrt = True
+                )
 #############################################################################
 #############################################################################
     id2label = {v: k for v, k in enumerate(labels)}
     label2id = {k: v for v, k in enumerate(labels)}
     return id2label, label2id
 def processbbox(BBOX, width, height):
 def Preprocess(image):
     image_array = np.array(image)
     width, height = image.size
+    results = ocr.ocr(image_array,  cls=False,rec = True)
     results = results[0]
     test_dict = {'image': image ,'tokens':[], "bboxes":[]}
     for item in results :
 def get_word(bboxes,image):
     x_min, y_min, x_max, y_max = bboxes
     roi = image.crop((x_min, y_min, x_max, y_max)) # Region of interest
     roi_np = np.array(roi) # To array
+    result = ocr.ocr(roi_np, cls=False,det = False,rec = True)
     if result != [None]:
+        return result[0][0][0]
+    else :
         return ""
 #############################################################################
 #############################################################################