Spaces:

gaunernst
/

layoutlm-docvqa-paddleocr

Running

gaunernst committed on Feb 14, 2024

Commit

90a9cee

verified ·

1 Parent(s): 3366430

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -11,11 +11,9 @@ model_tag = "impira/layoutlm-document-qa"
 MODEL = LayoutLMForQuestionAnswering.from_pretrained(model_tag).eval()
 TOKENIZER = AutoTokenizer.from_pretrained(model_tag)
 OCR = PaddleOCR(
-    use_angle_cls=True,
     lang="en",
     det_limit_side_len=10_000,
     det_db_score_mode="slow",
-    enable_mlkdnn=True,
 )
@@ -27,7 +25,7 @@ def predict(image: Image.Image, question: str, ocr_engine: str):
     image_np = np.array(image)
     if ocr_engine == PADDLE_OCR_LABEL:
-        ocr_result = OCR.ocr(image_np)[0]
         words = [x[1][0] for x in ocr_result]
         boxes = np.asarray([x[0] for x in ocr_result])  # (n_boxes, 4, 2)

 MODEL = LayoutLMForQuestionAnswering.from_pretrained(model_tag).eval()
 TOKENIZER = AutoTokenizer.from_pretrained(model_tag)
 OCR = PaddleOCR(
     lang="en",
     det_limit_side_len=10_000,
     det_db_score_mode="slow",
 )
     image_np = np.array(image)
     if ocr_engine == PADDLE_OCR_LABEL:
+        ocr_result = OCR.ocr(image_np, cls=False)[0]
         words = [x[1][0] for x in ocr_result]
         boxes = np.asarray([x[0] for x in ocr_result])  # (n_boxes, 4, 2)