Spaces:

ikraamkb
/

qtAnswering

Sleeping

App Files Community

ikraamkb committed on Mar 27

Commit

171f476

verified ·

1 Parent(s): 1f136e0

Update app.py

Browse files

Files changed (1) hide show

app.py +16 -11

app.py CHANGED Viewed

@@ -197,7 +197,7 @@ def truncate_text(text, max_length=2048):
 # ✅ Answer Questions from Image or Document
 def answer_question(file, question: str):
     try:
-        # ✅ Image Processing (Gradio sends images as NumPy arrays)
         if isinstance(file, np.ndarray):
             image = Image.fromarray(file)
             caption = image_captioning_pipeline(image)[0]['generated_text']
@@ -209,26 +209,31 @@ def answer_question(file, question: str):
         if validation_error:
             return validation_error
-        # ✅ Read File Bytes Properly
-        if hasattr(file, "read"):  # Gradio passes file objects
-            file_bytes = file.read()
-        elif isinstance(file, bytes):  # Direct bytes input
-            file_bytes = file
         else:
-            raise ValueError("Unexpected file type received!")
-        # ✅ Get File Extension
         file_ext = file.name.split(".")[-1].lower() if hasattr(file, "name") else None
-        # ✅ Extract Text from Supported Documents
-        text = None
         if file_ext == "pdf":
             text = extract_text_from_pdf(file_bytes)
         elif file_ext in ["docx", "pptx"]:
             text = extract_text_with_tika(file_bytes)
         elif file_ext == "xlsx":
             text = extract_text_from_excel(file_bytes)
         if not text or "❌" in text:
             return f"⚠️ No text extracted. Error: {text}"
@@ -238,7 +243,7 @@ def answer_question(file, question: str):
         return response[0]["generated_text"]
     except Exception as e:
-        print(f"❌ General Processing Error: {e}")  # Log error
         return f"❌ Processing Error: {str(e)}"
 # ✅ Gradio Interface (Unified for Images & Documents)

 # ✅ Answer Questions from Image or Document
 def answer_question(file, question: str):
     try:
+        # ✅ Handle Image Files
         if isinstance(file, np.ndarray):
             image = Image.fromarray(file)
             caption = image_captioning_pipeline(image)[0]['generated_text']
         if validation_error:
             return validation_error
+        # ✅ Extract File Bytes Correctly
+        file_bytes = None
+        if isinstance(file, bytes):
+            file_bytes = file  # Directly received bytes
+        elif hasattr(file, "read"):
+            file_bytes = file.read()  # Read bytes from file object
+        elif isinstance(file, str):
+            return "❌ Error: File received as a string, expected binary data!"
         else:
+            return f"❌ Unexpected file type received! Type: {type(file)}"
+        # ✅ Extract Text Based on File Extension
         file_ext = file.name.split(".")[-1].lower() if hasattr(file, "name") else None
         if file_ext == "pdf":
             text = extract_text_from_pdf(file_bytes)
         elif file_ext in ["docx", "pptx"]:
             text = extract_text_with_tika(file_bytes)
         elif file_ext == "xlsx":
             text = extract_text_from_excel(file_bytes)
+        else:
+            return f"❌ Unsupported file format: {file_ext}"
+        # ✅ Validate Extraction
         if not text or "❌" in text:
             return f"⚠️ No text extracted. Error: {text}"
         return response[0]["generated_text"]
     except Exception as e:
+        print(f"❌ General Processing Error: {e}")  # Log error to console
         return f"❌ Processing Error: {str(e)}"
 # ✅ Gradio Interface (Unified for Images & Documents)