Spaces:

gauri-sharan
/

test-two

Sleeping

gauri-sharan committed on Sep 29, 2024

Commit

200c7bb

verified ·

1 Parent(s): 47c68aa

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -74,13 +74,13 @@ def ocr_and_extract(image, text_query):
             generated_ids, skip_special_tokens=True, clean_up_tokenization_spaces=False
         )
-        # Filter out system and user prompts
-        filtered_output = [line for line in output_text[0].split("\n") if not any(kw in line.lower() for kw in ["system", "user"])]
         # Clean up the temporary file
         os.remove(temp_image_path)
-        return "\n".join(filtered_output)
     except Exception as e:
         error_message = str(e)

             generated_ids, skip_special_tokens=True, clean_up_tokenization_spaces=False
         )
+        # Filter out "You are a helpful assistant" and "assistant" labels
+        filtered_output = [line for line in output_text[0].split("\n") if not any(kw in line.lower() for kw in ["you are a helpful assistant", "assistant", "user", "system"])]
         # Clean up the temporary file
         os.remove(temp_image_path)
+        return "\n".join(filtered_output).strip()
     except Exception as e:
         error_message = str(e)