Spaces:

winamnd
/

ocr-llm-test

Running

winamnd committed on Feb 16

Commit

a30c719

verified ·

1 Parent(s): 8a941fb

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,6 +5,7 @@ import csv
 import os
 import cv2
 import numpy as np
 import easyocr
 import keras_ocr
 from paddleocr import PaddleOCR
@@ -78,32 +79,23 @@ def generate_ocr(method, img):
     return text_output, label
-# Save extracted text to JSON & CSV (in the specified repository)
 def save_results(text, label):
     data = {"text": text, "label": label}
-    # Ensure the repository exists
-    repo_path = "./winamnd/ocr-llm-test"
-    if not os.path.exists(repo_path):
-        os.makedirs(repo_path)
-    # Define the full file paths for JSON and CSV
-    results_json = os.path.join(repo_path, "ocr_results.json")
-    results_csv = os.path.join(repo_path, "ocr_results.csv")
     # Save to JSON
-    if not os.path.exists(results_json):
-        with open(results_json, "w") as f:
             json.dump([], f)
-    with open(results_json, "r+") as f:
         content = json.load(f)
         content.append(data)
         f.seek(0)
         json.dump(content, f, indent=4)
     # Save to CSV
-    file_exists = os.path.exists(results_csv)
-    with open(results_csv, "a", newline="") as f:
         writer = csv.DictWriter(f, fieldnames=["text", "label"])
         if not file_exists:
             writer.writeheader()

 import os
 import cv2
 import numpy as np
+import pandas as pd
 import easyocr
 import keras_ocr
 from paddleocr import PaddleOCR
     return text_output, label
+# Save extracted text to JSON & CSV
 def save_results(text, label):
     data = {"text": text, "label": label}
     # Save to JSON
+    if not os.path.exists(RESULTS_JSON):
+        with open(RESULTS_JSON, "w") as f:
             json.dump([], f)
+    with open(RESULTS_JSON, "r+") as f:
         content = json.load(f)
         content.append(data)
         f.seek(0)
         json.dump(content, f, indent=4)
     # Save to CSV
+    file_exists = os.path.exists(RESULTS_CSV)
+    with open(RESULTS_CSV, "a", newline="") as f:
         writer = csv.DictWriter(f, fieldnames=["text", "label"])
         if not file_exists:
             writer.writeheader()