shreyasvaidya
committed on
Upload folder using huggingface_hub
Browse files
app.py
CHANGED
@@ -11,6 +11,12 @@ from transformers import (
|
|
11 |
)
|
12 |
import numpy as np
|
13 |
import torch
|
|
|
|
|
|
|
|
|
|
|
|
|
14 |
|
15 |
from IndicTransToolkit import IndicProcessor
|
16 |
|
@@ -107,6 +113,7 @@ def process_image(image):
|
|
107 |
# # Recognize text in the cropped area
|
108 |
# recognized_text = ocr.recognise(cropped_path, script_lang)
|
109 |
# recognized_texts.append(recognized_text)
|
|
|
110 |
for id, bbox in enumerate(detections):
|
111 |
# Identify the script and crop the image to this region
|
112 |
script_lang, cropped_path = ocr.crop_and_identify_script(pil_image, bbox)
|
@@ -120,13 +127,14 @@ def process_image(image):
|
|
120 |
if script_lang:
|
121 |
recognized_text = ocr.recognise(cropped_path, script_lang)
|
122 |
recognized_texts[f"img_{id}"] = {"txt": recognized_text, "bbox": [x1, y1, x2, y2]}
|
|
|
123 |
|
124 |
# Combine recognized texts into a single string for display
|
125 |
# recognized_texts_combined = " ".join(recognized_texts)
|
126 |
string = detect_para(recognized_texts)
|
127 |
|
128 |
recognized_texts_combined = '\n'.join([' '.join(line) for line in string])
|
129 |
-
recognized_texts_combined = translate(recognized_texts_combined,
|
130 |
|
131 |
return output_image, recognized_texts_combined
|
132 |
|
|
|
11 |
)
|
12 |
import numpy as np
|
13 |
import torch
|
14 |
+
from collections import Counter
|
15 |
+
|
16 |
+
def Most_Common(lst):
|
17 |
+
data = Counter(lst)
|
18 |
+
return data.most_common(1)[0][0]
|
19 |
+
|
20 |
|
21 |
from IndicTransToolkit import IndicProcessor
|
22 |
|
|
|
113 |
# # Recognize text in the cropped area
|
114 |
# recognized_text = ocr.recognise(cropped_path, script_lang)
|
115 |
# recognized_texts.append(recognized_text)
|
116 |
+
langs = []
|
117 |
for id, bbox in enumerate(detections):
|
118 |
# Identify the script and crop the image to this region
|
119 |
script_lang, cropped_path = ocr.crop_and_identify_script(pil_image, bbox)
|
|
|
127 |
if script_lang:
|
128 |
recognized_text = ocr.recognise(cropped_path, script_lang)
|
129 |
recognized_texts[f"img_{id}"] = {"txt": recognized_text, "bbox": [x1, y1, x2, y2]}
|
130 |
+
langs.append(script_lang)
|
131 |
|
132 |
# Combine recognized texts into a single string for display
|
133 |
# recognized_texts_combined = " ".join(recognized_texts)
|
134 |
string = detect_para(recognized_texts)
|
135 |
|
136 |
recognized_texts_combined = '\n'.join([' '.join(line) for line in string])
|
137 |
+
recognized_texts_combined = translate(recognized_texts_combined,Most_Common(langs))
|
138 |
|
139 |
return output_image, recognized_texts_combined
|
140 |
|