uk-en-translator

Running on Zero

Yehor committed 28 days ago

Commit

26a7c02

verified ·

1 Parent(s): 477660f

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -10,13 +10,13 @@ import torch
 import torchaudio
 import gradio as gr
 import torchaudio.transforms as T
-import easyocr
 import polars as pl
 from importlib.metadata import version
 from gradio.utils import is_zero_gpu_space
 from gradio.themes import Base
 from transformers import (
     AutoModelForCausalLM,
     AutoTokenizer,
@@ -67,7 +67,12 @@ audio_model = AutoModelForCTC.from_pretrained(
 processor = Wav2Vec2BertProcessor.from_pretrained("Yehor/w2v-bert-uk-v2.1-bf16")
 # Load OCR
-ocr_model = easyocr.Reader(["uk"], gpu=True)
 # Examples
 examples_text = [
@@ -299,7 +304,12 @@ def inference_image(image, progress=gr.Progress()):
     if not isinstance(image, str):
         raise gr.Error("Please paste your image file.")
-    results = ocr_model.readtext(image, detail=0)
     text = " ".join(results)
     print("Text:", text)

 import torchaudio
 import gradio as gr
 import torchaudio.transforms as T
 import polars as pl
 from importlib.metadata import version
 from gradio.utils import is_zero_gpu_space
 from gradio.themes import Base
+from paddleocr import PaddleOCR
 from transformers import (
     AutoModelForCausalLM,
     AutoTokenizer,
 processor = Wav2Vec2BertProcessor.from_pretrained("Yehor/w2v-bert-uk-v2.1-bf16")
 # Load OCR
+ocr_model = PaddleOCR(
+    lang="uk",
+    use_doc_orientation_classify=False,
+    use_doc_unwarping=False,
+    use_textline_orientation=False,
+)
 # Examples
 examples_text = [
     if not isinstance(image, str):
         raise gr.Error("Please paste your image file.")
+    predictions = ocr_model.predict(image)
+    results = []
+    for prediction in predictions:
+      results.append(' '.join(prediction['rec_texts']))
     text = " ".join(results)
     print("Text:", text)