Spaces:

madhavkotecha
/

OCR_with_LLMs

Running

madhavkotecha committed on Nov 27, 2024

Commit

69e1964

verified ·

1 Parent(s): 38eb8df

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -7,6 +7,7 @@ import pandas as pd
 from nltk.translate import bleu_score
 from nltk.translate.bleu_score import SmoothingFunction
 import torch
 yolo_weights_path = "final_wts.pt"
@@ -183,3 +184,33 @@ logits_flattened = slogits.reshape(-1, slogits.shape[-1])
 processor.batch_decode([logits_flattened.argmax(-1)], skip_special_tokens=True)

 from nltk.translate import bleu_score
 from nltk.translate.bleu_score import SmoothingFunction
 import torch
+import gradio as gr
 yolo_weights_path = "final_wts.pt"
 processor.batch_decode([logits_flattened.argmax(-1)], skip_special_tokens=True)
+---------------------------------------
+def gradio_inference(image_path):
+    """
+    Function to handle inference and output the generated texts and final processed texts.
+    """
+    df, bounding_path, tokens, logits, gen_texts = inference(image_path, debug=False, return_texts='final_v2')
+    # Convert the DataFrame for final texts to a readable format
+    final_texts = df.to_string(index=False)
+    # Convert the list of generated texts into a readable string
+    gen_texts_output = '\n'.join(gen_texts)
+    return gen_texts_output, final_texts
+image_input = gr.inputs.Image(type="filepath", label="Upload Image")
+generated_output = gr.outputs.Textbox(label="Generated Texts")
+final_output = gr.outputs.Textbox(label="Final Processed Texts")
+interface = gr.Interface(
+    fn=gradio_inference,
+    inputs=image_input,
+    outputs=[generated_output, final_output],
+    title="OCR using LLMs",
+    description="Upload an image and get generated and final processed texts",
+)
+interface.launch()