Spaces:

lightonai
/

LightOnOCR-1B-Demo

Running

App Files Community

staghado committed on Oct 24

Commit

dd3a410

verified ·

1 Parent(s): 734c7e1

Update app.py

Browse files

Files changed (1) hide show

app.py +32 -8

app.py CHANGED Viewed

@@ -46,7 +46,7 @@ def process_pdf(pdf_path, page_num=1):
 def process_input(file_input, temperature, page_num):
     if file_input is None:
-        yield "Please upload an image or PDF first.", "", "", None
         return
     image_to_process = None
@@ -59,18 +59,18 @@ def process_input(file_input, temperature, page_num):
             image_to_process, total_pages, actual_page = process_pdf(file_path, int(page_num))
             page_info = f"Processing page {actual_page} of {total_pages}"
         except Exception as e:
-            yield f"Error processing PDF: {str(e)}", "", "", None
             return
     else:
         try:
             image_to_process = Image.open(file_path)
             page_info = "Processing image"
         except Exception as e:
-            yield f"Error opening image: {str(e)}", "", "", None
             return
     content = [
-        {"type": "text", "text": "Extract the text from this image."},
         {
             "type": "image_url",
             "image_url": {"url": f"data:image/png;base64,{image_to_base64(image_to_process)}"}
@@ -113,16 +113,34 @@ def process_input(file_input, temperature, page_num):
                         if content_delta:
                             accumulated_response += content_delta
                             if first_chunk:
-                                yield accumulated_response, accumulated_response, page_info, image_to_process
                                 first_chunk = False
                             else:
-                                yield accumulated_response, accumulated_response, page_info, gr.update()
                 except json.JSONDecodeError:
                     continue
     except Exception as e:
         error_msg = f"Error: {str(e)}"
-        yield error_msg, error_msg, page_info, image_to_process
 with gr.Blocks(title="📖 Image/PDF OCR", theme=gr.themes.Soft()) as demo:
@@ -193,7 +211,13 @@ with gr.Blocks(title="📖 Image/PDF OCR", theme=gr.themes.Soft()) as demo:
     submit_btn.click(
         fn=process_input,
         inputs=[file_input, temperature, num_pages],
-        outputs=[output_text, raw_output, page_info, rendered_image]
     )
     clear_btn.click(

 def process_input(file_input, temperature, page_num):
     if file_input is None:
+        yield "Please upload an image or PDF first.", "", "", None, gr.update()
         return
     image_to_process = None
             image_to_process, total_pages, actual_page = process_pdf(file_path, int(page_num))
             page_info = f"Processing page {actual_page} of {total_pages}"
         except Exception as e:
+            yield f"Error processing PDF: {str(e)}", "", "", None, gr.update()
             return
     else:
         try:
             image_to_process = Image.open(file_path)
             page_info = "Processing image"
         except Exception as e:
+            yield f"Error opening image: {str(e)}", "", "", None, gr.update()
             return
     content = [
+        {"type": "text", "text": ""},
         {
             "type": "image_url",
             "image_url": {"url": f"data:image/png;base64,{image_to_base64(image_to_process)}"}
                         if content_delta:
                             accumulated_response += content_delta
                             if first_chunk:
+                                yield accumulated_response, accumulated_response, page_info, image_to_process, gr.update()
                                 first_chunk = False
                             else:
+                                yield accumulated_response, accumulated_response, page_info, gr.update(), gr.update()
                 except json.JSONDecodeError:
                     continue
     except Exception as e:
         error_msg = f"Error: {str(e)}"
+        yield error_msg, error_msg, page_info, image_to_process, gr.update()
+def update_slider(file_input):
+    if file_input is None:
+        return gr.update(maximum=20, value=1)
+    file_path = file_input if isinstance(file_input, str) else file_input.name
+    if file_path.lower().endswith('.pdf'):
+        try:
+            pdf = pdfium.PdfDocument(file_path)
+            total_pages = len(pdf)
+            pdf.close()
+            return gr.update(maximum=total_pages, value=1)
+        except:
+            return gr.update(maximum=20, value=1)
+    else:
+        return gr.update(maximum=1, value=1)
 with gr.Blocks(title="📖 Image/PDF OCR", theme=gr.themes.Soft()) as demo:
     submit_btn.click(
         fn=process_input,
         inputs=[file_input, temperature, num_pages],
+        outputs=[output_text, raw_output, page_info, rendered_image, num_pages]
+    )
+    file_input.change(
+        fn=update_slider,
+        inputs=[file_input],
+        outputs=[num_pages]
     )
     clear_btn.click(