Spaces:

kh-CHEUNG
/

test_img_text-streamlit

Sleeping

kh-CHEUNG committed on Apr 16, 2024

Commit

ae12c74

verified ·

1 Parent(s): 4eea76c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -36,10 +36,6 @@ def unnormalize_box(box, image_width, image_height):
     return [x1, y1, x2, y2]
-# Get the coordinates from the output text and denormalize them
-coordinates = extract_coordinates(output_text)
-coordinates = unnormalize_box(coordinates, unnormalized_image.width, unnormalized_image.height)
 processor = AutoProcessor.from_pretrained("microsoft/udop-large", apply_ocr=True)
 model = UdopForConditionalGeneration.from_pretrained("microsoft/udop-large")
@@ -93,14 +89,21 @@ with col2:
                 st.write(output_text)
             case "Layout Analysis":
                 output_text = processor.batch_decode(model_output, skip_special_tokens=False)[0]
                 mean = processor.image_processor.image_mean
                 std = processor.image_processor.image_std
                 unnormalized_image = (encoding.pixel_values.squeeze().numpy() * np.array(std)[:, None, None]) + np.array(mean)[:, None, None]
                 unnormalized_image = (unnormalized_image * 255).astype(np.uint8)
                 unnormalized_image = np.moveaxis(unnormalized_image, 0, -1)
                 unnormalized_image = Image.fromarray(unnormalized_image)
                 draw = ImageDraw.Draw(unnormalized_image)
                 draw.rectangle(coordinates, outline="red")
                 st.image(unnormalized_image, caption="Output Image")
     elif testButton and selected_file == "None":
         st.write("Please upload and select a document (/an image).")

     return [x1, y1, x2, y2]
 processor = AutoProcessor.from_pretrained("microsoft/udop-large", apply_ocr=True)
 model = UdopForConditionalGeneration.from_pretrained("microsoft/udop-large")
                 st.write(output_text)
             case "Layout Analysis":
                 output_text = processor.batch_decode(model_output, skip_special_tokens=False)[0]
                 mean = processor.image_processor.image_mean
                 std = processor.image_processor.image_std
                 unnormalized_image = (encoding.pixel_values.squeeze().numpy() * np.array(std)[:, None, None]) + np.array(mean)[:, None, None]
                 unnormalized_image = (unnormalized_image * 255).astype(np.uint8)
                 unnormalized_image = np.moveaxis(unnormalized_image, 0, -1)
                 unnormalized_image = Image.fromarray(unnormalized_image)
+                # Get the coordinates from the output text and denormalize them
+                coordinates = extract_coordinates(output_text)
+                coordinates = unnormalize_box(coordinates, unnormalized_image.width, unnormalized_image.height)
                 draw = ImageDraw.Draw(unnormalized_image)
                 draw.rectangle(coordinates, outline="red")
                 st.image(unnormalized_image, caption="Output Image")
     elif testButton and selected_file == "None":
         st.write("Please upload and select a document (/an image).")