aws-solutions-library-samples
diff --git a/‎CHANGELOG.md‎
Lines changed: 6 additions & 0 deletions b/‎CHANGELOG.md‎
Lines changed: 6 additions & 0 deletions
diff --git a/‎VERSION‎
Lines changed: 1 addition & 1 deletion b/‎VERSION‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎lib/idp_common_pkg/idp_common/assessment/granular_service.py‎
Lines changed: 21 additions & 9 deletions b/‎lib/idp_common_pkg/idp_common/assessment/granular_service.py‎
Lines changed: 21 additions & 9 deletions
diff --git a/‎lib/idp_common_pkg/idp_common/assessment/service.py‎
Lines changed: 21 additions & 9 deletions b/‎lib/idp_common_pkg/idp_common/assessment/service.py‎
Lines changed: 21 additions & 9 deletions
diff --git a/‎lib/idp_common_pkg/idp_common/classification/service.py‎
Lines changed: 20 additions & 6 deletions b/‎lib/idp_common_pkg/idp_common/classification/service.py‎
Lines changed: 20 additions & 6 deletions
diff --git a/‎lib/idp_common_pkg/idp_common/extraction/service.py‎
Lines changed: 20 additions & 6 deletions b/‎lib/idp_common_pkg/idp_common/extraction/service.py‎
Lines changed: 20 additions & 6 deletions
diff --git a/‎lib/idp_common_pkg/idp_common/image/__init__.py‎
Lines changed: 45 additions & 13 deletions b/‎lib/idp_common_pkg/idp_common/image/__init__.py‎
Lines changed: 45 additions & 13 deletions
@@ -25,6 +25,12 @@ SPDX-License-Identifier: MIT-0
 
 
 ### Fixed
+- **OCR Service Image Processing for PNG/JPG Files**
+  - Fixed issue where PNG files were being unnecessarily converted to JPEG format and resized
+  - PNG and JPG files now preserve their original format when stored in S3
+  - Image resolution is preserved by default; resizing occurs only when explicitly configured via `resize_config`
+  - DPI settings now only apply to PDF files, not to image files
+  - Resolves issue where PNG files were being converted to lower resolution JPG files
 
 
 ## [0.3.7]
 
@@ -1 +1 @@
-0.3.8-wip1
+0.3.8-wip3
@@ -1098,17 +1098,29 @@ def process_document_section(self, document: Document, section_id: str) -> Docum
                 page = document.pages[page_id]
                 image_uri = page.image_uri
 
+            if target_width is not None and target_height is not None:
+                # Treat blank (empty or whitespace-only) strings as unset; int conversion happens below
+                if isinstance(target_width, str) and not target_width.strip():
+                    target_width = None
+                if isinstance(target_height, str) and not target_height.strip():
+                    target_height = None
+
+                # Only proceed if we have valid values after cleaning
                 if target_width is not None and target_height is not None:
-                    # Cast to int in case config values are strings
-                    target_width = int(target_width)
-                    target_height = int(target_height)
-                    image_content = image.prepare_image(
-                        image_uri, target_width, target_height
-                    )
+                    try:
+                        target_width = int(target_width)
+                        target_height = int(target_height)
+                        image_content = image.prepare_image(
+                            image_uri, target_width, target_height
+                        )
+                    except (ValueError, TypeError) as e:
+                        logger.warning(f"Invalid resize configuration values: {e}")
+                        # Fall back to default image preparation
+                        image_content = image.prepare_image(image_uri)
                 else:
-                    image_content = image.prepare_image(
-                        image_uri
-                    )  # Uses function defaults
+                    image_content = image.prepare_image(image_uri)
+            else:
+                image_content = image.prepare_image(image_uri)  # Uses function defaults
                 page_images.append(image_content)
 
             t3 = time.time()
 
@@ -696,17 +696,29 @@ def process_document_section(self, document: Document, section_id: str) -> Docum
                 page = document.pages[page_id]
                 image_uri = page.image_uri
 
+            if target_width is not None and target_height is not None:
+                # Treat blank (empty or whitespace-only) strings as unset; int conversion happens below
+                if isinstance(target_width, str) and not target_width.strip():
+                    target_width = None
+                if isinstance(target_height, str) and not target_height.strip():
+                    target_height = None
+
+                # Only proceed if we have valid values after cleaning
                 if target_width is not None and target_height is not None:
-                    # Cast to int in case config values are strings
-                    target_width = int(target_width)
-                    target_height = int(target_height)
-                    image_content = image.prepare_image(
-                        image_uri, target_width, target_height
-                    )
+                    try:
+                        target_width = int(target_width)
+                        target_height = int(target_height)
+                        image_content = image.prepare_image(
+                            image_uri, target_width, target_height
+                        )
+                    except (ValueError, TypeError) as e:
+                        logger.warning(f"Invalid resize configuration values: {e}")
+                        # Fall back to default image preparation
+                        image_content = image.prepare_image(image_uri)
                 else:
-                    image_content = image.prepare_image(
-                        image_uri
-                    )  # Uses function defaults
+                    image_content = image.prepare_image(image_uri)
+            else:
+                image_content = image.prepare_image(image_uri)  # Uses function defaults
                 page_images.append(image_content)
 
             t3 = time.time()
 
@@ -618,12 +618,26 @@ def classify_page_bedrock(
                 target_height = image_config.get("target_height")
 
                 if target_width is not None and target_height is not None:
-                    # Cast to int in case config values are strings
-                    target_width = int(target_width)
-                    target_height = int(target_height)
-                    image_content = image.prepare_image(
-                        image_uri, target_width, target_height
-                    )
+                    # Treat blank (empty or whitespace-only) strings as unset; int conversion happens below
+                    if isinstance(target_width, str) and not target_width.strip():
+                        target_width = None
+                    if isinstance(target_height, str) and not target_height.strip():
+                        target_height = None
+
+                    # Only proceed if we have valid values after cleaning
+                    if target_width is not None and target_height is not None:
+                        try:
+                            target_width = int(target_width)
+                            target_height = int(target_height)
+                            image_content = image.prepare_image(
+                                image_uri, target_width, target_height
+                            )
+                        except (ValueError, TypeError) as e:
+                            logger.warning(f"Invalid resize configuration values: {e}")
+                            # Fall back to default image preparation
+                            image_content = image.prepare_image(image_uri)
+                    else:
+                        image_content = image.prepare_image(image_uri)
                 else:
                     image_content = image.prepare_image(
                         image_uri
 
@@ -619,12 +619,26 @@ def process_document_section(self, document: Document, section_id: str) -> Docum
                 page = document.pages[page_id]
                 image_uri = page.image_uri
                 if target_width is not None and target_height is not None:
-                    # Cast to int in case config values are strings
-                    target_width = int(target_width)
-                    target_height = int(target_height)
-                    image_content = image.prepare_image(
-                        image_uri, target_width, target_height
-                    )
+                    # Treat blank (empty or whitespace-only) strings as unset; int conversion happens below
+                    if isinstance(target_width, str) and not target_width.strip():
+                        target_width = None
+                    if isinstance(target_height, str) and not target_height.strip():
+                        target_height = None
+
+                    # Only proceed if we have valid values after cleaning
+                    if target_width is not None and target_height is not None:
+                        try:
+                            target_width = int(target_width)
+                            target_height = int(target_height)
+                            image_content = image.prepare_image(
+                                image_uri, target_width, target_height
+                            )
+                        except (ValueError, TypeError) as e:
+                            logger.warning(f"Invalid resize configuration values: {e}")
+                            # Fall back to default image preparation
+                            image_content = image.prepare_image(image_uri)
+                    else:
+                        image_content = image.prepare_image(image_uri)
                 else:
                     image_content = image.prepare_image(
                         image_uri
 
@@ -12,54 +12,86 @@
 
 def resize_image(image_data: bytes, 
                 target_width: int = 951, 
-                target_height: int = 1268) -> bytes:
+                target_height: int = 1268,
+                allow_upscale: bool = False) -> bytes:
     """
     Resize an image to fit within target dimensions while preserving aspect ratio.
     No padding, no distortion - pure proportional scaling.
+    Preserves original format when possible.
     
     Args:
         image_data: Raw image bytes
         target_width: Target width in pixels
         target_height: Target height in pixels
+        allow_upscale: Whether to allow making the image larger than original
         
     Returns:
-        Resized image as JPEG bytes
+        Resized image bytes in the original format (JPEG if that format is not supported), or the input bytes unchanged when no resize is needed
     """
     image = Image.open(io.BytesIO(image_data))
     current_width, current_height = image.size
+    original_format = image.format  # Store original format
 
     # Calculate scaling factor to fit within bounds while preserving aspect ratio
     width_ratio = target_width / current_width
     height_ratio = target_height / current_height
     scale_factor = min(width_ratio, height_ratio)  # Fit within bounds
 
-    # Only resize if we're making it smaller
-    if scale_factor < 1.0:
+    # Determine if resizing is needed
+    needs_resize = (scale_factor < 1.0) or (allow_upscale and scale_factor > 1.0)
+    
+    if needs_resize:
         new_width = int(current_width * scale_factor)
         new_height = int(current_height * scale_factor)
         logger.info(f"Resizing image from {current_width}x{current_height} to {new_width}x{new_height} (scale: {scale_factor:.3f})")
         image = image.resize((new_width, new_height), Image.LANCZOS)
+        
+        # Save in original format if possible
+        img_byte_array = io.BytesIO()
+        
+        # Determine save format - use original if available, otherwise JPEG
+        if original_format and original_format in ['JPEG', 'PNG', 'GIF', 'BMP', 'TIFF', 'WEBP']:
+            save_format = original_format
+        else:
+            save_format = 'JPEG'
+            logger.info(f"Converting from {original_format or 'unknown'} to JPEG")
+        
+        # Prepare save parameters
+        save_kwargs = {"format": save_format}
+        
+        # Add quality parameters for JPEG
+        if save_format in ['JPEG', 'JPG']:
+            save_kwargs["quality"] = 95  # High quality
+            save_kwargs["optimize"] = True
+        
+        # Handle format-specific requirements
+        if save_format == 'PNG' and image.mode not in ['RGBA', 'LA', 'L', 'P']:
+            # PNG requires specific modes
+            if image.mode == 'CMYK':
+                image = image.convert('RGB')
+        
+        image.save(img_byte_array, **save_kwargs)
+        return img_byte_array.getvalue()
     else:
-        logger.debug(f"Image {current_width}x{current_height} already fits within {target_width}x{target_height}, no resizing needed")
-    
-    # Convert to JPEG bytes
-    img_byte_array = io.BytesIO()
-    image.save(img_byte_array, format="JPEG")
-    return img_byte_array.getvalue()
+        # No resizing needed - return original data unchanged
+        logger.info(f"Image {current_width}x{current_height} already fits within {target_width}x{target_height}, returning original")
+        return image_data
 
 def prepare_image(image_source: Union[str, bytes],
                  target_width: int = 951, 
-                 target_height: int = 1268) -> bytes:
+                 target_height: int = 1268,
+                 allow_upscale: bool = False) -> bytes:
     """
     Prepare an image for model input from either S3 URI or raw bytes
     
     Args:
         image_source: Either an S3 URI (s3://bucket/key) or raw image bytes
         target_width: Target width in pixels
         target_height: Target height in pixels
+        allow_upscale: Whether to allow making the image larger than original
         
     Returns:
-        Processed image as JPEG bytes ready for model input
+        Processed image bytes ready for model input (preserves format when possible)
     """
     # Get the image data
     if isinstance(image_source, str) and image_source.startswith('s3://'):
@@ -70,7 +102,7 @@ def prepare_image(image_source: Union[str, bytes],
         raise ValueError(f"Invalid image source: {type(image_source)}. Must be S3 URI or bytes.")
 
     # Resize and process
-    return resize_image(image_data, target_width, target_height)
+    return resize_image(image_data, target_width, target_height, allow_upscale)
 
 def apply_adaptive_binarization(image_data: bytes) -> bytes:
     """