Defend against float conversion exceptions

Bob Strahan · Bob Strahan · commit 5238e8f2c412 · 2025-06-19T16:39:09.000Z
diff --git a/lib/idp_common_pkg/idp_common/assessment/service.py b/lib/idp_common_pkg/idp_common/assessment/service.py
@@ -858,20 +858,11 @@ def process_document_section(self, document: Document, section_id: str) -> Docum
                         # Create a default assessment structure
                         default_assessment = {
                             "confidence": 0.5,
-                            "confidence_reason": f"LLM returned list format for non-list attribute '{attr_name}'. Using default confidence.",
+                            "confidence_reason": f"LLM returned list format for non-list attribute '{attr_name}'. Using default confidence (0.5) and threshold ({attr_threshold}).",
                             "confidence_threshold": attr_threshold,
                         }
                         enhanced_assessment_data[attr_name] = default_assessment
 
-                        # Add alert since we're using default confidence
-                        if 0.5 < attr_threshold:
-                            confidence_threshold_alerts.append(
-                                {
-                                    "attribute_name": attr_name,
-                                    "confidence": 0.5,
-                                    "confidence_threshold": attr_threshold,
-                                }
-                            )
                 else:
                     # Handle other unexpected types
                     logger.warning(
@@ -882,21 +873,11 @@ def process_document_section(self, document: Document, section_id: str) -> Docum
                     # Create a default assessment structure
                     default_assessment = {
                         "confidence": 0.5,
-                        "confidence_reason": f"LLM returned unexpected type {type(attr_assessment)} for attribute '{attr_name}'. Using default confidence.",
+                        "confidence_reason": f"LLM returned unexpected type {type(attr_assessment)} for attribute '{attr_name}'. Using default confidence (0.5) and threshold ({attr_threshold}).",
                         "confidence_threshold": attr_threshold,
                     }
                     enhanced_assessment_data[attr_name] = default_assessment
 
-                    # Add alert since we're using default confidence
-                    if 0.5 < attr_threshold:
-                        confidence_threshold_alerts.append(
-                            {
-                                "attribute_name": attr_name,
-                                "confidence": 0.5,
-                                "confidence_threshold": attr_threshold,
-                            }
-                        )
-
             # Update the existing extraction result with enhanced assessment data
             extraction_data["explainability_info"] = [enhanced_assessment_data]
             extraction_data["metadata"] = extraction_data.get("metadata", {})
diff --git a/patterns/pattern-3/template.yaml b/patterns/pattern-3/template.yaml
@@ -377,7 +377,19 @@ Resources:
               model:
                 type: string
                 description: Model identifier
-                enum: ["us.amazon.nova-lite-v1:0", "us.amazon.nova-pro-v1:0", "us.amazon.nova-premier-v1:0", "us.anthropic.claude-3-haiku-20240307-v1:0", "us.anthropic.claude-3-5-sonnet-20241022-v2:0", "us.anthropic.claude-3-7-sonnet-20250219-v1:0", "us.anthropic.claude-sonnet-4-20250514-v1:0", "us.anthropic.claude-opus-4-20250514-v1:0"]
+                enum: 
+                  - !If 
+                    - HasCustomExtractionModelARN
+                    - !Ref CustomExtractionModelARN
+                    - !Ref AWS::NoValue
+                  - "us.amazon.nova-lite-v1:0"
+                  - "us.amazon.nova-pro-v1:0"
+                  - "us.amazon.nova-premier-v1:0"
+                  - "us.anthropic.claude-3-haiku-20240307-v1:0"
+                  - "us.anthropic.claude-3-5-sonnet-20241022-v2:0"
+                  - "us.anthropic.claude-3-7-sonnet-20250219-v1:0"
+                  - "us.anthropic.claude-sonnet-4-20250514-v1:0"
+                  - "us.anthropic.claude-opus-4-20250514-v1:0"
                 order: 1
               temperature:
                 type: number
@@ -404,49 +416,50 @@ Resources:
                 order: 6
               task_prompt:
                 type: string
-                description: Task prompt - supports placeholders {DOCUMENT_CLASS} (replaced with the detected class label), {ATTRIBUTE_NAMES_AND_DESCRIPTIONS} (replaced with the attribute names and descriptions for the detected class), and {DOCUMENT_TEXT} (replaced by the OCR output). Optionally use <<CACHEPOINT>> to separate static and dynamic elements of prompt for Bedrock prompt caching.
+                description: Task prompt - supports placeholders {DOCUMENT_CLASS} (replaced with the detected class label), {ATTRIBUTE_NAMES_AND_DESCRIPTIONS} (replaced with the attribute names and descriptions for the detected class), {FEW_SHOT_EXAMPLES} (replaced by classPrompt and image data from examples in class definitions), {DOCUMENT_TEXT} (replaced by the OCR output), and {DOCUMENT_IMAGE} (replaced by the page image attachments for each page). Optionally use <<CACHEPOINT>> to separate static and dynamic elements of prompt for Bedrock prompt caching.
                 order: 7
-          evaluation:
+          assessment:
             order: 5
             type: object
-            sectionLabel: Evaluation Inference
+            sectionLabel: Assessment Inference
             properties:
-              llm_method:
-                type: object
-                properties:
-                  model:
-                    type: string
-                    description: Bedrock model ID
-                    enum: ["us.amazon.nova-lite-v1:0", "us.amazon.nova-pro-v1:0", "us.amazon.nova-premier-v1:0", "us.anthropic.claude-3-haiku-20240307-v1:0", "us.anthropic.claude-3-5-sonnet-20241022-v2:0", "us.anthropic.claude-3-7-sonnet-20250219-v1:0", "us.anthropic.claude-sonnet-4-20250514-v1:0", "us.anthropic.claude-opus-4-20250514-v1:0"]
-                    order: 1
-                  temperature:
-                    type: number
-                    description: Sampling temperature
-                    default: 0.0
-                    order: 2
-                  top_k:
-                    type: number
-                    description: Sampling Top K
-                    default: 250
-                    order: 3
-                  top_p:
-                    type: number
-                    description: Sampling Top P
-                    order: 4
-                  max_tokens:
-                    type: number
-                    description: Max tokens
-                    order: 5
-                  system_prompt:
-                    type: string
-                    format: textarea
-                    description: System prompt for LLM evaluation
-                    order: 6
-                  task_prompt:
-                    type: string
-                    format: textarea
-                    description: Task prompt for LLM evaluation - supports parameters {DOCUMENT_CLASS}, {ATTRIBUTE_NAME}, {ATTRIBUTE_DESCRIPTION}, {EXPECTED_VALUE} and {ACTUAL_VALUE}
-                    order: 7
+              default_confidence_threshold:
+                type: number
+                description: Default confidence threshold for all attributes (0.0 to 1.0). If an attribute doesn't have its own threshold, this default will be used for confidence threshold alerts.
+                minimum: 0
+                maximum: 1
+                order: 1
+              model:
+                type: string
+                description: Bedrock model ID
+                enum: ["us.amazon.nova-lite-v1:0", "us.amazon.nova-pro-v1:0", "us.amazon.nova-premier-v1:0", "us.anthropic.claude-3-haiku-20240307-v1:0", "us.anthropic.claude-3-5-sonnet-20241022-v2:0", "us.anthropic.claude-3-7-sonnet-20250219-v1:0", "us.anthropic.claude-sonnet-4-20250514-v1:0", "us.anthropic.claude-opus-4-20250514-v1:0"]
+                order: 2
+              temperature:
+                type: number
+                description: Sampling temperature
+                order: 3
+              top_k:
+                type: number
+                description: Sampling Top K
+                order: 4
+              top_p:
+                type: number
+                description: Sampling Top P
+                order: 5
+              max_tokens:
+                type: number
+                description: Max tokens
+                order: 6
+              system_prompt:
+                type: string
+                format: textarea
+                description: System prompt
+                order: 7
+              task_prompt:
+                type: string
+                format: textarea
+                description: Task prompt - supports placeholders {DOCUMENT_TEXT} (markdown text), {OCR_TEXT_CONFIDENCE} (OCR text blocks with confidence), {DOCUMENT_CLASS}, {ATTRIBUTE_NAMES_AND_DESCRIPTIONS}, {EXTRACTION_RESULTS} and {DOCUMENT_IMAGE}. Use <<CACHEPOINT>> to separate static and dynamic elements of prompt for Bedrock prompt caching.
+                order: 8
           summarization:
             order: 6
             type: object
@@ -483,10 +496,51 @@ Resources:
                 format: textarea
                 description: Task prompt - supports parameter {DOCUMENT_TEXT}. Optionally use <<CACHEPOINT>> to separate static and dynamic elements of prompt for Bedrock prompt caching.
                 order: 7
-          pricing:
+          evaluation:
             order: 7
+            type: object
+            sectionLabel: Evaluation Inference
+            properties:
+              llm_method:
+                type: object
+                properties:
+                  model:
+                    type: string
+                    description: Bedrock model ID
+                    enum: ["us.amazon.nova-lite-v1:0", "us.amazon.nova-pro-v1:0", "us.amazon.nova-premier-v1:0", "us.anthropic.claude-3-haiku-20240307-v1:0", "us.anthropic.claude-3-5-sonnet-20241022-v2:0", "us.anthropic.claude-3-7-sonnet-20250219-v1:0", "us.anthropic.claude-sonnet-4-20250514-v1:0", "us.anthropic.claude-opus-4-20250514-v1:0"]
+                    order: 1
+                  temperature:
+                    type: number
+                    description: Sampling temperature
+                    default: 0.0
+                    order: 2
+                  top_k:
+                    type: number
+                    description: Sampling Top K
+                    default: 250
+                    order: 3
+                  top_p:
+                    type: number
+                    description: Sampling Top P
+                    order: 4
+                  max_tokens:
+                    type: number
+                    description: Max tokens
+                    order: 5
+                  system_prompt:
+                    type: string
+                    format: textarea
+                    description: System prompt for LLM evaluation
+                    order: 6
+                  task_prompt:
+                    type: string
+                    format: textarea
+                    description: Task prompt for LLM evaluation - supports placeholders {DOCUMENT_CLASS}, {ATTRIBUTE_NAME}, {ATTRIBUTE_DESCRIPTION}, {EXPECTED_VALUE} and {ACTUAL_VALUE}
+                    order: 7
+          pricing:
+            order: 8
             type: array
-            sectionLabel: Pricing Estimates - check https://aws.amazon.com/bedrock/pricing/ & https://aws.amazon.com/textract/pricing/
+            sectionLabel: Pricing (Estimates only - check https://aws.amazon.com/bedrock/pricing/ & https://aws.amazon.com/textract/pricing/)
             listLabel: Services
             itemLabel: Service/API
             columns: 2