aws-solutions-library-samples
diff --git a/‎CHANGELOG.md‎
Lines changed: 11 additions & 0 deletions b/‎CHANGELOG.md‎
Lines changed: 11 additions & 0 deletions
diff --git a/‎config_library/pattern-1/lending-package-sample/config.yaml‎
Lines changed: 8 additions & 8 deletions b/‎config_library/pattern-1/lending-package-sample/config.yaml‎
Lines changed: 8 additions & 8 deletions
diff --git a/‎config_library/pattern-2/bank-statement-sample/config.yaml‎
Lines changed: 9 additions & 9 deletions b/‎config_library/pattern-2/bank-statement-sample/config.yaml‎
Lines changed: 9 additions & 9 deletions
diff --git a/‎config_library/pattern-2/criteria-validation/config.yaml‎
Lines changed: 4 additions & 4 deletions b/‎config_library/pattern-2/criteria-validation/config.yaml‎
Lines changed: 4 additions & 4 deletions
diff --git a/‎config_library/pattern-2/lending-package-sample/config.yaml‎
Lines changed: 9 additions & 9 deletions b/‎config_library/pattern-2/lending-package-sample/config.yaml‎
Lines changed: 9 additions & 9 deletions
diff --git a/‎config_library/pattern-2/rvl-cdip-package-sample-with-few-shot-examples/config.yaml‎
Lines changed: 9 additions & 9 deletions b/‎config_library/pattern-2/rvl-cdip-package-sample-with-few-shot-examples/config.yaml‎
Lines changed: 9 additions & 9 deletions
diff --git a/‎config_library/pattern-2/rvl-cdip-package-sample/config.yaml‎
Lines changed: 9 additions & 9 deletions b/‎config_library/pattern-2/rvl-cdip-package-sample/config.yaml‎
Lines changed: 9 additions & 9 deletions
@@ -17,6 +17,17 @@ SPDX-License-Identifier: MIT-0
   - Resolves #146
 
 ### Changed
+
+- **Improved Temperature and Top_P Parameter Logic for Deterministic Output**
+  - Changed inference parameter selection logic to allow `temperature=0.0` for deterministic output (recommended by Anthropic and other model providers)
+  - **New Logic**: Uses `top_p` only when it has a positive value (`> 0`); otherwise uses `temperature`, including `temperature=0.0`
+  - **Previous Logic**: Used `top_p` whenever `temperature=0.0`, preventing proper deterministic configuration
+  - **Key Benefits**: Enables proper deterministic output with `temperature=0.0`, more intuitive parameter behavior, aligns with model provider best practices (Anthropic recommends `temperature=0` for consistent outputs)
+  - **Affected Components**: Bedrock client (`lib/idp_common_pkg/idp_common/bedrock/client.py`), Agentic extraction service (`lib/idp_common_pkg/idp_common/extraction/agentic_idp.py`)
+  - **Configuration Guidance**: Set `top_p: 0` to use the `temperature` parameter; set `top_p` to a positive value to override `temperature`
+  - Set `temperature` to `0.0` in the discovery config for deterministic discovery output (previously `1.0`)
+  - Set `top_p` to `0.0` in all repo config files so that the `temperature` setting is used by default
+
 - Removed page image limit entirely across all IDP services (classification, extraction, assessment) following Amazon Bedrock API removal of image count restrictions. The system now processes all document pages without artificial truncation, with info logging to track image counts for monitoring purposes.
   - Resolves #147
 
 
@@ -6,7 +6,7 @@ assessment:
   default_confidence_threshold: '0.8'
 summarization:
   enabled: true
-  top_p: '0.1'
+  top_p: "0.0"
   max_tokens: '4096'
   top_k: '5'
   task_prompt: >-
@@ -62,14 +62,14 @@ summarization:
 
     Do not include any text, explanations, or notes outside of this JSON
     structure. The JSON must be properly formatted and parseable.
-  temperature: '0.0'
+  temperature: "0.0"
   model: us.amazon.nova-premier-v1:0
   system_prompt: >-
     You are a document summarization expert who can analyze and summarize documents from various domains including medical, financial, legal, and general business documents. Your task is to create a summary that captures the key information, main points, and important details from the document. Your output must be in valid JSON format. \nSummarization Style: Balanced\\nCreate a balanced summary that provides a moderate level of detail. Include the main points and key supporting information, while maintaining the document's overall structure. Aim for a comprehensive yet concise summary.\n Your output MUST be in valid JSON format with markdown content. You MUST strictly adhere to the output format specified in the instructions.
 evaluation:
   enabled: true
   llm_method:
-    top_p: '0.1'
+    top_p: "0.0"
     max_tokens: '4096'
     top_k: '5'
     task_prompt: >-
@@ -101,7 +101,7 @@ evaluation:
         "score": 0.0 to 1.0,
         "reason": "Your explanation here"
       }
-    temperature: '0.0'
+    temperature: "0.0"
     model: us.anthropic.claude-3-haiku-20240307-v1:0
     system_prompt: >-
       You are an evaluator that helps determine if the predicted and expected values match for document attribute extraction. You will consider the context and meaning rather than just exact string matching.
@@ -151,8 +151,8 @@ discovery:
           ]
       }
   with_ground_truth:
-    top_p: '0.1'
-    temperature: '1.0'
+    top_p: "0.0"
+    temperature: "0.0"
     user_prompt: >-
       This image contains unstructured data. Analyze the data line by line using the provided ground truth as reference.                        
       <GROUND_TRUTH_REFERENCE>
@@ -179,8 +179,8 @@ discovery:
       field definitions.
     max_tokens: '10000'
   without_ground_truth:
-    top_p: '0.1'
-    temperature: '1.0'
+    top_p: "0.0"
+    temperature: "0.0"
     user_prompt: >-
       This image contains forms data. Analyze the form line by line.
       Image may contains multiple pages, process all the pages. 
 
@@ -100,7 +100,7 @@ classification:
   image:
     target_height: ""
     target_width: ""
-  top_p: "0.1"
+  top_p: "0.0"
   max_tokens: "4096"
   top_k: "5"
   task_prompt: >-
@@ -243,7 +243,7 @@ extraction:
   image:
     target_height: ""
     target_width: ""
-  top_p: "0.1"
+  top_p: "0.0"
   max_tokens: "10000"
   top_k: "5"
   task_prompt: >-
@@ -338,7 +338,7 @@ extraction:
     You are a document assistant. Respond only with JSON. Never make up data, only provide data found in the document being provided.
 summarization:
   enabled: true
-  top_p: "0.1"
+  top_p: "0.0"
   max_tokens: "4096"
   top_k: "5"
   task_prompt: >-
@@ -411,7 +411,7 @@ assessment:
     simple_batch_size: "3"
     list_batch_size: "1"
   default_confidence_threshold: "0.8"
-  top_p: "0.1"
+  top_p: "0.0"
   max_tokens: "10000"
   top_k: "5"
   temperature: "0.0"
@@ -560,7 +560,7 @@ assessment:
 evaluation:
   enabled: true
   llm_method:
-    top_p: "0.1"
+    top_p: "0.0"
     max_tokens: "4096"
     top_k: "5"
     task_prompt: >-
@@ -642,8 +642,8 @@ discovery:
           ]
       }
   with_ground_truth:
-    top_p: "0.1"
-    temperature: "1.0"
+    top_p: "0.0"
+    temperature: "0.0"
     user_prompt: >-
       This image contains unstructured data. Analyze the data line by line using the provided ground truth as reference.                        
       <GROUND_TRUTH_REFERENCE>
@@ -670,8 +670,8 @@ discovery:
       field definitions.
     max_tokens: "10000"
   without_ground_truth:
-    top_p: "0.1"
-    temperature: "1.0"
+    top_p: "0.0"
+    temperature: "0.0"
     user_prompt: >-
       This image contains forms data. Analyze the form line by line.
       Image may contains multiple pages, process all the pages. 
 
@@ -232,8 +232,8 @@ discovery:
           ]
       }
   with_ground_truth:
-    top_p: '0.1'
-    temperature: '1.0'
+    top_p: "0.0"
+    temperature: "0.0"
     user_prompt: >-
       This image contains unstructured data. Analyze the data line by line using the provided ground truth as reference.                        
       <GROUND_TRUTH_REFERENCE>
@@ -260,8 +260,8 @@ discovery:
       field definitions.
     max_tokens: '10000'
   without_ground_truth:
-    top_p: '0.1'
-    temperature: '1.0'
+    top_p: "0.0"
+    temperature: "0.0"
     user_prompt: >-
       This image contains forms data. Analyze the form line by line.
       Image may contains multiple pages, process all the pages. 
 
@@ -1194,7 +1194,7 @@ classification:
     target_width: ""
   model: us.amazon.nova-pro-v1:0
   temperature: "0.0"
-  top_p: "0.1"
+  top_p: "0.0"
   max_tokens: "4096"
   top_k: "5"
   system_prompt: >-
@@ -1256,7 +1256,7 @@ extraction:
   image:
     target_width: ""
     target_height: ""
-  top_p: "0.1"
+  top_p: "0.0"
   max_tokens: "10000"
   top_k: "5"
   task_prompt: >-
@@ -1351,7 +1351,7 @@ extraction:
     You are a document assistant. Respond only with JSON. Never make up data, only provide data found in the document being provided.
 summarization:
   enabled: true
-  top_p: "0.1"
+  top_p: "0.0"
   max_tokens: "4096"
   top_k: "5"
   task_prompt: >-
@@ -1435,7 +1435,7 @@ assessment:
     simple_batch_size: "3"
     list_batch_size: "1"
   default_confidence_threshold: "0.8"
-  top_p: "0.1"
+  top_p: "0.0"
   max_tokens: "10000"
   top_k: "5"
   temperature: "0.0"
@@ -1583,7 +1583,7 @@ assessment:
 evaluation:
   enabled: true
   llm_method:
-    top_p: "0.1"
+    top_p: "0.0"
     max_tokens: "4096"
     top_k: "5"
     task_prompt: >-
@@ -1665,8 +1665,8 @@ discovery:
           ]
       }
   with_ground_truth:
-    top_p: "0.1"
-    temperature: "1.0"
+    top_p: "0.0"
+    temperature: "0.0"
     user_prompt: >-
       This image contains unstructured data. Analyze the data line by line using the provided ground truth as reference.                        
       <GROUND_TRUTH_REFERENCE>
@@ -1693,8 +1693,8 @@ discovery:
       field definitions.
     max_tokens: "10000"
   without_ground_truth:
-    top_p: "0.1"
-    temperature: "1.0"
+    top_p: "0.0"
+    temperature: "0.0"
     user_prompt: >-
       This image contains forms data. Analyze the form line by line.
       Image may contains multiple pages, process all the pages. 
 
@@ -816,7 +816,7 @@ classification:
   sectionSplitting: llm_determined
   model: us.amazon.nova-pro-v1:0
   temperature: "0.0"
-  top_p: "0.1"
+  top_p: "0.0"
   top_k: "5"
   max_tokens: "4096"
   system_prompt: >-
@@ -869,7 +869,7 @@ extraction:
     target_width: ""
   model: us.amazon.nova-pro-v1:0
   temperature: "0.0"
-  top_p: "0.1"
+  top_p: "0.0"
   top_k: "5"
   max_tokens: "4096"
   system_prompt: >
@@ -973,7 +973,7 @@ assessment:
     simple_batch_size: "3"
     list_batch_size: "1"
   default_confidence_threshold: "0.8"
-  top_p: "0.1"
+  top_p: "0.0"
   max_tokens: "10000"
   top_k: "5"
   temperature: "0.0"
@@ -1121,7 +1121,7 @@ assessment:
 evaluation:
   enabled: true
   llm_method:
-    top_p: "0.1"
+    top_p: "0.0"
     max_tokens: "4096"
     top_k: "5"
     task_prompt: >
@@ -1165,7 +1165,7 @@ evaluation:
       context and meaning rather than just exact string matching.
 summarization:
   enabled: true
-  top_p: "0.1"
+  top_p: "0.0"
   max_tokens: "4096"
   top_k: "5"
   task_prompt: >
@@ -1287,8 +1287,8 @@ discovery:
           ]
       }
   with_ground_truth:
-    top_p: "0.1"
-    temperature: "1.0"
+    top_p: "0.0"
+    temperature: "0.0"
     user_prompt: >-
       This image contains unstructured data. Analyze the data line by line using the provided ground truth as reference.                        
       <GROUND_TRUTH_REFERENCE>
@@ -1315,8 +1315,8 @@ discovery:
       field definitions.
     max_tokens: "10000"
   without_ground_truth:
-    top_p: "0.1"
-    temperature: "1.0"
+    top_p: "0.0"
+    temperature: "0.0"
     user_prompt: >-
       This image contains forms data. Analyze the form line by line.
       Image may contains multiple pages, process all the pages. 
 
@@ -767,7 +767,7 @@ classification:
   image:
     target_height: ""
     target_width: ""
-  top_p: "0.1"
+  top_p: "0.0"
   max_tokens: "4096"
   top_k: "5"
   task_prompt: >-
@@ -910,7 +910,7 @@ extraction:
   image:
     target_width: ""
     target_height: ""
-  top_p: "0.1"
+  top_p: "0.0"
   max_tokens: "10000"
   top_k: "5"
   task_prompt: >-
@@ -1005,7 +1005,7 @@ extraction:
     You are a document assistant. Respond only with JSON. Never make up data, only provide data found in the document being provided.
 summarization:
   enabled: true
-  top_p: "0.1"
+  top_p: "0.0"
   max_tokens: "4096"
   top_k: "5"
   task_prompt: >-
@@ -1077,7 +1077,7 @@ assessment:
     simple_batch_size: "3"
     list_batch_size: "1"
   default_confidence_threshold: "0.8"
-  top_p: "0.1"
+  top_p: "0.0"
   max_tokens: "10000"
   top_k: "5"
   temperature: "0.0"
@@ -1225,7 +1225,7 @@ assessment:
 evaluation:
   enabled: true
   llm_method:
-    top_p: "0.1"
+    top_p: "0.0"
     max_tokens: "4096"
     top_k: "5"
     task_prompt: >-
@@ -1307,8 +1307,8 @@ discovery:
           ]
       }
   with_ground_truth:
-    top_p: "0.1"
-    temperature: "1.0"
+    top_p: "0.0"
+    temperature: "0.0"
     user_prompt: >-
       This image contains unstructured data. Analyze the data line by line using the provided ground truth as reference.                        
       <GROUND_TRUTH_REFERENCE>
@@ -1335,8 +1335,8 @@ discovery:
       field definitions.
     max_tokens: "10000"
   without_ground_truth:
-    top_p: "0.1"
-    temperature: "1.0"
+    top_p: "0.0"
+    temperature: "0.0"
     user_prompt: >-
       This image contains forms data. Analyze the form line by line.
       Image may contains multiple pages, process all the pages.