Cost Estimator UI Feature for Context Grouping and Subtotals

Bob Strahan · Bob Strahan · commit 26e1835ee08c · 2025-06-05T20:32:27.000Z
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -7,6 +7,10 @@ SPDX-License-Identifier: MIT-0
 
 ### Added
 
+- **Cost Estimator UI Feature for Context Grouping and Subtotals**
+  - Added context grouping functionality to organize cost estimates by logical categories (e.g., OCR, Classification, Extraction, Summarization)
+  - Implemented subtotal calculations for better cost breakdown visualization
+
 - **DynamoDB Caching for Resilient Classification**
   - Added optional DynamoDB caching to the multimodal page-level classification service to improve efficiency and resilience
   - Cache successful page classification results to avoid redundant processing during retries when some pages fail due to throttling
diff --git a/lib/idp_common_pkg/idp_common/bedrock/client.py b/lib/idp_common_pkg/idp_common/bedrock/client.py
@@ -78,7 +78,8 @@ def __call__(
         top_k: Optional[Union[float, str]] = None,
         top_p: Optional[Union[float, str]] = None,
         max_tokens: Optional[Union[int, str]] = None,
-        max_retries: Optional[int] = None
+        max_retries: Optional[int] = None,
+        context: str = "Unspecified"
     ) -> Dict[str, Any]:
         """
         Make the instance callable with the same signature as the original function.
@@ -109,7 +110,8 @@ def __call__(
             top_k=top_k,
             top_p=top_p,
             max_tokens=max_tokens,
-            max_retries=effective_max_retries
+            max_retries=effective_max_retries,
+            context=context
         )
     
     def _preprocess_content_for_cachepoint(self, content: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
@@ -177,7 +179,8 @@ def invoke_model(
         top_k: Optional[Union[float, str]] = 5,
         top_p: Optional[Union[float, str]] = 0.1,
         max_tokens: Optional[Union[int, str]] = None,
-        max_retries: Optional[int] = None
+        max_retries: Optional[int] = None,
+        context: str = "Unspecified"
     ) -> Dict[str, Any]:
         """
         Invoke a Bedrock model with retry logic.
@@ -335,7 +338,8 @@ def invoke_model(
             converse_params=converse_params,
             retry_count=0,
             max_retries=effective_max_retries,
-            request_start_time=request_start_time
+            request_start_time=request_start_time,
+            context=context
         )
         
         return result
@@ -346,7 +350,8 @@ def _invoke_with_retry(
         retry_count: int,
         max_retries: int,
         request_start_time: float,
-        last_exception: Exception = None
+        last_exception: Exception = None,
+        context: str = "Unspecified"
     ) -> Dict[str, Any]:
         """
         Recursive helper method to handle retries for Bedrock invocation.
@@ -424,7 +429,7 @@ def _invoke_with_retry(
             response_with_metering = {
                 "response": response,
                 "metering": {
-                    f"bedrock/{converse_params['modelId']}": {
+                    f"{context}/bedrock/{converse_params['modelId']}": {
                         **usage
                     }
                 }
@@ -470,7 +475,8 @@ def _invoke_with_retry(
                     retry_count=retry_count + 1,
                     max_retries=max_retries,
                     request_start_time=request_start_time,
-                    last_exception=e
+                    last_exception=e,
+                    context=context
                 )
             else:
                 logger.error(f"Non-retryable Bedrock error: {error_code} - {error_message}")
@@ -838,6 +844,7 @@ def _sanitize_response_for_logging(self, response: Dict[str, Any]) -> Dict[str,
     top_p: Optional top_p parameter (float or string)
     max_tokens: Optional max_tokens parameter (int or string)
     max_retries: Optional override for the instance's max_retries setting
+    context: Context prefix for the metering key, which takes the form "{context}/bedrock/{modelId}" (default: "Unspecified")
     
 Returns:
     Bedrock response object with metering information
diff --git a/lib/idp_common_pkg/idp_common/classification/service.py b/lib/idp_common_pkg/idp_common/classification/service.py
@@ -770,7 +770,7 @@ def classify_page_sagemaker(
 
                 # Add some metering data for consistency with Bedrock
                 metering = {
-                    "sagemaker/invoke_endpoint": {
+                    "Classification/sagemaker/invoke_endpoint": {
                         "invocations": 1,
                     }
                 }
@@ -910,6 +910,7 @@ def _invoke_bedrock_model(
             top_k=config["top_k"],
             top_p=config["top_p"],
             max_tokens=config["max_tokens"],
+            context="Classification",
         )
 
     def _create_unclassified_result(
diff --git a/lib/idp_common_pkg/idp_common/extraction/service.py b/lib/idp_common_pkg/idp_common/extraction/service.py
@@ -708,6 +708,7 @@ def process_document_section(self, document: Document, section_id: str) -> Docum
                 top_k=top_k,
                 top_p=top_p,
                 max_tokens=max_tokens,
+                context="Extraction",
             )
 
             total_duration = time.time() - request_start_time
diff --git a/lib/idp_common_pkg/idp_common/ocr/service.py b/lib/idp_common_pkg/idp_common/ocr/service.py
@@ -284,7 +284,7 @@ def _process_single_page(
         # Extract metering data
         feature_combo = self._feature_combo()
         metering = {
-            f"textract/{self._get_api_name()}{feature_combo}": {
+            f"OCR/textract/{self._get_api_name()}{feature_combo}": {
                 "pages": textract_result["DocumentMetadata"]["Pages"]
             }
         }
diff --git a/lib/idp_common_pkg/idp_common/summarization/service.py b/lib/idp_common_pkg/idp_common/summarization/service.py
@@ -221,6 +221,7 @@ def _invoke_bedrock_model(
             top_k=config["top_k"],
             top_p=config["top_p"],
             max_tokens=config["max_tokens"],
+            context="Summarization",
         )
 
     def _create_error_summary(self, error_message: str) -> DocumentSummary:
diff --git a/patterns/pattern-1/src/processresults_function/index.py b/patterns/pattern-1/src/processresults_function/index.py
@@ -549,10 +549,10 @@ def handler(event, context):
     
     # Add metering information
     document.metering = {
-        "bda/documents-custom": {
+        "BDAProject/bda/documents-custom": {
             "pages": custom_pages_count
         },
-        "bda/documents-standard": {
+        "BDAProject/bda/documents-standard": {
             "pages": standard_pages_count
         }
     }
diff --git a/src/ui/src/components/document-panel/DocumentPanel.jsx b/src/ui/src/components/document-panel/DocumentPanel.jsx
@@ -142,8 +142,24 @@ const MeteringTable = ({ meteringData, preCalculatedTotals }) => {
     contextGroups[item.context].push(item);
   });
 
-  // Sort contexts alphabetically and add items with subtotals
-  const sortedContexts = Object.keys(contextGroups).sort();
+  // Sort contexts in a fixed order (OCR, Classification, Extraction, Summarization); any other contexts follow, sorted alphabetically
+  const contextOrder = ['OCR', 'Classification', 'Extraction', 'Summarization'];
+  const sortedContexts = Object.keys(contextGroups).sort((a, b) => {
+    const aIndex = contextOrder.indexOf(a);
+    const bIndex = contextOrder.indexOf(b);
+
+    // If both contexts are in the predefined order, sort by their position
+    if (aIndex !== -1 && bIndex !== -1) {
+      return aIndex - bIndex;
+    }
+
+    // If only one context is in the predefined order, it comes first
+    if (aIndex !== -1) return -1;
+    if (bIndex !== -1) return 1;
+
+    // If neither context is in the predefined order, sort alphabetically
+    return a.localeCompare(b);
+  });
 
   sortedContexts.forEach((context) => {
     // Add all items for this context

Original file line number	Diff line number	Diff line change
`@@ -770,7 +770,7 @@ def classify_page_sagemaker(`
`770`	`770`
`771`	`771`	`# Add some metering data for consistency with Bedrock`
`772`	`772`	`metering = {`
`773`		`- "sagemaker/invoke_endpoint": {`
	`773`	`+ "Classification/sagemaker/invoke_endpoint": {`
`774`	`774`	`"invocations": 1,`
`775`	`775`	`}`
`776`	`776`	`}`
`@@ -910,6 +910,7 @@ def _invoke_bedrock_model(`
`910`	`910`	`top_k=config["top_k"],`
`911`	`911`	`top_p=config["top_p"],`
`912`	`912`	`max_tokens=config["max_tokens"],`
	`913`	`+ context="Classification",`
`913`	`914`	`)`
`914`	`915`
`915`	`916`	`def _create_unclassified_result(`
Original file line number	Diff line number	Diff line change
`@@ -708,6 +708,7 @@ def process_document_section(self, document: Document, section_id: str) -> Docum`
`708`	`708`	`top_k=top_k,`
`709`	`709`	`top_p=top_p,`
`710`	`710`	`max_tokens=max_tokens,`
	`711`	`+ context="Extraction",`
`711`	`712`	`)`
`712`	`713`
`713`	`714`	`total_duration = time.time() - request_start_time`
Original file line number	Diff line number	Diff line change
`@@ -284,7 +284,7 @@ def _process_single_page(`
`284`	`284`	`# Extract metering data`
`285`	`285`	`feature_combo = self._feature_combo()`
`286`	`286`	`metering = {`
`287`		`- f"textract/{self._get_api_name()}{feature_combo}": {`
	`287`	`+ f"OCR/textract/{self._get_api_name()}{feature_combo}": {`
`288`	`288`	`"pages": textract_result["DocumentMetadata"]["Pages"]`
`289`	`289`	`}`
`290`	`290`	`}`
Original file line number	Diff line number	Diff line change
`@@ -221,6 +221,7 @@ def _invoke_bedrock_model(`
`221`	`221`	`top_k=config["top_k"],`
`222`	`222`	`top_p=config["top_p"],`
`223`	`223`	`max_tokens=config["max_tokens"],`
	`224`	`+ context="Summarization",`
`224`	`225`	`)`
`225`	`226`
`226`	`227`	`def _create_error_summary(self, error_message: str) -> DocumentSummary:`
Original file line number	Diff line number	Diff line change
`@@ -549,10 +549,10 @@ def handler(event, context):`
`549`	`549`
`550`	`550`	`# Add metering information`
`551`	`551`	`document.metering = {`
`552`		`- "bda/documents-custom": {`
	`552`	`+ "BDAProject/bda/documents-custom": {`
`553`	`553`	`"pages": custom_pages_count`
`554`	`554`	`},`
`555`		`- "bda/documents-standard": {`
	`555`	`+ "BDAProject/bda/documents-standard": {`
`556`	`556`	`"pages": standard_pages_count`
`557`	`557`	`}`
`558`	`558`	`}`