Merge branch 'feature/categorize-cost-estimate-by-step' into 'develop'

rstrahan · rstrahan · commit 75f363e90762 · 2025-06-05T21:14:39.000Z
Feature/categorize cost estimate by step

See merge request genaiic-reusable-assets/engagement-artifacts/genaiic-idp-accelerator!154
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -7,6 +7,10 @@ SPDX-License-Identifier: MIT-0
 
 ### Added
 
+- **Cost Estimator UI Feature for Context Grouping and Subtotals**
+  - Added context grouping functionality to organize cost estimates by logical categories (e.g., OCR, Classification, Extraction)
+  - Implemented subtotal calculations for better cost breakdown visualization
+
 - **DynamoDB Caching for Resilient Classification**
   - Added optional DynamoDB caching to the multimodal page-level classification service to improve efficiency and resilience
   - Cache successful page classification results to avoid redundant processing during retries when some pages fail due to throttling
diff --git a/lib/idp_common_pkg/idp_common/bedrock/client.py b/lib/idp_common_pkg/idp_common/bedrock/client.py
@@ -78,7 +78,8 @@ def __call__(
         top_k: Optional[Union[float, str]] = None,
         top_p: Optional[Union[float, str]] = None,
         max_tokens: Optional[Union[int, str]] = None,
-        max_retries: Optional[int] = None
+        max_retries: Optional[int] = None,
+        context: str = "Unspecified"
     ) -> Dict[str, Any]:
         """
         Make the instance callable with the same signature as the original function.
@@ -109,7 +110,8 @@ def __call__(
             top_k=top_k,
             top_p=top_p,
             max_tokens=max_tokens,
-            max_retries=effective_max_retries
+            max_retries=effective_max_retries,
+            context=context
         )
     
     def _preprocess_content_for_cachepoint(self, content: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
@@ -177,7 +179,8 @@ def invoke_model(
         top_k: Optional[Union[float, str]] = 5,
         top_p: Optional[Union[float, str]] = 0.1,
         max_tokens: Optional[Union[int, str]] = None,
-        max_retries: Optional[int] = None
+        max_retries: Optional[int] = None,
+        context: str = "Unspecified"
     ) -> Dict[str, Any]:
         """
         Invoke a Bedrock model with retry logic.
@@ -335,7 +338,8 @@ def invoke_model(
             converse_params=converse_params,
             retry_count=0,
             max_retries=effective_max_retries,
-            request_start_time=request_start_time
+            request_start_time=request_start_time,
+            context=context
         )
         
         return result
@@ -346,7 +350,8 @@ def _invoke_with_retry(
         retry_count: int,
         max_retries: int,
         request_start_time: float,
-        last_exception: Exception = None
+        last_exception: Exception = None,
+        context: str = "Unspecified"
     ) -> Dict[str, Any]:
         """
         Recursive helper method to handle retries for Bedrock invocation.
@@ -424,7 +429,7 @@ def _invoke_with_retry(
             response_with_metering = {
                 "response": response,
                 "metering": {
-                    f"bedrock/{converse_params['modelId']}": {
+                    f"{context}/bedrock/{converse_params['modelId']}": {
                         **usage
                     }
                 }
@@ -470,7 +475,8 @@ def _invoke_with_retry(
                     retry_count=retry_count + 1,
                     max_retries=max_retries,
                     request_start_time=request_start_time,
-                    last_exception=e
+                    last_exception=e,
+                    context=context
                 )
             else:
                 logger.error(f"Non-retryable Bedrock error: {error_code} - {error_message}")
@@ -838,6 +844,7 @@ def _sanitize_response_for_logging(self, response: Dict[str, Any]) -> Dict[str,
     top_p: Optional top_p parameter (float or string)
     max_tokens: Optional max_tokens parameter (int or string)
     max_retries: Optional override for the instance's max_retries setting
+    context: Context prefix for metering key (default: "Unspecified")
     
 Returns:
     Bedrock response object with metering information
diff --git a/lib/idp_common_pkg/idp_common/classification/service.py b/lib/idp_common_pkg/idp_common/classification/service.py
@@ -770,7 +770,7 @@ def classify_page_sagemaker(
 
                 # Add some metering data for consistency with Bedrock
                 metering = {
-                    "sagemaker/invoke_endpoint": {
+                    "Classification/sagemaker/invoke_endpoint": {
                         "invocations": 1,
                     }
                 }
@@ -910,6 +910,7 @@ def _invoke_bedrock_model(
             top_k=config["top_k"],
             top_p=config["top_p"],
             max_tokens=config["max_tokens"],
+            context="Classification",
         )
 
     def _create_unclassified_result(
diff --git a/lib/idp_common_pkg/idp_common/extraction/service.py b/lib/idp_common_pkg/idp_common/extraction/service.py
@@ -708,6 +708,7 @@ def process_document_section(self, document: Document, section_id: str) -> Docum
                 top_k=top_k,
                 top_p=top_p,
                 max_tokens=max_tokens,
+                context="Extraction",
             )
 
             total_duration = time.time() - request_start_time
diff --git a/lib/idp_common_pkg/idp_common/ocr/service.py b/lib/idp_common_pkg/idp_common/ocr/service.py
@@ -284,7 +284,7 @@ def _process_single_page(
         # Extract metering data
         feature_combo = self._feature_combo()
         metering = {
-            f"textract/{self._get_api_name()}{feature_combo}": {
+            f"OCR/textract/{self._get_api_name()}{feature_combo}": {
                 "pages": textract_result["DocumentMetadata"]["Pages"]
             }
         }
diff --git a/lib/idp_common_pkg/idp_common/summarization/service.py b/lib/idp_common_pkg/idp_common/summarization/service.py
@@ -221,6 +221,7 @@ def _invoke_bedrock_model(
             top_k=config["top_k"],
             top_p=config["top_p"],
             max_tokens=config["max_tokens"],
+            context="Summarization",
         )
 
     def _create_error_summary(self, error_message: str) -> DocumentSummary:
diff --git a/patterns/pattern-1/src/processresults_function/index.py b/patterns/pattern-1/src/processresults_function/index.py
@@ -549,10 +549,10 @@ def handler(event, context):
     
     # Add metering information
     document.metering = {
-        "bda/documents-custom": {
+        "BDAProject/bda/documents-custom": {
             "pages": custom_pages_count
         },
-        "bda/documents-standard": {
+        "BDAProject/bda/documents-standard": {
             "pages": standard_pages_count
         }
     }
diff --git a/src/ui/src/components/document-panel/DocumentPanel.jsx b/src/ui/src/components/document-panel/DocumentPanel.jsx
@@ -22,12 +22,27 @@ import useConfiguration from '../../hooks/use-configuration';
 
 const logger = new Logger('DocumentPanel');
 
-// Format the cost cell content based on whether it's a total row
-const formatCostCell = (item) => {
-  if (item.isTotal) {
-    return <Box fontWeight="bold">{`${item.note}: ${item.cost}`}</Box>;
+// Helper function to parse serviceApi key into context and service
+const parseServiceApiKey = (serviceApiKey) => {
+  const parts = serviceApiKey.split('/');
+  if (parts.length >= 3) {
+    const context = parts[0];
+    const serviceApi = parts.slice(1).join('/');
+    return { context, serviceApi };
   }
-  return item.cost;
+  // Fallback for keys that don't follow the new format (fewer than 3 parts): use an empty context
+  return { context: '', serviceApi: serviceApiKey };
+};
+
+// Helper function to format cost cells
+const formatCostCell = (rowItem) => {
+  if (rowItem.isTotal) {
+    return <Box fontWeight="bold">{`${rowItem.note}: ${rowItem.cost}`}</Box>;
+  }
+  if (rowItem.isSubtotal) {
+    return <Box fontWeight="bold" color="text-body-secondary">{`${rowItem.note}: ${rowItem.cost}`}</Box>;
+  }
+  return rowItem.cost;
 };
 
 // Component to display metering information in a table
@@ -65,15 +80,18 @@ const MeteringTable = ({ meteringData, preCalculatedTotals }) => {
     return <Box>Loading pricing data...</Box>;
   }
 
-  // Transform metering data into table rows
-  const tableItems = [];
+  // Transform metering data into table rows with context parsing
+  const rawTableItems = [];
+  const contextTotals = {};
   let totalCost = 0;
 
-  Object.entries(meteringData).forEach(([serviceApi, metrics]) => {
+  Object.entries(meteringData).forEach(([originalServiceApiKey, metrics]) => {
+    const { context, serviceApi } = parseServiceApiKey(originalServiceApiKey);
+
     Object.entries(metrics).forEach(([unit, value]) => {
       const numericValue = Number(value);
 
-      // Look up the unit price from the pricing data
+      // Look up the unit price from the pricing data using the parsed serviceApi
       let unitPrice = null;
       let unitPriceDisplayValue = 'None';
       let cost = 0;
@@ -83,6 +101,13 @@ const MeteringTable = ({ meteringData, preCalculatedTotals }) => {
           unitPriceDisplayValue = `$${unitPrice}`;
           cost = numericValue * unitPrice;
           totalCost += cost;
+
+          // Track context totals
+          if (!contextTotals[context]) {
+            contextTotals[context] = 0;
+          }
+          contextTotals[context] += cost;
+
           logger.debug(`Found price for ${serviceApi}/${unit}: ${unitPriceDisplayValue}`);
         } else {
           logger.warn(`Invalid price for ${serviceApi}/${unit}, using None`);
@@ -91,34 +116,96 @@ const MeteringTable = ({ meteringData, preCalculatedTotals }) => {
         logger.debug(`No price found for ${serviceApi}/${unit}, using None`);
       }
 
-      tableItems.push({
+      rawTableItems.push({
+        context,
         serviceApi,
         unit,
         value: String(numericValue),
         unitCost: unitPriceDisplayValue,
         cost: unitPrice !== null ? `$${cost.toFixed(4)}` : 'N/A',
+        costValue: cost,
         isTotal: false,
+        isSubtotal: false,
       });
     });
   });
 
+  // Group items by context and add subtotals
+  const tableItems = [];
+  const contextGroups = {};
+
+  // Group raw items by context
+  rawTableItems.forEach((item) => {
+    if (!contextGroups[item.context]) {
+      contextGroups[item.context] = [];
+    }
+    contextGroups[item.context].push(item);
+  });
+
+  // Sort contexts in a specific order: BDAProject, OCR, Classification, Extraction, Summarization
+  const contextOrder = ['BDAProject', 'OCR', 'Classification', 'Extraction', 'Summarization'];
+  const sortedContexts = Object.keys(contextGroups).sort((a, b) => {
+    const aIndex = contextOrder.indexOf(a);
+    const bIndex = contextOrder.indexOf(b);
+
+    // If both contexts are in the predefined order, sort by their position
+    if (aIndex !== -1 && bIndex !== -1) {
+      return aIndex - bIndex;
+    }
+
+    // If only one context is in the predefined order, it comes first
+    if (aIndex !== -1) return -1;
+    if (bIndex !== -1) return 1;
+
+    // If neither context is in the predefined order, sort alphabetically
+    return a.localeCompare(b);
+  });
+
+  sortedContexts.forEach((context) => {
+    // Add all items for this context
+    tableItems.push(...contextGroups[context]);
+
+    // Add subtotal row for this context
+    const contextTotal = contextTotals[context] || 0;
+    tableItems.push({
+      context: '',
+      serviceApi: '',
+      unit: '',
+      value: '',
+      unitCost: '',
+      cost: `$${contextTotal.toFixed(4)}`,
+      costValue: contextTotal,
+      isTotal: false,
+      isSubtotal: true,
+      note: `${context} Subtotal`,
+    });
+  });
+
   // Use preCalculatedTotals if provided, otherwise calculate locally
   const finalTotalCost = preCalculatedTotals ? preCalculatedTotals.totalCost : totalCost;
 
-  // Add total row
+  // Add overall total row
   tableItems.push({
+    context: '',
     serviceApi: '',
     unit: '',
     value: '',
     unitCost: '',
     cost: `$${finalTotalCost.toFixed(4)}`,
+    costValue: finalTotalCost,
     isTotal: true,
+    isSubtotal: false,
     note: 'Total',
   });
 
   return (
     <Table
       columnDefinitions={[
+        {
+          id: 'context',
+          header: 'Context',
+          cell: (rowItem) => rowItem.context,
+        },
         {
           id: 'serviceApi',
           header: 'Service/Api',
@@ -169,7 +256,10 @@ const calculateTotalCosts = (meteringData, documentItem, pricingData) => {
   let totalCost = 0;
 
   if (pricingData) {
-    Object.entries(meteringData).forEach(([serviceApi, metrics]) => {
+    Object.entries(meteringData).forEach(([originalServiceApiKey, metrics]) => {
+      // Parse the serviceApi key to remove context prefix
+      const { serviceApi } = parseServiceApiKey(originalServiceApiKey);
+
       Object.entries(metrics).forEach(([unit, value]) => {
         const numericValue = Number(value);
         if (pricingData[serviceApi] && pricingData[serviceApi][unit] !== undefined) {

Original file line number	Diff line number	Diff line change
`@@ -770,7 +770,7 @@ def classify_page_sagemaker(`
`770`	`770`
`771`	`771`	`# Add some metering data for consistency with Bedrock`
`772`	`772`	`metering = {`
`773`		`- "sagemaker/invoke_endpoint": {`
	`773`	`+ "Classification/sagemaker/invoke_endpoint": {`
`774`	`774`	`"invocations": 1,`
`775`	`775`	`}`
`776`	`776`	`}`
`@@ -910,6 +910,7 @@ def _invoke_bedrock_model(`
`910`	`910`	`top_k=config["top_k"],`
`911`	`911`	`top_p=config["top_p"],`
`912`	`912`	`max_tokens=config["max_tokens"],`
	`913`	`+ context="Classification",`
`913`	`914`	`)`
`914`	`915`
`915`	`916`	`def _create_unclassified_result(`
Original file line number	Diff line number	Diff line change
`@@ -708,6 +708,7 @@ def process_document_section(self, document: Document, section_id: str) -> Docum`
`708`	`708`	`top_k=top_k,`
`709`	`709`	`top_p=top_p,`
`710`	`710`	`max_tokens=max_tokens,`
	`711`	`+ context="Extraction",`
`711`	`712`	`)`
`712`	`713`
`713`	`714`	`total_duration = time.time() - request_start_time`
Original file line number	Diff line number	Diff line change
`@@ -284,7 +284,7 @@ def _process_single_page(`
`284`	`284`	`# Extract metering data`
`285`	`285`	`feature_combo = self._feature_combo()`
`286`	`286`	`metering = {`
`287`		`- f"textract/{self._get_api_name()}{feature_combo}": {`
	`287`	`+ f"OCR/textract/{self._get_api_name()}{feature_combo}": {`
`288`	`288`	`"pages": textract_result["DocumentMetadata"]["Pages"]`
`289`	`289`	`}`
`290`	`290`	`}`
Original file line number	Diff line number	Diff line change
`@@ -221,6 +221,7 @@ def _invoke_bedrock_model(`
`221`	`221`	`top_k=config["top_k"],`
`222`	`222`	`top_p=config["top_p"],`
`223`	`223`	`max_tokens=config["max_tokens"],`
	`224`	`+ context="Summarization",`
`224`	`225`	`)`
`225`	`226`
`226`	`227`	`def _create_error_summary(self, error_message: str) -> DocumentSummary:`
Original file line number	Diff line number	Diff line change
`@@ -549,10 +549,10 @@ def handler(event, context):`
`549`	`549`
`550`	`550`	`# Add metering information`
`551`	`551`	`document.metering = {`
`552`		`- "bda/documents-custom": {`
	`552`	`+ "BDAProject/bda/documents-custom": {`
`553`	`553`	`"pages": custom_pages_count`
`554`	`554`	`},`
`555`		`- "bda/documents-standard": {`
	`555`	`+ "BDAProject/bda/documents-standard": {`
`556`	`556`	`"pages": standard_pages_count`
`557`	`557`	`}`
`558`	`558`	`}`