aws-solutions-library-samples
diff --git a/‎CHANGELOG.md‎
Lines changed: 7 additions & 0 deletions b/‎CHANGELOG.md‎
Lines changed: 7 additions & 0 deletions
diff --git a/‎patterns/pattern-1/src/hitl-process-function/index.py‎
Lines changed: 237 additions & 196 deletions b/‎patterns/pattern-1/src/hitl-process-function/index.py‎
Lines changed: 237 additions & 196 deletions
diff --git a/‎patterns/pattern-1/src/processresults_function/index.py‎
Lines changed: 33 additions & 26 deletions b/‎patterns/pattern-1/src/processresults_function/index.py‎
Lines changed: 33 additions & 26 deletions
diff --git a/‎patterns/pattern-1/statemachine/workflow.asl.json‎
Lines changed: 11 additions & 0 deletions b/‎patterns/pattern-1/statemachine/workflow.asl.json‎
Lines changed: 11 additions & 0 deletions
diff --git a/‎patterns/pattern-1/template.yaml‎
Lines changed: 2 additions & 0 deletions b/‎patterns/pattern-1/template.yaml‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎patterns/pattern-2/template.yaml‎
Lines changed: 14 additions & 0 deletions b/‎patterns/pattern-2/template.yaml‎
Lines changed: 14 additions & 0 deletions
diff --git a/‎patterns/pattern-3/template.yaml‎
Lines changed: 14 additions & 0 deletions b/‎patterns/pattern-3/template.yaml‎
Lines changed: 14 additions & 0 deletions
diff --git a/‎samples/lending_package.pdf‎
-98.9 KB b/‎samples/lending_package.pdf‎
-98.9 KB
@@ -8,6 +8,13 @@ SPDX-License-Identifier: MIT-0
 
 ### Added
 
+- **Enhanced A2I Template and Workflow Management**
+  - Enhanced A2I template with improved user interface and clearer instructions for reviewers
+  - Added comprehensive instructions for reviewers in A2I template to guide the review process
+  - Implemented capture of failed review tasks with proper error handling and logging
+  - Added workflow orchestration control to stop processing when a reviewer rejects an A2I task
+  - Removed automatic A2I task creation when Pattern-1 Bedrock Data Automation (BDA) fails to classify a document to an appropriate Blueprint
+
 - **Dynamic Cost Calculation for Metering Data**
   - Added automated unit cost and estimated cost calculation to metering table with new `unit_cost` and `estimated_cost` columns
   - Dynamic pricing configuration loading from configuration
 
@@ -673,7 +673,7 @@ def start_human_loop(
         FlowDefinitionArn = ssm.get_parameter(Name=f"/{os.environ.get('METRIC_NAMESPACE', 'IDP')}/FlowDefinitionArn")['Parameter']['Value']
         human_review_id = generate_random_string(2)
         response = a2i_runtime_client.start_human_loop(
-            HumanLoopName=f"review-bda-{execution_id}-{human_review_id}",
+            HumanLoopName=f"review-bda-{human_review_id}-{execution_id}-{record_number}-{page_id_num}",
             FlowDefinitionArn=FlowDefinitionArn,
             HumanLoopInput={"InputContent": json.dumps(human_loop_input)}
         )
@@ -825,6 +825,7 @@ def process_segments(
 
     now = datetime.datetime.now().isoformat()
     hitl_triggered = False
+    overall_hitl_triggered = False
 
     for record_number, segment in enumerate(segment_metadata, start=1):
         logger.info(f"Processing segment for execution id: {execution_id}")
@@ -901,6 +902,7 @@ def process_segments(
             if low_confidence:
                 hitl_triggered = low_confidence
                 metrics.put_metric('HITLTriggered', 1)
+                overall_hitl_triggered = True
                 for page_number in page_indices:
                     page_str = str(page_number)
                     key_values = pagespecific_details['key_value_details'].get(page_str, [])
@@ -929,6 +931,7 @@ def process_segments(
         else:
             if enable_hitl == 'true':
                 std_hitl = 'true'
+                # std_hitl = None # HITL for standard output blueprint match is disabled until we have option to choose Blueprint in A2I
             else:
                 std_hitl = None 
             # Process standard output if no custom output match
@@ -940,7 +943,8 @@ def process_segments(
             page_array = list(range(start_page, end_page + 1))
             item.update({
                 "page_array": page_array,
-                "hitl_triggered": std_hitl,
+                # "hitl_triggered": std_hitl,
+                "hitl_triggered": None,
                 "extraction_bp_name": "None",
                 "extracted_result": std_output
             })
@@ -950,31 +954,34 @@ def process_segments(
                 record_number=record_number,
                 bp_match=segment.get('custom_output_status'),
                 extraction_bp_name="None",
-                hitl_triggered=std_hitl,
+                # hitl_triggered=std_hitl,
+                hitl_triggered=None,
                 page_array=page_array,
                 review_portal_url=SAGEMAKER_A2I_REVIEW_PORTAL_URL
             )
 
-            hitl_triggered = std_hitl
-            if enable_hitl == 'true':
-                for page_number in range(start_page, end_page + 1):
-                    ImageUri = f"s3://{output_bucket}/{object_key}/pages/{page_number}/image.jpg"
-                    try:
-                        human_loop_response = start_human_loop(
-                            execution_id=execution_id,
-                            kv_pairs=[],
-                            source_image_uri=ImageUri,
-                            bounding_boxes=[],
-                            blueprintName="",
-                            bp_confidence=0.00,
-                            confidenceThreshold=confidence_threshold,
-                            page_id=page_number,
-                            page_indices=page_array,
-                            record_number=record_number
-                        )
-                        logger.info(f"Triggered human loop for page {page_number}: {human_loop_response}")
-                    except Exception as e:
-                        logger.error(f"Failed to start human loop for page {page_number}: {str(e)}")
+            # hitl_triggered = std_hitl
+            hitl_triggered = None
+            # if enable_hitl == 'true':
+            # # if std_hitl: # HITL for standard output blueprint match is disabled until we have option to choose Blueprint in A2I
+            #     for page_number in range(start_page, end_page + 1):
+            #         ImageUri = f"s3://{output_bucket}/{object_key}/pages/{page_number}/image.jpg"
+            #         try:
+            #             human_loop_response = start_human_loop(
+            #                 execution_id=execution_id,
+            #                 kv_pairs=[],
+            #                 source_image_uri=ImageUri,
+            #                 bounding_boxes=[],
+            #                 blueprintName="",
+            #                 bp_confidence=0.00,
+            #                 confidenceThreshold=confidence_threshold,
+            #                 page_id=page_number,
+            #                 page_indices=page_array,
+            #                 record_number=record_number
+            #             )
+            #             logger.info(f"Triggered human loop for page {page_number}: {human_loop_response}")
+            #         except Exception as e:
+            #             logger.error(f"Failed to start human loop for page {page_number}: {str(e)}")
 
         document.hitl_metadata.append(hitl_metadata)
 
@@ -985,7 +992,7 @@ def process_segments(
             except Exception as e:
                 logger.error(f"Error saving to DynamoDB: {str(e)}")
 
-    return document, hitl_triggered
+    return document, overall_hitl_triggered
 
 def handler(event, context):
     """
@@ -1136,7 +1143,7 @@ def handler(event, context):
                             execution_id,
                             document
                         )
-                        if hitl_result:
+                        if hitl_result or hitl_triggered== "true":
                             hitl_triggered = "true"
                 elif isinstance(output_metadata, dict):
                     for asset_id, asset in output_metadata.items():
@@ -1149,7 +1156,7 @@ def handler(event, context):
                             execution_id,
                             document
                         )
-                        if hitl_result:
+                        if hitl_result or hitl_triggered== "true":
                             hitl_triggered = "true"
                 else:
                     logger.error("Unexpected output_metadata format in job_metadata.json")
 
@@ -108,6 +108,12 @@
                     "BackoffRate": 2
                 }
             ],
+            "Catch": [
+                {
+                    "ErrorEquals": ["HITLFailedException"],
+                    "Next": "HITLFailState"
+                }
+            ],
             "Next": "HITLStatusUpdate"
         },
         "HITLStatusUpdate": {
@@ -171,6 +177,11 @@
             "Type": "Fail",
             "Cause": "Data Automation Job Failed",
             "Error": "JobFailedException"
+        },
+        "HITLFailState": {
+            "Type": "Fail",
+            "Cause": "Human In The Loop Review Failed",
+            "Error": "HITLFailedException"
         }
     }
 }
@@ -878,6 +878,8 @@ Resources:
         detail:
           humanLoopStatus:
             - 'Completed'
+            - 'Failed'
+            - 'Stopped'
       State: 'ENABLED'
       Targets:
         - Arn: !GetAtt HITLProcessLambdaFunction.Arn
 
@@ -81,6 +81,19 @@ Parameters:
     Default: ""
     Description: "If you provided a Bedrock Guardrail Id above, provide the corresponding Guardrail version here"
 
+  EnableHITL:
+    Type: String
+    Default: "false"
+    AllowedValues:
+      - "true"
+      - "false"
+    Description: "Enable Human In The Loop (A2I) for document review"
+
+  SageMakerA2IReviewPortalURL:
+    Type: String
+    Default: ""
+    Description: "SageMaker A2I Review Portal URL for HITL workflows"
+
   ConfigurationDefaultS3Uri:
     Type: String
     Description: "S3 URI (s3://bucket/path/config.json) to import default configuration from S3"
@@ -105,6 +118,7 @@ Conditions:
   HasCustomClassificationModelARN : !Not [!Equals [!Ref CustomClassificationModelARN , ""]]
   HasCustomExtractionModelARN : !Not [!Equals [!Ref CustomExtractionModelARN , ""]]
   HasPermissionsBoundary: !Not [!Equals [!Ref PermissionsBoundaryArn, ""]]
+  IsHITLEnabled: !Equals [!Ref EnableHITL, "true"]
 
 
 Resources:
 
@@ -95,9 +95,23 @@ Parameters:
     AllowedPattern: "^(|arn:aws:iam::[0-9]{12}:policy/.+)$"
     ConstraintDescription: Must be empty or a valid IAM policy ARN
 
+  EnableHITL:
+    Type: String
+    Default: "false"
+    AllowedValues:
+      - "true"
+      - "false"
+    Description: "Enable Human In The Loop (A2I) for document review"
+
+  SageMakerA2IReviewPortalURL:
+    Type: String
+    Default: ""
+    Description: "SageMaker A2I Review Portal URL for HITL workflows"
+
 Conditions:
   HasGuardrailConfig: !And [!Not [!Equals [!Ref BedrockGuardrailId, ""]], !Not [!Equals [!Ref BedrockGuardrailVersion, ""]]]
   HasPermissionsBoundary: !Not [!Equals [!Ref PermissionsBoundaryArn, ""]]
+  IsHITLEnabled: !Equals [!Ref EnableHITL, "true"]
 
 Resources:
Original file line number	Diff line number	Diff line change
`@@ -108,6 +108,12 @@`
`108`	`108`	`"BackoffRate": 2`
`109`	`109`	`}`
`110`	`110`	`],`
	`111`	`+ "Catch": [`
	`112`	`+ {`
	`113`	`+ "ErrorEquals": ["HITLFailedException"],`
	`114`	`+ "Next": "HITLFailState"`
	`115`	`+ }`
	`116`	`+ ],`
`111`	`117`	`"Next": "HITLStatusUpdate"`
`112`	`118`	`},`
`113`	`119`	`"HITLStatusUpdate": {`
`@@ -171,6 +177,11 @@`
`171`	`177`	`"Type": "Fail",`
`172`	`178`	`"Cause": "Data Automation Job Failed",`
`173`	`179`	`"Error": "JobFailedException"`
	`180`	`+ },`
	`181`	`+ "HITLFailState": {`
	`182`	`+ "Type": "Fail",`
	`183`	`+ "Cause": "Human In The Loop Review Failed",`
	`184`	`+ "Error": "HITLFailedException"`
`174`	`185`	`}`
`175`	`186`	`}`
`176`	`187`	`}`