New serverless pattern - Serverless Messaging Redrive #2543

Open · wants to merge 2 commits into base: `main` · Changes from 1 commit
58 changes: 58 additions & 0 deletions serverless-message-processing/README.md
# Serverless Message Processing Pattern

## Overview
An adaptable pattern for message processing using AWS serverless services, featuring error handling and automatic recovery mechanisms.

## Core Components
- API Gateway (message ingestion)
- SQS Queues (main + DLQs)
- Lambda Functions (processing + recovery)

## Basic Flow
1. Messages enter through API Gateway
2. The main SQS queue receives and durably stores the messages
3. A processor Lambda function polls the main queue via an Event Source Mapping (ESM) and handles the messages

> **Review comment:** Would include that this Lambda function polls the main queue using Event Source Mappings (ESMs) and handles the messages. Include links to docs / blogs / posts where they can build understanding.

4. Messages that cannot be processed (for example, a malformed email address) are routed to a DLQ once their retries are exhausted

> **Review comment:** If you're going to use terse statements in a numbered or bulleted list, it would be good to include a fuller explanation alongside them. In this context, what's a "failed message"? See if you can go a level deeper to explain what's going on, as it may be confusing to somebody unfamiliar with the pattern or certain service features, like DLQs.

5. A decision-maker Lambda function attempts automated recovery, redelivering fixed messages to the main queue
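To make steps 2-4 concrete, here is a minimal sketch of what a processor Lambda for this pattern could look like. This is illustrative, not the repository's actual processor: it assumes the message body carries an `email` field and uses the standard SQS partial-batch-response contract so that only failed messages are retried.

```python
import json
import re

# Sketch only: an illustrative processor Lambda. The SQS Event Source Mapping
# (ESM) polls the main queue and invokes this handler with batches of records.
EMAIL_PATTERN = r'^[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\.[a-zA-Z]{2,}$'

def lambda_handler(event, context):
    # Collect per-message failures so only the bad messages are retried;
    # after maxReceiveCount retries, SQS moves them to the DLQ automatically.
    failures = []
    for record in event['Records']:
        body = json.loads(record['body'])
        if not re.match(EMAIL_PATTERN, body.get('email', '')):
            failures.append({'itemIdentifier': record['messageId']})
    return {'batchItemFailures': failures}
```

Note that returning `batchItemFailures` only takes effect when `ReportBatchItemFailures` is enabled on the event source mapping.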

## Deployment

> **Review comment:** Likely to come up in @ellisms review, but we typically include a statement on users being responsible for spinning up / tearing down / paying for resources in their own AWS accounts. We'd also typically talk about having the AWS CLI installed and configured as a pre-requisite to using SAM. Take a look at some other SAM examples to get a feel for the norm.

```bash
# Build the SAM application
sam build

# Deploy the application
sam deploy --guided
```

## Key Features

> **Review comment:** These may make sense to you in the context of being the author, but somebody coming to this as a new idea will need each of these explaining.

- Automatic retry mechanism: failed messages are redriven from the DLQ back to the main queue once fixed
- Segregation of recoverable and fatal errors: fixable messages return to the main queue, while unfixable ones land in a fatal DLQ for human intervention
- Extensible processing logic: validation and fix rules can be extended to cover new failure scenarios

## API Reference
### Send Message

> **Review comment:** Good idea to include a copy of the API contract, but it would be nice to see commands that users can use in their terminal as an example, `curl https://${endpoint}/message...` with the relevant params to send a sample message.

```
POST /message
Content-Type: application/json
```
```json
{
  "messageType": "TYPE_A|TYPE_B|TYPE_C",
  "payload": {},
  "timestamp": "ISO8601_TIMESTAMP"
}
```
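To exercise this contract, a sample message can be sent with Python's standard library. The endpoint URL below is a placeholder; substitute the API endpoint that `sam deploy --guided` prints as a stack output.

```python
import json
import urllib.request

# Placeholder endpoint: substitute the API URL output by `sam deploy --guided`
ENDPOINT = "https://abc123.execute-api.us-east-1.amazonaws.com/Prod/message"

payload = {
    "messageType": "TYPE_A",
    "payload": {"email": "user@example.com"},
    "timestamp": "2024-01-01T00:00:00Z",
}

req = urllib.request.Request(
    ENDPOINT,
    data=json.dumps(payload).encode("utf-8"),
    headers={"Content-Type": "application/json"},
    method="POST",
)
# Uncomment once the stack is deployed:
# with urllib.request.urlopen(req) as resp:
#     print(resp.status, resp.read().decode())
```

An equivalent `curl` call would POST the same JSON body with a `Content-Type: application/json` header.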


## Adaptation Points

> **Review comment:** If you want to keep a terse list then you might need a sentence or two before the list to explain what you mean by Adaptation Points (earlier you called it extensible; pick one way of describing this concept).

- Message validation rules
- Processing logic
- Error handling strategies
- Recovery mechanisms
- Monitoring requirements
- API Design

## Note

> **Review comment:** What's this section, or is it a note to self that should have been deleted?

This is a sample pattern. Adapt security, scaling, and processing logic according to your requirements.
60 changes: 60 additions & 0 deletions serverless-message-processing/example-pattern.json

> **Review comment:** @zalilias you need to rename the file to be in line with the name of your pattern and replace the contents of the template / example with information about your pattern.

```json
{
  "title": "Step Functions to Athena",
  "description": "Create a Step Functions workflow to query Amazon Athena.",
  "language": "Python",
  "level": "200",
  "framework": "SAM",
  "introBox": {
    "headline": "How it works",
    "text": [
      "This sample project demonstrates how to use a serverless solution for processing and fixing malformed messages using SQS queues and Lambda functions.",
      "The system automatically handles message validation, applies fixes where possible, and routes messages to appropriate queues based on their fixability.",
      "With built-in error handling and detailed logging, it provides a robust framework for message processing that can be easily extended for specific business needs.",
      "This pattern uses AWS Lambda for processing and multiple SQS queues for message routing, and includes two dead-letter queues (DLQs) for messages requiring human intervention or auto-remediation."
    ]
  },
  "gitHub": {
    "template": {
      "repoURL": "https://github.com/aws-samples/serverless-patterns/tree/main/serverless-messaging-processing",
      "templateURL": "serverless-patterns/serverless-messaging-processing",
      "projectFolder": "serverless-messaging-processing",
      "templateFile": "template.yaml"
    }
  },
  "resources": {
    "bullets": [
      {
        "text": "Amazon SQS Docs",
        "link": "https://docs.aws.amazon.com/AWSSimpleQueueService/latest/SQSDeveloperGuide/welcome.html"
      },
      {
        "text": "Using dead-letter queues in Amazon SQS",
        "link": "https://docs.aws.amazon.com/AWSSimpleQueueService/latest/SQSDeveloperGuide/sqs-dead-letter-queues.html"
      }
    ]
  },
  "deploy": {
    "text": [
      "sam build",
      "sam deploy --guided"
    ]
  },
  "testing": {
    "text": [
      "See the GitHub repo for detailed testing instructions."
    ]
  },
  "cleanup": {
    "text": [
      "Delete the stack: <code>sam delete</code>."
    ]
  },
  "authors": [
    {
      "name": "Ilias Ali",
      "image": "link-to-your-photo.jpg",
      "bio": "I am a Solutions Architect working at AWS based in the UK.",
      "linkedin": "ilias-ali-0849991a4"
    }
  ]
}
```
143 changes: 84 additions & 59 deletions serverless-message-processing/functions/decision_maker/app.py

> **Review comment:** I couldn't see where you were making use of the original failure message from the main queue to decide which branching logic to take. Using your "email fix" as an example:
>
> 1. Invalid email address provided in payload to API GW.
> 2. Message stored durably in SQS main queue.
> 3. Lambda function polls the queue and attempts to use that malformed email address with some imagined downstream service.
> 4. Downstream service returns an error due to the malformed email.
> 5. Your main Lambda poller would send a response to SQS for that message and give a failure reason (a shared enum of failures, maybe), in this example "MALFORMED_EMAIL".
> 6. When your decision maker picks that up, I presumed that it would switch through those failure reasons and apply the relevant fix.
>
> For this example it's fine to just use the email scenario as one example, with the view that the enum can be extended and more failure scenarios might be encountered.
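The flow the reviewer describes could be sketched roughly as follows. The names `FailureReason`, `FIXERS`, and `decide` are hypothetical, not part of the pattern's code; the point is a shared enum of failure reasons with a registry of remediations that the decision maker switches through.

```python
from enum import Enum

# Illustrative only: FailureReason and FIXERS are hypothetical names.
# The decision maker switches on a shared enum of failure reasons.
class FailureReason(Enum):
    MALFORMED_EMAIL = "MALFORMED_EMAIL"
    UNKNOWN = "UNKNOWN"

def fix_malformed_email(message):
    # Minimal remediation: strip whitespace from the email field
    message["email"] = message["email"].strip().replace(" ", "")
    return message

# Registry of remediations; extend as new failure scenarios are encountered
FIXERS = {FailureReason.MALFORMED_EMAIL: fix_malformed_email}

def decide(message):
    """Return the fixed message, or None if it belongs in the fatal DLQ."""
    reason = FailureReason(message.get("failureReason", "UNKNOWN"))
    fixer = FIXERS.get(reason)
    return fixer(message) if fixer else None
```

With this shape, adding a new failure scenario means adding one enum member and one entry in the registry, without touching the routing logic.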

```diff
@@ -1,4 +1,5 @@
 import json
+import re
 import boto3
 import os
 import logging
@@ -14,109 +15,133 @@
 MAIN_QUEUE_URL = os.environ['MAIN_QUEUE_URL']
 FATAL_DLQ_URL = os.environ['FATAL_DLQ_URL']
 
-def can_fix_message(message):
-    """
-    Determine if a message can be fixed automatically.
-
-    Extension points:
-    1. Add validation for specific message formats
-    2. Implement business-specific fix rules
-    3. Add data transformation logic
-    4. Implement retry strategies
-    5. Add validation against external systems
-    """
-    try:
-        # Basic message validation
-        # Add your validation logic here
-        return True
-    except Exception as e:
-        logger.error(f"Validation error: {str(e)}")
-        return False
+# Email validation pattern
+EMAIL_PATTERN = r'^[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\.[a-zA-Z]{2,}$'
+
+def fix_email(email):
+    """
+    Attempt to fix common email format issues.
+    Can be amended to cover other scenarios, e.g. downstream issues.
+    """
+    # Remove multiple @ symbols, keep the last one
+    if email.count('@') > 1:
+        parts = email.split('@')
+        email = f"{parts[0]}@{parts[-1]}"
+
+    # Remove spaces
+    email = email.strip().replace(' ', '')
+
+    # Fix common typos in domain extensions
+    common_fixes = {
+        '.con': '.com',
+        '.vom': '.com',
+        '.comm': '.com',
+        '.orgg': '.org',
+        '.nett': '.net'
+    }
+
+    for wrong, right in common_fixes.items():
+        if email.endswith(wrong):
+            email = email[:-len(wrong)] + right
+
+    return email
 
-def fix_message(message):
-    """
-    Apply fixes to the message.
-
-    Extension points:
-    1. Add data normalization
-    2. Implement field-specific fixes
-    3. Add data enrichment
-    4. Implement format conversion
-    5. Add validation rules
-    """
-    try:
-        fixed_message = message.copy()
-        # Add your fix logic here
-        fixed_message['wasFixed'] = True
-        return fixed_message
-    except Exception as e:
-        logger.error(f"Fix error: {str(e)}")
-        return None
+def can_fix_email(message):
+    """
+    Check if the email in the message can be fixed.
+    """
+    if 'email' not in message:
+        return False
+
+    email = message['email']
+    fixed_email = fix_email(email)
+
+    return bool(re.match(EMAIL_PATTERN, fixed_email))
 
 
 def lambda_handler(event, context):
     """
-    Process messages and route them based on fixability.
+    Processes messages from a DLQ that have already failed automatic processing,
+    attempts automated remediation, and redelivers the messages back to the main
+    queue. If no suitable fix can be applied, messages end up in a fatal DLQ,
+    where human intervention is typically required.
 
     Flow:
     1. Attempt to fix message
     2. If fixable -> Main Queue
```
> **Review comment:** This isn't always true, is it? If a message needs to be held for a period before being retried, this function would deliver the message to a "delay queue" and end its responsibility there. The delay queue is then responsible for delivering the message back to the main queue.

```diff
     3. If unfixable -> Fatal DLQ
 
     Extension points:
-    1. Add more sophisticated routing logic
+    1. Add more sophisticated routing logic, including a delay queue
     2. Implement custom error handling
     3. Add message transformation
     4. Implement retry mechanisms
     5. Add monitoring and metrics
     """
-
-    """
     processed_count = 0
 
     for record in event['Records']:
-        message_id = 'unknown'  # Initialize message_id with default value
+        original_message_id = 'unknown'  # Initialize with a default value
 
         try:
             # Parse the message body
             message = json.loads(record['body'])
-            message_id = record.get('messageId', 'unknown')
+            original_message_id = record.get('messageId', 'unknown')
 
-            logger.info(f"Processing message: {message_id}")
+            logger.info(f"Processing failed message: {original_message_id}")
 
-            if can_fix_message(message):
-                fixed_message = fix_message(message)
-                if fixed_message:
-                    # Send to main queue
-                    sqs.send_message(
-                        QueueUrl=MAIN_QUEUE_URL,
-                        MessageBody=json.dumps(fixed_message)
-                    )
-                    logger.info(f"Fixed message sent to main queue: {message_id}")
-                else:
-                    raise ValueError("Message fix failed")
-
+            # Option A: Try to fix malformed email
+            if can_fix_email(message) and not re.match(EMAIL_PATTERN, message['email']):
```
> **Review comment:** Your function can_fix_email() seems to itself make a call (line 57) to fix_email() and then you call the same function again on the next line (line 98). Why does it need to be called twice? Seems like you have functions with mixed responsibilities.

```diff
+                fixed_email = fix_email(message['email'])
+                logger.info(f"Fixed email from '{message['email']}' to '{fixed_email}'")
+
+                # Update the message with the fixed email
+                message['email'] = fixed_email
+                message['emailWasFixed'] = True
+
+                # Send back to main queue
+                sqs.send_message(
+                    QueueUrl=MAIN_QUEUE_URL,
+                    MessageBody=json.dumps(message)
+                )
+
+                logger.info(f"Sent fixed message back to main queue: {original_message_id}")
+
+            # Option B: Cannot fix - send to fatal DLQ
             else:
+                logger.warning(f"Message cannot be fixed, sending to fatal DLQ: {original_message_id}")
+
+                # Add failure reason if not present
+                if 'failureReason' not in message:
+                    message['failureReason'] = 'Unrecoverable error - could not fix message'
+
                 # Send to fatal DLQ
-                message['failureReason'] = 'Message cannot be automatically fixed'
                 sqs.send_message(
                     QueueUrl=FATAL_DLQ_URL,
                     MessageBody=json.dumps(message)
                 )
-                logger.warning(f"Message sent to fatal DLQ: {message_id}")
-
 
             processed_count += 1
 
         except Exception as e:
-            logger.error(f"Error processing message {message_id}: {str(e)}")
+            logger.error(f"Error processing message {original_message_id}: {str(e)}")
             # If we can't process the decision, send to fatal DLQ
             try:
                 error_message = {
                     'originalMessage': record['body'],
-                    'failureReason': str(e),
+                    'failureReason': f"Decision maker error: {str(e)}",
                     'timestamp': context.invoked_function_arn
                 }
                 sqs.send_message(
                     QueueUrl=FATAL_DLQ_URL,
                     MessageBody=json.dumps(error_message)
                 )
-                logger.error(f"Error message sent to fatal DLQ: {message_id}")
-
             except Exception as fatal_e:
-                logger.critical(f"Fatal DLQ error: {str(fatal_e)}")
+                logger.critical(f"Could not send to fatal DLQ: {str(fatal_e)}")
                 raise
 
     return {
```
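As a quick sanity check of the email-fixing behavior in this diff, `fix_email` can be exercised standalone (logic reproduced from the function above):

```python
# Standalone copy of the fix_email logic from the decision maker above
def fix_email(email):
    # Remove multiple @ symbols, keep the last one
    if email.count('@') > 1:
        parts = email.split('@')
        email = f"{parts[0]}@{parts[-1]}"
    # Remove spaces
    email = email.strip().replace(' ', '')
    # Fix common typos in domain extensions
    common_fixes = {'.con': '.com', '.vom': '.com', '.comm': '.com',
                    '.orgg': '.org', '.nett': '.net'}
    for wrong, right in common_fixes.items():
        if email.endswith(wrong):
            email = email[:-len(wrong)] + right
    return email

print(fix_email('user@@example.con'))  # → user@example.com
```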
```diff
@@ -1,2 +1 @@
 boto3==1.26.137
-jsonschema==4.17.3
```
```diff
@@ -1,2 +1 @@
 boto3==1.26.137
-jsonschema==4.17.3
```