From e82625ffe73d3c9d3526683c7d6b7cd2fdeb1dfd Mon Sep 17 00:00:00 2001
From: Leonard Gerard <llgerard@amazon.com>
Date: Mon, 9 Jan 2023 17:02:15 -0800
Subject: [PATCH] Add SQS example implementing partial batch failure

---
 .../Cargo.toml                                |  16 ++
 .../README.md                                 |  18 ++
 .../src/main.rs                               | 159 ++++++++++++++++++
 3 files changed, 193 insertions(+)
 create mode 100644 examples/advanced-sqs-partial-batch-failures/Cargo.toml
 create mode 100644 examples/advanced-sqs-partial-batch-failures/README.md
 create mode 100644 examples/advanced-sqs-partial-batch-failures/src/main.rs

diff --git a/examples/advanced-sqs-partial-batch-failures/Cargo.toml b/examples/advanced-sqs-partial-batch-failures/Cargo.toml
new file mode 100644
index 00000000..04067948
--- /dev/null
+++ b/examples/advanced-sqs-partial-batch-failures/Cargo.toml
@@ -0,0 +1,16 @@
+[package]
+name = "advanced-sqs-partial-batch-failures"
+version = "0.1.0"
+edition = "2021"
+
+[dependencies]
+serde = "^1"
+serde_derive = "^1"
+serde_with = { version = "^2", features = ["json"], optional = true }
+serde_json = "^1"
+aws_lambda_events = "0.7.3"
+lambda_runtime = "0.7"
+tokio = { version = "1", features = ["macros"] }
+futures = "0.3"
+tracing = { version = "0.1", features = ["log"] }
+tracing-subscriber = { version = "0.3", default-features = false, features = ["fmt"] }
diff --git a/examples/advanced-sqs-partial-batch-failures/README.md b/examples/advanced-sqs-partial-batch-failures/README.md
new file mode 100644
index 00000000..7b10ca50
--- /dev/null
+++ b/examples/advanced-sqs-partial-batch-failures/README.md
@@ -0,0 +1,18 @@
+# AWS Lambda Function that receives events from SQS
+
+This example shows how to process events from an SQS queue using the partial batch failure feature.
+
+_Important note:_ your Lambda SQS trigger *needs* to be configured with partial batch response support
+(the `ReportBatchItemFailures` flag set to true), otherwise failed messages will not be reprocessed.
+For more details see:
+https://docs.aws.amazon.com/lambda/latest/dg/with-sqs.html#services-sqs-batchfailurereporting
+
+## Build & Deploy
+
+1. Install [cargo-lambda](https://github.com/cargo-lambda/cargo-lambda#installation)
+2. Build the function with `cargo lambda build --release`
+3. Deploy the function to AWS Lambda with `cargo lambda deploy --iam-role YOUR_ROLE`
+
+## Build for ARM 64
+
+Build the function with `cargo lambda build --release --arm64`
\ No newline at end of file
diff --git a/examples/advanced-sqs-partial-batch-failures/src/main.rs b/examples/advanced-sqs-partial-batch-failures/src/main.rs
new file mode 100644
index 00000000..254df031
--- /dev/null
+++ b/examples/advanced-sqs-partial-batch-failures/src/main.rs
@@ -0,0 +1,159 @@
+use aws_lambda_events::{
+    event::sqs::SqsEventObj,
+    sqs::{BatchItemFailure, SqsBatchResponse, SqsMessageObj},
+};
+use futures::Future;
+use lambda_runtime::{run, service_fn, Error, LambdaEvent};
+use serde::{de::DeserializeOwned, Deserialize, Serialize};
+use tracing::Instrument;
+
+/// [To customize] Your object definition, sent to the SQS queue triggering this lambda and deserialized from each message body.
+#[derive(Deserialize, Serialize)]
+struct Data {
+    text: String,
+}
+
+/// [To customize] Your business logic to handle the payload of one SQS message.
+async fn data_handler(data: Data) -> Result<(), Error> {
+    // Placeholder for real processing: this example only logs the received text.
+    tracing::info!(text = ?data.text, "processing data");
+    // Simulate a processing error so that this message gets reported as a failed batch item.
+    if data.text == "bad request" {
+        Err("Processing error".into())
+    } else {
+        Ok(())
+    }
+}
+
+/// Main function for the lambda executable: sets up logging, then serves SQS batches using `data_handler`.
+#[tokio::main]
+async fn main() -> Result<(), Error> {
+    tracing_subscriber::fmt()
+        .with_max_level(tracing::Level::INFO)
+        // Disable printing the name of the module in every log line.
+        .with_target(false)
+        // Disabling time is handy because CloudWatch will add the ingestion time.
+        .without_time()
+        .init();
+
+    run_sqs_partial_batch_failure(data_handler).await
+}
+
+/// This function will handle the message batches from SQS.
+/// It calls the provided user function `f` on every message concurrently and reports to SQS
+/// which messages failed to be processed so that only those are retried.
+///
+/// Important note: your Lambda SQS trigger *needs* to be configured with partial batch response support
+/// with the `ReportBatchItemFailures` flag set to true, otherwise failed messages will be dropped,
+/// for more details see:
+/// https://docs.aws.amazon.com/lambda/latest/dg/with-sqs.html#services-sqs-batchfailurereporting
+///
+///
+/// Note that if you are looking for parallel processing (multithread) instead of concurrent processing,
+/// you can do so by spawning a task inside your function `f`.
+async fn run_sqs_partial_batch_failure<T, D, R>(f: T) -> Result<(), Error>
+where
+    T: Fn(D) -> R,
+    D: DeserializeOwned,
+    R: Future<Output = Result<(), Error>>,
+{
+    run(service_fn(|e| batch_handler(|d| f(d), e))).await // `|d| f(d)` only borrows `f`, so it is reusable for every batch
+}
+
+/// Helper function to lift the user provided `f` function from message to batch of messages.
+/// See `run_sqs_partial_batch_failure` for the easier function to use.
+async fn batch_handler<T, D, F>(
+    f: T,
+    event: LambdaEvent<SqsEventObj<serde_json::Value>>,
+) -> Result<SqsBatchResponse, Error>
+where
+    T: Fn(D) -> F,
+    F: Future<Output = Result<(), Error>>,
+    D: DeserializeOwned,
+{
+    tracing::trace!("Handling batch size {}", event.payload.records.len());
+    let create_task = |msg| {
+        // We need to keep the message_id to report failures to SQS.
+        let SqsMessageObj {
+            message_id, body, ..
+        } = msg;
+        let span = tracing::span!(tracing::Level::INFO, "Handling SQS msg", message_id);
+        let task = async {
+            //TODO catch panics like the `run` function from lambda_runtime
+            f(serde_json::from_value(body)?).await // a body that fails to deserialize into `D` counts as a failed message
+        }
+        .instrument(span);
+        (message_id.unwrap_or_default(), task) // falls back to the default id when the message carries none
+    };
+    let (ids, tasks): (Vec<_>, Vec<_>) = event.payload.records.into_iter().map(create_task).unzip();
+    let results = futures::future::join_all(tasks).await; // Run tasks concurrently; results keep the order of `ids`
+    let failure_items = ids
+        .into_iter()
+        .zip(results)
+        .filter_map(
+            // Only keep the message_id of failed tasks, logging each failure on the way.
+            |(id, res)| match res {
+                Ok(()) => None,
+                Err(err) => {
+                    tracing::error!("Failed to process msg {id}, {err}");
+                    Some(id)
+                }
+            },
+        )
+        .map(|id| BatchItemFailure {
+            item_identifier: id,
+        })
+        .collect();
+
+    Ok(SqsBatchResponse {
+        batch_item_failures: failure_items,
+    })
+}
+
+#[cfg(test)]
+mod test {
+    use lambda_runtime::Context;
+
+    use super::*;
+
+    #[derive(Serialize, Deserialize, Debug)]
+    struct UserData {
+        should_error: bool, // when true, `user_fn` fails for this message
+    }
+    async fn user_fn(data: UserData) -> Result<(), Error> {
+        if data.should_error {
+            Err("Processing Error".into())
+        } else {
+            Ok(())
+        }
+    }
+
+    #[tokio::test]
+    async fn test() -> () {
+        let msg_to_fail: SqsMessageObj<serde_json::Value> = serde_json::from_str(
+            r#"{
+                "messageId": "1",
+                "body": "{\"should_error\": true}"
+            }"#,
+        )
+        .unwrap();
+        let msg_to_succeed: SqsMessageObj<serde_json::Value> = serde_json::from_str(
+            r#"{
+                "messageId": "0",
+                "body": "{\"should_error\" : false}"
+            }"#,
+        )
+        .unwrap();
+
+        let lambda_event = LambdaEvent {
+            payload: SqsEventObj {
+                records: vec![msg_to_fail, msg_to_succeed], // one failing and one succeeding message in the same batch
+            },
+            context: Context::default(),
+        };
+
+        let r = batch_handler(user_fn, lambda_event).await.unwrap();
+        assert_eq!(r.batch_item_failures.len(), 1); // only the failing message is reported
+        assert_eq!(r.batch_item_failures[0].item_identifier, "1"); // and it is identified by its messageId
+    }
+}