From ec0fb0da801e69d05db96901db876f9a5ca24a11 Mon Sep 17 00:00:00 2001 From: Tian Chu Date: Mon, 4 Oct 2021 23:00:15 -0400 Subject: [PATCH 1/2] Ignore non-utf8 characters --- aws/logs_monitoring/parsing.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/aws/logs_monitoring/parsing.py b/aws/logs_monitoring/parsing.py index 5cf4ada7d..0522676a4 100644 --- a/aws/logs_monitoring/parsing.py +++ b/aws/logs_monitoring/parsing.py @@ -200,7 +200,7 @@ def s3_handler(event, context, metadata): else: # Check if using multiline log regex pattern # and determine whether line or pattern separated logs - data = data.decode("utf-8") + data = data.decode("utf-8", errors='ignore') if DD_MULTILINE_LOG_REGEX_PATTERN and multiline_regex_start_pattern.match(data): split_data = multiline_regex.split(data) else: From 445ceba7fd0595e51f427f2567c9216e7730d828 Mon Sep 17 00:00:00 2001 From: Tian Chu Date: Mon, 4 Oct 2021 23:06:59 -0400 Subject: [PATCH 2/2] lint --- aws/logs_monitoring/parsing.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/aws/logs_monitoring/parsing.py b/aws/logs_monitoring/parsing.py index 0522676a4..6ac7e7b79 100644 --- a/aws/logs_monitoring/parsing.py +++ b/aws/logs_monitoring/parsing.py @@ -200,7 +200,7 @@ def s3_handler(event, context, metadata): else: # Check if using multiline log regex pattern # and determine whether line or pattern separated logs - data = data.decode("utf-8", errors='ignore') + data = data.decode("utf-8", errors="ignore") if DD_MULTILINE_LOG_REGEX_PATTERN and multiline_regex_start_pattern.match(data): split_data = multiline_regex.split(data) else: