
Convert manual integration tests to pytest tests #148

Merged · 4 commits · Sep 5, 2023
Changes from 2 commits
5 changes: 4 additions & 1 deletion .gitignore
```diff
@@ -132,4 +132,7 @@ dmypy.json
 .DS_Store
 
 # VSCode
-.vscode/
+.vscode/
+
+# PyCharm
+.idea/
```
7 changes: 5 additions & 2 deletions Makefile
```diff
@@ -22,13 +22,16 @@ update: install # update all python dependencies
 	pipenv update --dev
 
 ## ---- Test commands ---- ##
-test: # run tests and print coverage report
-	pipenv run coverage run --source=lambdas -m pytest -vv
+test: # Run tests and print a coverage report
+	pipenv run coverage run --source=lambdas -m pytest -vv -m "not integration"
 	pipenv run coverage report -m
 
 coveralls: test
 	pipenv run coverage lcov -o ./coverage/lcov.info
 
+test-integration:
+	pipenv run pytest -vv -s -m "integration"
+
 ## ---- Code quality and safety commands ###
 
 # linting commands
```
70 changes: 20 additions & 50 deletions README.md
````diff
@@ -29,61 +29,31 @@ Required env variables:
 - `WORKSPACE=dev`: env for local development, set by Terraform in AWS environments.
 - `SENTRY_DSN`: only needed in production.
 
-### To verify local changes in Dev1
+### Integration Tests for Dev1
 
-- Ensure your aws cli is configured with credentials for the Dev1 account.
-- Ensure you have the above env variables set in your .env, matching those in our Dev1 environment.
-- Add the following to your .env: `LAMBDA_FUNCTION_URL=<the Dev1 lambda function URL>`
-- Publish the lambda function:
+Some minimal integration tests are provided for checking the deployed webhook handling lambda, defined as `integration` type pytest tests. These tests check the following:
+* lambda function URL is operational
+* `GET` and `POST` requests are received
+* deployed lambda has adequate permissions to communicate with S3, StepFunctions, etc.
 
-```bash
-make publish-dev
-make update-lambda-dev
-```
+Other notes about tests:
+* tests are limited to `Dev1` environment
+* AWS `AWSAdministratorAccess` role credentials must be set on developer machine
+* environment variable `WORKSPACE=dev` must be set
+* no other environment variables are required, these are all retrieved from deployed context
 
-#### GET request example
+#### Steps to run integration tests
 
-- Send a GET request with challenge phrase to the lambda function URL:
-
-```bash
-pipenv run python -c "from lambdas.helpers import send_get_to_lambda_function_url; print(send_get_to_lambda_function_url('your challenge phrase'))"
-```
-
-Observe output: `your challenge phrase`
-
-#### POST request examples
-
-- Send a POST request mimicking a webhook POST (not a POD or TIMDEX export job)
-
-```bash
-pipenv run python -c "from lambdas.helpers import send_post_to_lambda_function_url, SAMPLE_WEBHOOK_POST_BODY; print(send_post_to_lambda_function_url(SAMPLE_WEBHOOK_POST_BODY))"
-```
-
-Observe output: `Webhook POST request received and validated, no action taken.`
-
-- Send a POST request mimicking a POD export job webhook
-_Note_: sending a request that mimics a POD export JOB_END will trigger the entire POD workflow, which is fine _in Dev1 only_ for testing.
-
-Add the following to your .env:
-- `VALID_POD_EXPORT_DATE=<the date of a POD export with files in the Dev1 S3 export bucket, in "YYYY-MM-DD" format>` Note: if it's been a while since the last POD export from Alma sandbox, there may be no files in the Dev1 S3 export bucket and you may need to run the publishing job from the sandbox.
-
-```bash
-pipenv run python -c "from lambdas.helpers import send_post_to_lambda_function_url, SAMPLE_POD_EXPORT_JOB_END_WEBHOOK_POST_BODY; print(send_post_to_lambda_function_url(SAMPLE_POD_EXPORT_JOB_END_WEBHOOK_POST_BODY))"
-```
-
-Observe output: `Webhook POST request received and validated, PPOD pipeline initiated.` and then check the Dev1 ppod state machine logs to confirm the entire process ran!
-
-- Send a POST request mimicking a TIMDEX export job webhook
-_Note_: sending a request that mimics a TIMDEX export JOB_END will trigger the entire TIMDEX workflow, which is fine _in Dev1 only_ for testing.
-
-Add the following to your .env:
-- `VALID_TIMDEX_EXPORT_DATE=<the date of a TIMDEX export with files in the Dev1 S3 export bucket, in "YYYY-MM-DD" format>` Note: if it's been a while since the last TIMDEX export from Alma sandbox, there may be no files in the Dev1 S3 export bucket and you may need to run the publishing job from the sandbox.
-
-```bash
-pipenv run python -c "from lambdas.helpers import send_post_to_lambda_function_url, SAMPLE_TIMDEX_EXPORT_JOB_END_WEBHOOK_POST_BODY; print(send_post_to_lambda_function_url(SAMPLE_TIMDEX_EXPORT_JOB_END_WEBHOOK_POST_BODY))"
-```
-
-Observe output: `Webhook POST request received and validated, TIMDEX pipeline initiated.` and then check the Dev1 timdex state machine logs to confirm the entire process ran!
+Update docker image to ensure local changes are deployed to `Dev1`:
+```shell
+make publish-dev
+make update-lambda-dev
+```
+
+Run tests against deployed assets:
+```shell
+make test-integration
+```
````

Contributor (review comment on `#### Steps to run integration tests`): Can we use numbering to enumerate these steps? I think it would help with the readability! :)
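For orientation, the `GET` challenge/echo check can be sketched locally. The function name and example URL below are hypothetical; the deployed test sends a real GET with a `challenge` query parameter that the lambda echoes back:

```python
from urllib.parse import urlencode


def build_challenge_url(function_url: str, challenge: str) -> str:
    # A GET with ?challenge=<phrase> to the function URL should be answered
    # with the same phrase, proving the deployed lambda is operational.
    return f"{function_url.rstrip('/')}/?{urlencode({'challenge': challenge})}"


url = build_challenge_url(
    "https://example.lambda-url.us-east-1.on.aws/", "your challenge phrase"
)
print(url)  # → https://example.lambda-url.us-east-1.on.aws/?challenge=your+challenge+phrase
```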

## Running locally with Docker
37 changes: 0 additions & 37 deletions lambdas/helpers.py
```diff
@@ -5,43 +5,6 @@
 
 import requests
 
-SAMPLE_WEBHOOK_POST_BODY = {
-    "action": "JOB_END",
-    "job_instance": {
-        "name": "Not a POD export job",
-    },
-}
-
-SAMPLE_POD_EXPORT_JOB_END_WEBHOOK_POST_BODY = {
-    "action": "JOB_END",
-    "job_instance": {
-        "name": os.getenv("ALMA_POD_EXPORT_JOB_NAME", "PPOD Export"),
-        "end_time": os.getenv("VALID_POD_EXPORT_DATE", "2022-05-23"),
-        "status": {"value": "COMPLETED_SUCCESS"},
-        "counter": [
-            {
-                "type": {"value": "label.new.records", "desc": "New Records"},
-                "value": "1",
-            },
-        ],
-    },
-}
-
-SAMPLE_TIMDEX_EXPORT_JOB_END_WEBHOOK_POST_BODY = {
-    "action": "JOB_END",
-    "job_instance": {
-        "name": "Publishing Platform Job TIMDEX EXPORT to Dev1 DAILY",
-        "status": {"value": "COMPLETED_SUCCESS"},
-        "end_time": os.getenv("VALID_TIMDEX_EXPORT_DATE", "2022-10-24"),
-        "counter": [
-            {
-                "type": {"value": "label.new.records", "desc": "New Records"},
-                "value": "1",
-            },
-        ],
-    },
-}
 
 
 def generate_signature(message_body: dict) -> str:
     secret = os.environ["ALMA_CHALLENGE_SECRET"]
```
7 changes: 6 additions & 1 deletion pyproject.toml
```diff
@@ -8,6 +8,10 @@ exclude = ["tests/"]
 
 [tool.pytest.ini_options]
 log_level = "INFO"
+markers = [
+    "unit: unit tests",
+    "integration: integration tests"
+]
 
 [tool.ruff]
 target-version = "py311"
@@ -25,7 +29,8 @@ ignore = [
     # project-specific
     "D100",
     "D103",
-    "D104"
+    "D104",
+    "G002"
 ]
 
 # allow autofix behavior for specified rules
```
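The markers registered above are attached to tests with `pytest.mark`; a minimal sketch (test names here are hypothetical, not from the repo):

```python
import pytest


@pytest.mark.unit
def test_pure_logic():
    # selected by `make test` via: pytest -m "not integration"
    assert "JOB_END".startswith("JOB")


@pytest.mark.integration
def test_deployed_lambda():
    # selected only by `make test-integration` via: pytest -m "integration"
    ...
```

Registering markers in `pyproject.toml` lets `-m` expressions select them and silences pytest's unknown-mark warnings (or errors under `--strict-markers`).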
180 changes: 180 additions & 0 deletions tests/conftest.py
@@ -1,16 +1,23 @@
# ruff: noqa: G004
import datetime
import logging
import os
import urllib
from importlib import reload

import boto3
import botocore.session
import pytest
import requests_mock
from botocore.exceptions import ClientError
from botocore.stub import Stubber

import lambdas.helpers
import lambdas.webhook
from lambdas.webhook import lambda_handler

ORIGINAL_ENV = os.environ.copy()


@pytest.fixture(autouse=True)
def _test_env():
@@ -154,3 +161,176 @@ def stubbed_bursar_sfn_client():
with Stubber(sfn) as stubber:
stubber.add_response("start_execution", expected_response, expected_params)
yield sfn


@pytest.fixture
def _set_integration_tests_env_vars() -> None:
Contributor: While the comments help, this is a bit involved and long, so you might consider breaking this up into smaller fixtures that are then called by this fixture, for readability.

Contributor (author): Thanks, that's a good suggestion. This prompted utilizing a context manager to temporarily reset the environment for each integration test, which guarantees it's torn down correctly as well.

Also broke the lambda config and SSM retrievals into their own functions. Hopefully you can look at this fixture now (changes coming in a new commit) and see that it:

  1. uses a context manager to temporarily reset the environment
  2. calls some functions that get data from AWS and set it on the environment
  3. releases all those changes when that test completes
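The context-manager approach described in that reply might look like the following sketch (names hypothetical): swap in a replacement environment, and guarantee the prior one is restored even if the body raises.

```python
import os
from contextlib import contextmanager


@contextmanager
def temporary_environ(replacement: dict):
    # Replace os.environ's contents wholesale; the finally block restores
    # the prior environment no matter how the with-block exits.
    backup = os.environ.copy()
    os.environ.clear()
    os.environ.update(replacement)
    try:
        yield
    finally:
        os.environ.clear()
        os.environ.update(backup)


with temporary_environ({"WORKSPACE": "dev"}):
    assert os.environ["WORKSPACE"] == "dev"
```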

"""Fixture to set os environment variables by retrieving data from AWS.

Because mocked AWS credentials are set in the testing environment, we must
temporarily reinstate the calling environment (e.g. the developer's machine) as it
was when the tests began. Once data about deployed assets (e.g. the lambda function
URL and deployed environment variables) is retrieved, the testing environment is
restored.
"""
# backup current, test env
test_env = os.environ.copy()

# set os.environ as original env before testing framework
# ruff: noqa: B003
os.environ = ORIGINAL_ENV

try:
if not os.getenv("WORKSPACE"):
# ruff: noqa: TRY301, TRY002, TRY003, EM101
raise Exception("WORKSPACE env var must be set for integration tests")

# get lambda configurations
lambda_client = boto3.client("lambda")
lambda_function_config = lambda_client.get_function_configuration(
FunctionName=f"alma-webhook-lambdas-{os.getenv('WORKSPACE').lower()}"
)
lambda_function_env_vars = lambda_function_config["Environment"]["Variables"]
lambda_function_url = lambda_client.get_function_url_config(
FunctionName=f"alma-webhook-lambdas-{os.getenv('WORKSPACE').lower()}"
)["FunctionUrl"]

# get values from parameter store
ssm_client = boto3.client("ssm")
ssm_client.get_parameter(Name="/apps/almahook/alma-pod-export-job-name")[
"Parameter"
]["Value"]
ppod_state_machine_arn = ssm_client.get_parameter(
Name="/apps/almahook/ppod-state-machine-arn"
)["Parameter"]["Value"]
timdex_state_machine_arn = ssm_client.get_parameter(
Name="/apps/almahook/timdex-ingest-state-machine-arn"
)["Parameter"]["Value"]

except Exception:
logging.exception("could not retrieve lambda configurations via boto3")
raise
finally:
# reset testing env vars
os.environ = test_env

# set env vars
os.environ["LAMBDA_FUNCTION_URL"] = lambda_function_url
os.environ["ALMA_CHALLENGE_SECRET"] = lambda_function_env_vars[
"ALMA_CHALLENGE_SECRET"
]
os.environ["ALMA_POD_EXPORT_JOB_NAME"] = "Publishing Platform Job PPOD EXPORT to Dev1"
os.environ["PPOD_STATE_MACHINE_ARN"] = ppod_state_machine_arn
os.environ["VALID_POD_EXPORT_DATE"] = "2023-08-15" # matches fixture date
os.environ["TIMDEX_STATE_MACHINE_ARN"] = timdex_state_machine_arn
os.environ["VALID_TIMDEX_EXPORT_DATE"] = "2023-08-15" # matches fixture date


@pytest.fixture
def _integration_tests_s3_fixtures(_set_integration_tests_env_vars) -> None:
"""Upload integration test fixtures to S3, if they don't already exist.

These s3 files are used by deployed assets during integration tests. This fixture
relies on _set_integration_tests_env_vars as a dependency to ensure AWS credentials
have not been clobbered by testing env vars.
"""
s3 = boto3.client("s3")

def check_and_upload_file(bucket, key):
Contributor: I'm not sure of the best practice on something like this, but this design pattern feels weird (defining a function inside a fixture). It seems possible to just stick this at the top:

    # Specify your bucket and key
    fixtures = [
        (
            "dev-sftp-shared",
            "exlibris/pod/POD_ALMA_EXPORT_20230815_220844[016]_new.tar.gz",
        ),
        (
            "dev-sftp-shared",
            "exlibris/timdex/TIMDEX_ALMA_EXPORT_DAILY_20230815_220844[016]_new.tar.gz",
        ),
    ]
    for bucket, key in fixtures:

But I don't have enough experience with this type of integration test to have much confidence in commenting on this.

Contributor (author): Good call! Much easier to call via a loop, and can tighten up that S3 file check/upload code as well.

try:
s3.head_object(Bucket=bucket, Key=key)
logging.info(f"File s3://{bucket}/{key} already exists, nothing to do!")
except ClientError as e:
error_code = int(e.response["Error"]["Code"])
# ruff: noqa: PLR2004
if error_code == 404:
logging.info(f"File s3://{bucket}/{key} not found. Uploading...")
local_file_path = os.path.join("tests", "fixtures", os.path.basename(key))
if os.path.exists(local_file_path):
s3.upload_file(local_file_path, bucket, key)
logging.info(f"File uploaded to s3://{bucket}/{key}")
else:
msg = f"Fixture file {local_file_path} does not exist."
logging.exception(msg)
raise FileNotFoundError(msg) from None
else:
raise

# fixture files (bucket, key) that deployed assets read during integration tests
fixtures = [
(
"dev-sftp-shared",
"exlibris/pod/POD_ALMA_EXPORT_20230815_220844[016]_new.tar.gz",
),
(
"dev-sftp-shared",
"exlibris/timdex/TIMDEX_ALMA_EXPORT_DAILY_20230815_220844[016]_new.tar.gz",
),
]
for bucket, key in fixtures:
check_and_upload_file(bucket, key)


@pytest.fixture
def sample_webhook_post_body() -> dict:
return {
"action": "JOB_END",
"job_instance": {
"name": "Not a POD export job",
},
}


@pytest.fixture
def sample_pod_export_job_end_webhook_post_body() -> dict:
return {
"action": "JOB_END",
"job_instance": {
"name": os.getenv("ALMA_POD_EXPORT_JOB_NAME", "PPOD Export"),
"end_time": os.getenv("VALID_POD_EXPORT_DATE", "2022-05-23"),
"status": {"value": "COMPLETED_SUCCESS"},
"counter": [
{
"type": {"value": "label.new.records", "desc": "New Records"},
"value": "1",
},
],
},
}


@pytest.fixture
def sample_timdex_export_job_end_webhook_post_body() -> dict:
return {
"action": "JOB_END",
"job_instance": {
"name": "Publishing Platform Job TIMDEX EXPORT to Dev1 DAILY",
"status": {"value": "COMPLETED_SUCCESS"},
"end_time": os.getenv("VALID_TIMDEX_EXPORT_DATE", "2022-10-24"),
"counter": [
{
"type": {"value": "label.new.records", "desc": "New Records"},
"value": "1",
},
],
},
}


def pytest_collection_modifyitems(config, items):
"""Hook that is run after all tests collected, which allows for modification pre-run.

https://docs.pytest.org/en/7.1.x/reference/reference.html#pytest.hookspec.pytest_collection_modifyitems
"""
# skip integration tests if WORKSPACE is not 'dev'
Contributor: I'd move this into the docstring, I like this function

Contributor (author, Sep 1, 2023): Normally I'd agree, but this hook is a built-in function for pytest, and is called just by virtue of being named `pytest_collection_modifyitems`. Therefore, if we want to add other logic that should fire during this hook, it would also get added here.

But now that you mention it... this behavior could be put into another function that this hook calls. Then, that function's docstring can explain what it does, and future logic / functions could be added to this hook if needed.

Thanks for flagging!

allowed_test_environments = ["dev"]
for item in items:
if (
item.get_closest_marker("integration")
and os.getenv("WORKSPACE") not in allowed_test_environments
):
item.add_marker(
pytest.mark.skip(
reason="integration tests currently only support environments: %s"
% allowed_test_environments
)
)
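The environment guard in the hook above can be exercised in isolation with a standalone sketch of the same check (function name hypothetical):

```python
ALLOWED_TEST_ENVIRONMENTS = ["dev"]


def integration_tests_allowed(environ) -> bool:
    # Mirrors the collection hook: integration tests run only when WORKSPACE
    # is one of the allowed environments; everything else gets skipped.
    return environ.get("WORKSPACE") in ALLOWED_TEST_ENVIRONMENTS


print(integration_tests_allowed({"WORKSPACE": "dev"}))  # → True
print(integration_tests_allowed({"WORKSPACE": "stage"}))  # → False
```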
Binary file not shown.
Binary file not shown.
Empty file added tests/integration/__init__.py