marketredesign · marijnvanderhorst · Nov 3, 2022 · Oct 20, 2022 · Oct 20, 2022 · Oct 26, 2022
diff --git a/.idea/pricecypher_python_sdk.iml b/.idea/pricecypher_python_sdk.iml
diff --git a/README.md b/README.md
@@ -26,9 +26,15 @@ datasets.get_transactions(DATASET_ID, AGGREGATE, columns)
 ```
 
 ### Contracts
-The `Script` or `ScopeScript` abstract classes can be extended with their abstract methods implemented to create 
-scripts usable in other services. The `ScopeScript` in particular is intended for scripts that calculate values of 
-certain scopes for transactions. See the documentation on the abstract functions for further specifics.
+The `Script`, `ScopeScript`, and `QualityTestScript` abstract classes can be extended with their abstract methods
+implemented to create scripts usable in other services. 
+
+The `ScopeScript` in particular is intended for scripts that calculate values of certain scopes for transactions. 
+
+The `QualityTestScript` is intended for scripts that check the quality of a data intake and produce a standardized
+output that can be visualized and/or used by other services.
+
+See the documentation on the abstract functions for further specifics.
 
 ## Development
 
@@ -51,7 +57,7 @@ The SDK that this package provides is contained in the top-level package content
 ## Authors
 
 * **Marijn van der Horst** - *Initial work*
-* **Pieter Voors** - *Contracts*
+* **Pieter Voors** - *Contracts for Script and ScopeScript*
 
 See also the list of [contributors](https://github.com/marketredesign/pricecypher_python_sdk/contributors) who participated in this project.
 

diff --git a/setup.cfg b/setup.cfg
@@ -1,6 +1,6 @@
 [metadata]
 name = pricecypher-sdk
-version = 0.4.1
+version = 0.5.0
 author = Deloitte Consulting B.V.
 description = Python wrapper around the different PriceCypher APIs
 long_description = file: README.md
@@ -23,6 +23,7 @@ install_requires =
     requests>=2.14.0
     marshmallow-dataclass>=8.5.3
     pandas>=1.4.1
+    numpy>=1.18.5
     typeguard>=2.13.3
 
 [options.packages.find]

diff --git a/src/pricecypher/contracts/QualityTestScript.py b/src/pricecypher/contracts/QualityTestScript.py
@@ -0,0 +1,26 @@
+from abc import ABC, abstractmethod
+from typing import Optional, Any
+
+from pricecypher.contracts import Script, TestSuite
+
+
+class QualityTestScript(Script, ABC):
+    """
+    The abstract QualityTestScript class serves as an interaction contract such that by extending it with its
+        methods implemented, a script can be created that performs data quality tests on a dataset, which can then be
+        used in a generalized yet controlled setting.
+    """
+
+    def execute(self, business_cell_id: Optional[int], bearer_token: str, user_input: dict[Any: Any]) -> Any:
+        return self.execute_tests(business_cell_id, bearer_token)
+
+    @abstractmethod
+    def execute_tests(self, business_cell_id: Optional[int], bearer_token: str) -> TestSuite:
+        """
+        Execute the script to calculate the values of some scope for the given transactions.
+
+        :param business_cell_id: Business cell to execute the script for, or None if running the script for all.
+        :param bearer_token: Bearer token to use for additional requests.
+        :return: List of all test results that were performed by the test script.
+        """
+        raise NotImplementedError
diff --git a/src/pricecypher/contracts/__init__.py b/src/pricecypher/contracts/__init__.py
@@ -1,2 +1,5 @@
+from .enums import *
+from .dataclasses import *
 from .Script import Script
 from .ScopeScript import ScopeScript
+from .QualityTestScript import QualityTestScript
diff --git a/src/pricecypher/contracts/dataclasses/TestResult.py b/src/pricecypher/contracts/dataclasses/TestResult.py
@@ -0,0 +1,85 @@
+from dataclasses import dataclass
+from typing import Union
+
+from pricecypher.contracts import TestStatus
+
+
+@dataclass
+class ElementTestResult:
+    """
+    Defines a test result of one element of a test.
+
+    key (str): Unique identifier of this element test result (lowercase kebab-case), e.g. 'nr_null'.
+
+    label (str): Label of the element test result for displaying purposes, e.g. 'NULL values'.
+
+    value (str or int): The formatted value of the element test result, e.g. '23,734'.
+    """
+    key: str
+    label: str
+    value: Union[str, int]
+
+
+@dataclass
+class ElementTest:
+    """
+    Defines the test of a single element of a test case, having one or multiple test results. For instance, one element
+    could be a single column of one test that checks the number of NULL values for all columns of a dataset.
+
+    label (str): Label of this single element of the test for displaying purposes, e.g. the name of the column.
+
+    message (str): Short message that describes the test results for displaying purposes, e.g. 'The column has no NULL'.
+
+    results (list[ElementTestResult]): The test results for this single element. For instance, a count of the total
+                                       number of values, a count of the NULL values, and the percentage of NULL values.
+    """
+    label: str
+    message: str
+    status: TestStatus
+    results: list[ElementTestResult]
+
+
+@dataclass
+class TestResult:
+    """
+    Defines one test case with overall status result and multiple test results.
+
+    key (str): Unique identifier of the test (lowercase kebab-case), e.g. 'expect_no_null_values'.
+
+    label (str): Label of the test for displaying purposes, e.g. 'Expect no NULL values in the dataset.'
+
+    coverage (str): Short description to display what is covered by the test, e.g. '10 columns' or 'All transactions'.
+
+    status (TestStatus): Overall status of the test.
+
+    element_label (str): Label to display what the different test elements represent, e.g. 'Column' or 'Dataset'.
+
+    elements (list[ElementTest]): Test results of all the different elements in the test. For instance, the test
+                                  results of all the columns of the dataset.
+    """
+    key: str
+    label: str
+    coverage: str
+    status: TestStatus
+    element_label: str
+    elements: list[ElementTest]
+
+
+@dataclass
+class TestSuite:
+    """
+    One quality test script always produces one TestSuite response. A test suite (usually) contains multiple test cases.
+    It also defines a category that can be used by front-ends to group multiple test suites together.
+
+    label (str): Label of the test suite, e.g. 'Completeness'.
+
+    key (str): Unique identifier of the test suite (lowercase kebab-case), e.g. 'basic-completeness'.
+
+    category_key (str): Unique identifier of the category this test suite is in, e.g. 'basic' or 'advanced'.
+
+    test_results (list[TestResult]): All test cases of this test suite, with their results.
+    """
+    label: str
+    key: str
+    category_key: str
+    test_results: list[TestResult]
diff --git a/src/pricecypher/contracts/dataclasses/__init__.py b/src/pricecypher/contracts/dataclasses/__init__.py
@@ -0,0 +1 @@
+from .TestResult import *
diff --git a/src/pricecypher/contracts/enums/TestStatus.py b/src/pricecypher/contracts/enums/TestStatus.py
@@ -0,0 +1,7 @@
+from enum import Enum
+
+
+class TestStatus(str, Enum):
+    success = "success"
+    warning = "warning"
+    fail = "fail"
diff --git a/src/pricecypher/contracts/enums/__init__.py b/src/pricecypher/contracts/enums/__init__.py
@@ -0,0 +1 @@
+from .TestStatus import TestStatus
diff --git a/src/pricecypher/datasets.py b/src/pricecypher/datasets.py
@@ -147,7 +147,7 @@ def get_transactions(
         :param bool aggregate: If true, the transactions will be grouped on all categorical columns that have no
             aggregation method specified.
         :param list columns: Desired columns in the resulting dataframe. Each column must be a dict. Each column must
-            have either a `representation` or a `name_dataset` specified. The following properties are optional.
+            have a `representation`, `scope_id`, or `name_dataset` specified. The following properties are optional.
                 `filter`: value or list of values the resulting transactions should be filtered on.
                 `aggregate`: aggregation method that should be used for this column. When aggregating and no
                     aggregation method is specified, the method that is used is determined by the underlying dataset

diff --git a/src/pricecypher/encoders/JsonEncoder.py b/src/pricecypher/encoders/JsonEncoder.py
@@ -0,0 +1,21 @@
+import dataclasses
+import numpy as np
+
+from json import JSONEncoder
+
+
+class PriceCypherJsonEncoder(JSONEncoder):
+    """
+    JSON encoder that can properly serialize dataclasses and numpy numbers.
+    """
+    def default(self, obj):
+        if dataclasses.is_dataclass(obj):
+            return dataclasses.asdict(obj)
+        elif isinstance(obj, np.integer):
+            return int(obj)
+        elif isinstance(obj, np.floating):
+            return float(obj)
+        elif isinstance(obj, np.ndarray):
+            return obj.tolist()
+
+        return super().default(obj)
diff --git a/src/pricecypher/encoders/__init__.py b/src/pricecypher/encoders/__init__.py
@@ -0,0 +1 @@
+from .JsonEncoder import PriceCypherJsonEncoder