Refactoring and addition of DataManager

milesgranger · May 5, 2018 · 2c83ab8 · 2c83ab8
1 parent b1dc75c
commit 2c83ab8
Show file tree

Hide file tree

Showing 86 changed files with 194 additions and 30 deletions.
diff --git a/.gitignore b/.gitignore
@@ -10,8 +10,6 @@ __pycache__/
 *.py[cod]
 *$py.class
 *.sqlite
-*.gz
-*.csv
 *.pkl
 output.txt
 
@@ -101,12 +99,3 @@ ENV/
 
 # Rope project settings
 .ropeproject
-/raw_data_persist.sqlite
-/imgs/
-/node_modules/
-!/static/js/bundle.js
-/static/js/bundle.js
-/opplett/static/js/bundle.js
-opplett/static/js/
-!/opplett/static/js/
-/opplett/data/data.csv
diff --git a/hemlock_highway/__init__.py b/hemlock_highway/__init__.py
@@ -1,2 +1 @@
-
 __version__ = "0.0.1dev"
diff --git a/hemlock_highway/__main__.py b/hemlock_highway/__main__.py
@@ -9,7 +9,7 @@
     sys.path.append(PATH)
 
 from hemlock_highway.server import app
-from hemlock_highway.config import Config
+from hemlock_highway.server.config import Config
 
 config = Config()
 

diff --git a/hemlock_highway/data_manager/README.md b/hemlock_highway/data_manager/README.md
@@ -0,0 +1,6 @@
+## Data Manager
+
+Logic to handle the pre-processing of uploaded data.
+
+The resulting object, which parses raw data into a format suitable for a
+`Pipeline` object, is part of the end model's pre-processing step.
diff --git a/hemlock_highway/data_manager/__init__.py b/hemlock_highway/data_manager/__init__.py
@@ -0,0 +1 @@
+from .manager import DataManager
diff --git a/hemlock_highway/data_manager/manager.py b/hemlock_highway/data_manager/manager.py
@@ -0,0 +1,51 @@
+# -*- coding: utf-8 -*-
+
+import io
+import boto3
+import pandas as pd
+from hemlock_highway.settings import PROJECT_CONFIG
+
+
+class DataManager:
+
+    X, y = pd.DataFrame(), pd.Series()
+
+    def __new__(cls, *args, **kwargs):
+        cls.s3_client = boto3.client('s3', region_name=PROJECT_CONFIG.AWS_REGION)
+        return super().__new__(cls)
+
+    def __init__(self, data_endpoint: str, target_column: str, **read_args):
+        """
+        Load the head of data stored at either a bucket location, or an http endpoint
+
+        Parameters
+        ----------
+        data_endpoint: str  - Either an s3 bucket or an http endpoint
+        target_column: str  - After loading the dataset, this is designated as the target column
+        read_args: dict     - Any additional pandas.read_csv() kwargs
+        """
+        self.data_endpoint = data_endpoint
+        self.target_column = target_column
+        self.read_args = read_args
+
+    def load(self):
+        """
+        Execute the load from either http or s3
+        """
+        if self.data_endpoint.startswith('http://') or self.data_endpoint.startswith('https://'):
+            self.X = pd.read_csv(filepath_or_buffer=self.data_endpoint, **self.read_args)
+        else:
+            resp = self.s3_client.get_object(Bucket=self.data_endpoint.split('/')[0],
+                                             Key='/'.join(self.data_endpoint.split('/')[1:])
+                                             )
+            if resp['ResponseMetadata']['HTTPStatusCode'] == 200:
+                self.X = pd.read_csv(io.BytesIO(resp['Body'].read()), **self.read_args)
+            else:
+                raise IOError(f'Error fetching dataset from S3: {resp}')
+
+        self.y = self.X[self.target_column]
+        self.X = self.X[[col for col in self.X.columns if col != self.target_column]]
+
+    @property
+    def _loaded(self):
+        return self.X.shape[0] > 0 if hasattr(self.X, 'shape') else False
diff --git a/hemlock_highway/ml/README.md b/hemlock_highway/ml/README.md
@@ -0,0 +1,2 @@
+This package contains models suitable for use
+by the `model_runner` and `server` resources.
diff --git a/hemlock_highway/ml/models/abc_model.py b/hemlock_highway/ml/models/abc_model.py
@@ -5,11 +5,13 @@
 import zlib
 import pickle
 
+from hemlock_highway.settings import PROJECT_CONFIG
+
 
 class AbcHemlockModel:
 
     def __new__(cls, *args, **kwargs):
-        cls.client = boto3.client('s3', region_name='us-east-1')
+        cls.s3_client = boto3.client('s3', region_name=PROJECT_CONFIG.AWS_REGION)
         return super().__new__(cls)
 
     @staticmethod
@@ -29,8 +31,8 @@ def dump(self, bucket: str, key: str, name: str):
         Dump a model to s3
         """
         model_out = zlib.compress(pickle.dumps(self))
-        self.client.create_bucket(Bucket=bucket)
-        resp = self.client.put_object(Bucket=bucket, Key=f'{key}/{name}', Body=model_out)
+        self.s3_client.create_bucket(Bucket=bucket)
+        resp = self.s3_client.put_object(Bucket=bucket, Key=f'{key}/{name}', Body=model_out)
         if resp['ResponseMetadata']['HTTPStatusCode'] == 200:
             return True
         else:
@@ -42,7 +44,7 @@ def load(cls, bucket: str, key: str, name: str):
         """
         Load a model from S3
         """
-        model = cls().client.get_object(Bucket=bucket, Key=f'{key}/{name}')['Body'].read()
+        model = cls().s3_client.get_object(Bucket=bucket, Key=f'{key}/{name}')['Body'].read()
         model = pickle.loads(zlib.decompress(model))
         return model
 

diff --git a/hemlock_highway/model_runner/README.md b/hemlock_highway/model_runner/README.md
@@ -0,0 +1,3 @@
+## Model Runner
+
+API service that accepts requests to train a model or make predictions.
diff --git a/hemlock_highway/api/__init__.py → hemlock_highway/model_runner/__init__.py b/hemlock_highway/api/__init__.py → hemlock_highway/model_runner/__init__.py
diff --git a/hemlock_highway/server/__init__.py b/hemlock_highway/server/__init__.py
@@ -0,0 +1 @@
+from .server import app
diff --git a/hemlock_highway/server/api/__init__.py b/hemlock_highway/server/api/__init__.py
@@ -0,0 +1 @@
+from .v1 import api_v1_blueprint
diff --git a/hemlock_highway/api/v1/__init__.py → hemlock_highway/server/api/v1/__init__.py b/hemlock_highway/api/v1/__init__.py → hemlock_highway/server/api/v1/__init__.py
diff --git a/...ighway/api/v1/pluggable_views/__init__.py → ...server/api/v1/pluggable_views/__init__.py b/...ighway/api/v1/pluggable_views/__init__.py → ...server/api/v1/pluggable_views/__init__.py
diff --git a/hemlock_highway/api/v1/views.py → hemlock_highway/server/api/v1/views.py b/hemlock_highway/api/v1/views.py → hemlock_highway/server/api/v1/views.py
diff --git a/hemlock_highway/config.py → hemlock_highway/server/config.py b/hemlock_highway/config.py → hemlock_highway/server/config.py
diff --git a/hemlock_highway/server.py → hemlock_highway/server/server.py b/hemlock_highway/server.py → hemlock_highway/server/server.py
@@ -2,12 +2,12 @@
 
 from flask import Flask, request
 
-from hemlock_highway.config import Config
+from hemlock_highway.server.config import Config
 
 # blueprints
-from hemlock_highway.api.v1 import api_v1_blueprint
-from hemlock_highway.ui import ui_blueprint
-from hemlock_highway.user_mgmt import google_auth_blueprint
+from hemlock_highway.server.api import api_v1_blueprint
+from hemlock_highway.server.ui import ui_blueprint
+from hemlock_highway.server.user_mgmt import google_auth_blueprint
 
 
 app = Flask(__name__)
@@ -19,6 +19,6 @@
 app.register_blueprint(google_auth_blueprint, url_prefix='/google-login')
 
 
-@app.route('/echo')
-def echo():
-    return request.args.get('word')
+@app.route('/health-check')
+def health_check():
+    return 'ahola', 200
diff --git a/hemlock_highway/ui/__init__.py → hemlock_highway/server/ui/__init__.py b/hemlock_highway/ui/__init__.py → hemlock_highway/server/ui/__init__.py
diff --git a/hemlock_highway/ui/static/css/bootstrap.css → ...ighway/server/ui/static/css/bootstrap.css b/hemlock_highway/ui/static/css/bootstrap.css → ...ighway/server/ui/static/css/bootstrap.css
diff --git a/...k_highway/ui/static/css/bootstrap.min.css → ...ay/server/ui/static/css/bootstrap.min.css b/...k_highway/ui/static/css/bootstrap.min.css → ...ay/server/ui/static/css/bootstrap.min.css
diff --git a/...ghway/ui/static/css/stylish-portfolio.css → ...erver/ui/static/css/stylish-portfolio.css b/...ghway/ui/static/css/stylish-portfolio.css → ...erver/ui/static/css/stylish-portfolio.css
diff --git a/.../static/font-awesome/css/font-awesome.css → .../static/font-awesome/css/font-awesome.css b/.../static/font-awesome/css/font-awesome.css → .../static/font-awesome/css/font-awesome.css
diff --git a/...tic/font-awesome/css/font-awesome.min.css → ...tic/font-awesome/css/font-awesome.min.css b/...tic/font-awesome/css/font-awesome.min.css → ...tic/font-awesome/css/font-awesome.min.css
diff --git a/...static/font-awesome/fonts/FontAwesome.otf → ...static/font-awesome/fonts/FontAwesome.otf b/...static/font-awesome/fonts/FontAwesome.otf → ...static/font-awesome/fonts/FontAwesome.otf
diff --git a/...ont-awesome/fonts/fontawesome-webfont.eot → ...ont-awesome/fonts/fontawesome-webfont.eot b/...ont-awesome/fonts/fontawesome-webfont.eot → ...ont-awesome/fonts/fontawesome-webfont.eot
diff --git a/...ont-awesome/fonts/fontawesome-webfont.svg → ...ont-awesome/fonts/fontawesome-webfont.svg b/...ont-awesome/fonts/fontawesome-webfont.svg → ...ont-awesome/fonts/fontawesome-webfont.svg
diff --git a/...ont-awesome/fonts/fontawesome-webfont.ttf → ...ont-awesome/fonts/fontawesome-webfont.ttf b/...ont-awesome/fonts/fontawesome-webfont.ttf → ...ont-awesome/fonts/fontawesome-webfont.ttf
diff --git a/...nt-awesome/fonts/fontawesome-webfont.woff → ...nt-awesome/fonts/fontawesome-webfont.woff b/...nt-awesome/fonts/fontawesome-webfont.woff → ...nt-awesome/fonts/fontawesome-webfont.woff
diff --git a/...t-awesome/fonts/fontawesome-webfont.woff2 → ...t-awesome/fonts/fontawesome-webfont.woff2 b/...t-awesome/fonts/fontawesome-webfont.woff2 → ...t-awesome/fonts/fontawesome-webfont.woff2
diff --git a/...ui/static/font-awesome/less/animated.less → ...ui/static/font-awesome/less/animated.less b/...ui/static/font-awesome/less/animated.less → ...ui/static/font-awesome/less/animated.less
diff --git a/...ic/font-awesome/less/bordered-pulled.less → ...ic/font-awesome/less/bordered-pulled.less b/...ic/font-awesome/less/bordered-pulled.less → ...ic/font-awesome/less/bordered-pulled.less
diff --git a/...way/ui/static/font-awesome/less/core.less → ...ver/ui/static/font-awesome/less/core.less b/...way/ui/static/font-awesome/less/core.less → ...ver/ui/static/font-awesome/less/core.less
diff --git a/...static/font-awesome/less/fixed-width.less → ...static/font-awesome/less/fixed-width.less b/...static/font-awesome/less/fixed-width.less → ...static/font-awesome/less/fixed-width.less
diff --git a/...tatic/font-awesome/less/font-awesome.less → ...tatic/font-awesome/less/font-awesome.less b/...tatic/font-awesome/less/font-awesome.less → ...tatic/font-awesome/less/font-awesome.less
diff --git a/...ay/ui/static/font-awesome/less/icons.less → ...er/ui/static/font-awesome/less/icons.less b/...ay/ui/static/font-awesome/less/icons.less → ...er/ui/static/font-awesome/less/icons.less
diff --git a/...y/ui/static/font-awesome/less/larger.less → ...r/ui/static/font-awesome/less/larger.less b/...y/ui/static/font-awesome/less/larger.less → ...r/ui/static/font-awesome/less/larger.less
diff --git a/...way/ui/static/font-awesome/less/list.less → ...ver/ui/static/font-awesome/less/list.less b/...way/ui/static/font-awesome/less/list.less → ...ver/ui/static/font-awesome/less/list.less
diff --git a/...y/ui/static/font-awesome/less/mixins.less → ...r/ui/static/font-awesome/less/mixins.less b/...y/ui/static/font-awesome/less/mixins.less → ...r/ui/static/font-awesome/less/mixins.less
diff --git a/...way/ui/static/font-awesome/less/path.less → ...ver/ui/static/font-awesome/less/path.less b/...way/ui/static/font-awesome/less/path.less → ...ver/ui/static/font-awesome/less/path.less
diff --git a/...ic/font-awesome/less/rotated-flipped.less → ...ic/font-awesome/less/rotated-flipped.less b/...ic/font-awesome/less/rotated-flipped.less → ...ic/font-awesome/less/rotated-flipped.less
diff --git a/.../ui/static/font-awesome/less/stacked.less → .../ui/static/font-awesome/less/stacked.less b/.../ui/static/font-awesome/less/stacked.less → .../ui/static/font-awesome/less/stacked.less
diff --git a/...i/static/font-awesome/less/variables.less → ...i/static/font-awesome/less/variables.less b/...i/static/font-awesome/less/variables.less → ...i/static/font-awesome/less/variables.less
diff --git a/...i/static/font-awesome/scss/_animated.scss → ...i/static/font-awesome/scss/_animated.scss b/...i/static/font-awesome/scss/_animated.scss → ...i/static/font-awesome/scss/_animated.scss
diff --git a/...c/font-awesome/scss/_bordered-pulled.scss → ...c/font-awesome/scss/_bordered-pulled.scss b/...c/font-awesome/scss/_bordered-pulled.scss → ...c/font-awesome/scss/_bordered-pulled.scss
diff --git a/...ay/ui/static/font-awesome/scss/_core.scss → ...er/ui/static/font-awesome/scss/_core.scss b/...ay/ui/static/font-awesome/scss/_core.scss → ...er/ui/static/font-awesome/scss/_core.scss
diff --git a/...tatic/font-awesome/scss/_fixed-width.scss → ...tatic/font-awesome/scss/_fixed-width.scss b/...tatic/font-awesome/scss/_fixed-width.scss → ...tatic/font-awesome/scss/_fixed-width.scss
diff --git a/...y/ui/static/font-awesome/scss/_icons.scss → ...r/ui/static/font-awesome/scss/_icons.scss b/...y/ui/static/font-awesome/scss/_icons.scss → ...r/ui/static/font-awesome/scss/_icons.scss
diff --git a/.../ui/static/font-awesome/scss/_larger.scss → .../ui/static/font-awesome/scss/_larger.scss b/.../ui/static/font-awesome/scss/_larger.scss → .../ui/static/font-awesome/scss/_larger.scss
diff --git a/...ay/ui/static/font-awesome/scss/_list.scss → ...er/ui/static/font-awesome/scss/_list.scss b/...ay/ui/static/font-awesome/scss/_list.scss → ...er/ui/static/font-awesome/scss/_list.scss
diff --git a/.../ui/static/font-awesome/scss/_mixins.scss → .../ui/static/font-awesome/scss/_mixins.scss b/.../ui/static/font-awesome/scss/_mixins.scss → .../ui/static/font-awesome/scss/_mixins.scss
diff --git a/...ay/ui/static/font-awesome/scss/_path.scss → ...er/ui/static/font-awesome/scss/_path.scss b/...ay/ui/static/font-awesome/scss/_path.scss → ...er/ui/static/font-awesome/scss/_path.scss
diff --git a/...c/font-awesome/scss/_rotated-flipped.scss → ...c/font-awesome/scss/_rotated-flipped.scss b/...c/font-awesome/scss/_rotated-flipped.scss → ...c/font-awesome/scss/_rotated-flipped.scss
diff --git a/...ui/static/font-awesome/scss/_stacked.scss → ...ui/static/font-awesome/scss/_stacked.scss b/...ui/static/font-awesome/scss/_stacked.scss → ...ui/static/font-awesome/scss/_stacked.scss
diff --git a/.../static/font-awesome/scss/_variables.scss → .../static/font-awesome/scss/_variables.scss b/.../static/font-awesome/scss/_variables.scss → .../static/font-awesome/scss/_variables.scss
diff --git a/...tatic/font-awesome/scss/font-awesome.scss → ...tatic/font-awesome/scss/font-awesome.scss b/...tatic/font-awesome/scss/font-awesome.scss → ...tatic/font-awesome/scss/font-awesome.scss
diff --git a/...ic/fonts/glyphicons-halflings-regular.eot → ...ic/fonts/glyphicons-halflings-regular.eot b/...ic/fonts/glyphicons-halflings-regular.eot → ...ic/fonts/glyphicons-halflings-regular.eot
diff --git a/...ic/fonts/glyphicons-halflings-regular.svg → ...ic/fonts/glyphicons-halflings-regular.svg b/...ic/fonts/glyphicons-halflings-regular.svg → ...ic/fonts/glyphicons-halflings-regular.svg
diff --git a/...ic/fonts/glyphicons-halflings-regular.ttf → ...ic/fonts/glyphicons-halflings-regular.ttf b/...ic/fonts/glyphicons-halflings-regular.ttf → ...ic/fonts/glyphicons-halflings-regular.ttf
diff --git a/...c/fonts/glyphicons-halflings-regular.woff → ...c/fonts/glyphicons-halflings-regular.woff b/...c/fonts/glyphicons-halflings-regular.woff → ...c/fonts/glyphicons-halflings-regular.woff
diff --git a/.../fonts/glyphicons-halflings-regular.woff2 → .../fonts/glyphicons-halflings-regular.woff2 b/.../fonts/glyphicons-halflings-regular.woff2 → .../fonts/glyphicons-halflings-regular.woff2
diff --git a/hemlock_highway/ui/static/img/bg.jpg → hemlock_highway/server/ui/static/img/bg.jpg b/hemlock_highway/ui/static/img/bg.jpg → hemlock_highway/server/ui/static/img/bg.jpg
diff --git a/hemlock_highway/ui/static/img/callout.jpg → ..._highway/server/ui/static/img/callout.jpg b/hemlock_highway/ui/static/img/callout.jpg → ..._highway/server/ui/static/img/callout.jpg
diff --git a/...ock_highway/ui/static/img/portfolio-1.jpg → ...hway/server/ui/static/img/portfolio-1.jpg b/...ock_highway/ui/static/img/portfolio-1.jpg → ...hway/server/ui/static/img/portfolio-1.jpg
diff --git a/...ock_highway/ui/static/img/portfolio-2.jpg → ...hway/server/ui/static/img/portfolio-2.jpg b/...ock_highway/ui/static/img/portfolio-2.jpg → ...hway/server/ui/static/img/portfolio-2.jpg
diff --git a/...ock_highway/ui/static/img/portfolio-3.jpg → ...hway/server/ui/static/img/portfolio-3.jpg b/...ock_highway/ui/static/img/portfolio-3.jpg → ...hway/server/ui/static/img/portfolio-3.jpg
diff --git a/...ock_highway/ui/static/img/portfolio-4.jpg → ...hway/server/ui/static/img/portfolio-4.jpg b/...ock_highway/ui/static/img/portfolio-4.jpg → ...hway/server/ui/static/img/portfolio-4.jpg
diff --git a/hemlock_highway/ui/static/js/bootstrap.js → ..._highway/server/ui/static/js/bootstrap.js b/hemlock_highway/ui/static/js/bootstrap.js → ..._highway/server/ui/static/js/bootstrap.js
diff --git a/...ock_highway/ui/static/js/bootstrap.min.js → ...hway/server/ui/static/js/bootstrap.min.js b/...ock_highway/ui/static/js/bootstrap.min.js → ...hway/server/ui/static/js/bootstrap.min.js
diff --git a/hemlock_highway/ui/static/js/jquery.js → ...ock_highway/server/ui/static/js/jquery.js b/hemlock_highway/ui/static/js/jquery.js → ...ock_highway/server/ui/static/js/jquery.js
diff --git a/hemlock_highway/ui/templates/index.html → ...ck_highway/server/ui/templates/index.html b/hemlock_highway/ui/templates/index.html → ...ck_highway/server/ui/templates/index.html
diff --git a/hemlock_highway/ui/views.py → hemlock_highway/server/ui/views.py b/hemlock_highway/ui/views.py → hemlock_highway/server/ui/views.py
@@ -4,7 +4,7 @@
 from flask import redirect, url_for, current_app, render_template
 from flask.blueprints import Blueprint
 from flask_dance.contrib.google import google
-from hemlock_highway.user_mgmt.user import User
+from hemlock_highway.server.user_mgmt.user import User
 
 MODULE_PATH = os.path.dirname(os.path.abspath(__file__))
 

diff --git a/hemlock_highway/user_mgmt/__init__.py → hemlock_highway/server/user_mgmt/__init__.py b/hemlock_highway/user_mgmt/__init__.py → hemlock_highway/server/user_mgmt/__init__.py
diff --git a/hemlock_highway/user_mgmt/auth.py → hemlock_highway/server/user_mgmt/auth.py b/hemlock_highway/user_mgmt/auth.py → hemlock_highway/server/user_mgmt/auth.py
@@ -1,7 +1,7 @@
 # -*- coding: utf-8 -*-
 
 from flask_dance.contrib.google import make_google_blueprint
-from hemlock_highway.config import Config
+from hemlock_highway.server.config import Config
 
 config = Config()
 

diff --git a/hemlock_highway/user_mgmt/user.py → hemlock_highway/server/user_mgmt/user.py b/hemlock_highway/user_mgmt/user.py → hemlock_highway/server/user_mgmt/user.py
diff --git a/hemlock_highway/settings.py b/hemlock_highway/settings.py
@@ -0,0 +1,17 @@
+# -*- coding: utf-8 -*-
+
+import os
+
+
+class ProjectConfig:
+
+    # Directories
+    REPO_ROOT_DIR = os.path.join(os.path.dirname(os.path.abspath(__file__)), '..')
+    HEMLOCK_HIGHWAY_MODULE_ROOT_DIR = os.path.join(REPO_ROOT_DIR, 'hemlock_highway')
+    TEST_ROOT_DIR = os.path.join(REPO_ROOT_DIR, 'tests')
+    TEST_DATA_DIR = os.path.join(TEST_ROOT_DIR, 'data')
+
+    AWS_REGION = 'eu-west-1'
+
+
+PROJECT_CONFIG = ProjectConfig()
diff --git a/tests/data/basic_integer_data.csv b/tests/data/basic_integer_data.csv
@@ -0,0 +1,8 @@
+col1,col2,target
+1,2,3
+2,3,5
+3,4,7
+4,5,9
+5,6,11
+6,7,13
+7,8,15
diff --git a/tests/test_data_manager/__init__.py b/tests/test_data_manager/__init__.py
diff --git a/tests/test_data_manager/test_data_manager.py b/tests/test_data_manager/test_data_manager.py
@@ -0,0 +1,58 @@
+# -*- coding: utf-8 -*-
+
+import os
+import unittest
+import moto
+
+import botocore.exceptions
+from .utils import fake_data_on_s3
+
+
+
+class DataManagerTestCase(unittest.TestCase):
+
+    def setUp(self):
+
+        # Test data directory
+        self.DATA_PATH = os.path.join(os.path.dirname(os.path.abspath(__file__)), '..', 'data')
+
+    @fake_data_on_s3(local_dataset='basic_integer_data.csv', bucket='test', key='data/basic.csv')
+    def test_basic_integer_data_load(self):
+        """
+        Test the basic loading of a dataset.
+        """
+        from hemlock_highway.data_manager import DataManager
+        dm = DataManager(data_endpoint='test/data/basic.csv', target_column='target')
+        self.assertFalse(dm._loaded, msg='DataManger should not load data on initialization! Reports it is loaded!')
+        dm.load()
+        self.assertTrue(dm._loaded, msg='After asking to load data, DataManager is reporting it is not loaded!')
+        self.assertTrue(dm.X.shape[0] > 0, msg='DataManager reports it is loaded, but does not have any data in X!')
+
+    @moto.mock_s3
+    def test_load_non_existant_data(self):
+        """
+        Test that a ClientError is raised when trying to load a non-existent dataset.
+        """
+        from hemlock_highway.data_manager import DataManager
+        dm = DataManager(data_endpoint='test/data/basic.csv', target_column='target')
+
+        # Should raise an exception when trying to load a dataset that doesn't exist.
+        with self.assertRaises(botocore.exceptions.ClientError):
+            dm.load()
+
+    def test_load_from_http(self):
+        """
+        Ensure dataloader can load a dataset via http
+        """
+        from hemlock_highway.data_manager import DataManager
+        dm = DataManager(
+            data_endpoint='https://raw.githubusercontent.com/uiuc-cse/data-fa14/gh-pages/data/iris.csv',
+            target_column='species'
+        )
+        dm.load()
+        self.assertTrue('petal_length' in dm.X.columns,
+                        msg=f'Expected "petal_length" to be in X, but found {dm.X.columns}')
+
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/tests/test_data_manager/utils.py b/tests/test_data_manager/utils.py
@@ -0,0 +1,19 @@
+# -*- coding: utf-8 -*-
+
+import os
+import boto3
+import moto
+from contextlib import contextmanager
+from hemlock_highway.settings import PROJECT_CONFIG
+
+
+@contextmanager
+def fake_data_on_s3(local_dataset, bucket, key):
+
+    with moto.mock_s3():
+        s3 = boto3.client('s3', region_name=PROJECT_CONFIG.AWS_REGION)
+        s3.create_bucket(Bucket=bucket)
+        with open(os.path.join(PROJECT_CONFIG.TEST_DATA_DIR, local_dataset), 'rb') as f:
+            s3.put_object(Bucket=bucket, Key=key, Body=f.read())
+
+        yield
diff --git a/tests/test_ml/__init__.py b/tests/test_ml/__init__.py
diff --git a/tests/test_models.py → tests/test_ml/test_models.py b/tests/test_models.py → tests/test_ml/test_models.py
diff --git a/tests/test_model_runner/__init__.py b/tests/test_model_runner/__init__.py
diff --git a/tests/test_server/__init__.py b/tests/test_server/__init__.py
diff --git a/tests/test_api_v1.py → tests/test_server/test_api_v1.py b/tests/test_api_v1.py → tests/test_server/test_api_v1.py
@@ -15,12 +15,19 @@ def setUp(self):
         self.app = app.test_client()
 
     def test_sanity(self):
-        resp = self.app.get('/echo?word=hello')
-        self.assertTrue(b'hello' in resp.data)
+        resp = self.app.get('/health-check')
+        self.assertTrue(resp.status_code == 200)
 
     def test_available_models(self):
         resp = self.app.get('/api/v1/available-models')
-        self.assertTrue(b'HemlockRandomForestClassifier' in resp.data)
+        models = json.loads(resp.data)
+
+        # Should return a list of strings, each the name of some valid model
+        self.assertTrue(isinstance(models, list))
+        self.assertTrue(isinstance(models[-1], str))
+
+        # Verify at least this known implemented model is in there.
+        self.assertTrue('HemlockRandomForestClassifier' in models)
 
     @moto.mock_s3
     def test_server_model_dump_load(self):

diff --git a/tests/test_user_mgmt.py → tests/test_server/test_user_mgmt.py b/tests/test_user_mgmt.py → tests/test_server/test_user_mgmt.py
@@ -2,7 +2,7 @@
 
 import unittest
 from hemlock_highway.server import app
-from tests.utils import fake_google_authenticated_user
+from tests.test_server.utils import fake_google_authenticated_user
 
 
 class UserMgmtTestCase(unittest.TestCase):

diff --git a/tests/utils.py → tests/test_server/utils.py b/tests/utils.py → tests/test_server/utils.py