# test_maven_emr.py
from moto import mock_emr
import mock
from rudra.deployments.emr_scripts.maven_emr import MavenEMR
class MockEMRConfig(mock.Mock):
    """Mock stand-in for ``EMRConfig`` that serves a fixed configuration.

    Because it subclasses ``mock.Mock``, any attribute or call not defined
    here is answered by the usual auto-created mock machinery; only
    ``get_config`` has a concrete implementation.
    """

    def __init__(self, *args, **kwargs):
        """Forward all arguments unchanged to ``mock.Mock``."""
        super().__init__(*args, **kwargs)

    def get_config(self):
        """Return a freshly built dict of hard-coded job-flow settings.

        NOTE(review): the keys look like keyword arguments for an EMR
        "run job flow" request -- confirm against the real ``EMRConfig``.
        """
        instances = {
            'InstanceCount': 1,
            'KeepJobFlowAliveWhenNoSteps': True,
            'MasterInstanceType': 'c3.medium',
            'Placement': {'AvailabilityZone': 'us-east-1a'},
            'SlaveInstanceType': 'c3.xlarge',
        }
        return {
            'Instances': instances,
            'JobFlowRole': 'EMR_EC2_DefaultRole',
            'LogUri': 's3://fake_bucket/log',
            'Name': 'HPF_training',
            'ServiceRole': 'EMR_DefaultRole',
            'VisibleToAllUsers': True,
        }
class TestMavenEMR:
    """Tests for ``MavenEMR`` run under moto's ``mock_emr`` decorator."""

    @mock.patch('rudra.deployments.emr_scripts.maven_emr.EMRConfig', new_callable=MockEMRConfig)
    @mock.patch.dict('os.environ', {'AWS_S3_ACCESS_KEY_ID': 'fake_id',
                                    'AWS_S3_SECRET_ACCESS_KEY': 'fake_secret'})
    @mock_emr
    def test_run_job(self, _emr_config_mocked):
        """Submit one job and check the response and the reported job state.

        ``EMRConfig`` inside ``maven_emr`` is replaced by ``MockEMRConfig``
        and fake AWS credentials are placed in ``os.environ`` for the
        duration of the test. The patched object is injected as
        ``_emr_config_mocked`` but is not inspected here.
        """
        emr_runner = MavenEMR()
        job_request = {
            'environment': 'dev',
            'data_version': '2019-01-01',
            'bucket_name': 'fake_bucket',
            'hyper_params': {'key1': 'value1', 'key2': 'value2'},
            'github_repo': 'https://github.com/fabric8-analytics/f8a-hpf-insights',
        }

        response = emr_runner.run_job(job_request)

        # The submission itself must report HTTP 200.
        metadata = response.get('ResponseMetadata', {})
        http_status = metadata.get('HTTPStatusCode')
        assert http_status == 200

        # A non-empty job flow id is required to query the status below.
        flow_id = response.get('JobFlowId')
        assert flow_id

        status = emr_runner.aws_emr.get_status(flow_id)
        assert status.get('State') == 'WAITING'