<!--
#  Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
#
#    Licensed under the Apache License, Version 2.0 (the "License").
#    You may not use this file except in compliance with the License.
#    You may obtain a copy of the License at
#
#        http://www.apache.org/licenses/LICENSE-2.0
#
#    Unless required by applicable law or agreed to in writing, software
#    distributed under the License is distributed on an "AS IS" BASIS,
#    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
#    See the License for the specific language governing permissions and
#    limitations under the License.
-->

# Sample notebook to build a Jupyter Image with Spark Kernel.

## Content
1. [Configuration](#Configuration)
2. [Build Image](#Build-Image)
3. [Running Container using the profile](#Running-container)


### Configuration

In [None]:
# Notebook-wide settings.
#   image_name  -> used for the ECR repository name and passed to `orbit build image -n`
#   folder_name -> sample sub-folder the notebook changes into and builds from
#   profile_name -> not referenced by the cells below; kept for reference
folder_name = "spark"
image_name = "spark"
profile_name = "spark"

### Build Image

Let's see how `orbit build image` works:

In [None]:
# Print the CLI help for `orbit build image`.
!orbit build image --help

Get our Orbit environment, team, user, and namespace names from the environment variables:

In [None]:
# Read the Orbit context from the kernel's environment variables.
env_name = %env AWS_ORBIT_ENV
team_name = %env AWS_ORBIT_TEAM_SPACE
user_name = %env USERNAME
namespace = %env AWS_ORBIT_USER_SPACE
# Display the values that were read.
(env_name,team_name, user_name, namespace)

The repository name is built from the image name, prefixed by the environment context. Users can only manipulate ECR repositories whose names start with `orbit-{env_name}/users/`.

In [None]:
# ECR repository for the image, in the form "orbit-<env>/users/<image>".
repository_name = "orbit-{}/users/{}".format(env_name, image_name)
repository_name

In [None]:
# Delete the repository if it already exists; --force also removes any images in it.
# NOTE(review): presumably this fails harmlessly when the repository does not exist yet - confirm.
!aws ecr delete-repository --repository-name $repository_name --force

In [None]:
# Change into this sample's folder (selected by `folder_name`).
%cd ~/shared/samples/notebooks/I-Image/$folder_name

Adding a file to our Docker image as an example:

In [None]:
# Remember the current directory; it is passed to `orbit build image -d`
# and used as the `sourcePath` of the notebook run later on.
pwd = %pwd
pwd

Now let's run the build command:

In [None]:
%%time

# Build the image from the directory in `pwd` and keep the command's output
# lines in `output` so the image address can be parsed from them afterwards.
output = !orbit build image -e $env_name -d $pwd -n $image_name
output

Let's get the image address from the output of the previous command:

In [None]:
# Extract the ECR image address from the build log captured in `output`.
# If several lines carry the marker, the last one wins.
look_for = 'ECR Image Address='
image = None
for o in output:
    if look_for in o:
        # Keep everything after the marker; strip stray whitespace so the
        # address can be embedded as-is in the podsetting manifest.
        image = o[o.index(look_for) + len(look_for):].strip()
        print(image)

# Fail when the marker was never found (None) or the address after it is empty.
assert image, f"'{look_for}' not found in the build output"
    

In [None]:
# check that the image was built
import json
print(repository_name)
images = !aws ecr list-images --repository-name $repository_name
images = "".join(images)
im = json.loads(images)
print(im['imageIds'])
assert(len(im['imageIds']) > 0)

### Building the podsetting for the Image

In [None]:
import json

# Name shared by the PodSetting resource, its pod-selector label key,
# and (later) the `my-jobid` label of the job.
customname = f"orbit-custom-spark-image-{team_name}"

# PodSetting manifest template; the {placeholders} are filled by str.format
# at write time.
podsetting_template = """
    kind: PodSetting
    apiVersion: orbit.aws/v1
    metadata:
      labels:
        orbit/env: {env_name}
        orbit/space: team
        orbit/team: {team_name}
      name: {customname}
      namespace: {team_name}
    spec:
      containerSelector:
        jsonpath: metadata.labels.app
      desc: SPARK Custom Image example {customname}
      env:
        - name: custom_name
          value: custom_value
      image: >-
        {image}
      podSelector:
        matchExpressions:
          - key: orbit/{customname}
            operator: Exists
      resources:
        limits:
          cpu: '1.0'
          memory: 1Gi
        requests:
          cpu: '1.0'
          memory: 1Gi
      securityContext:
        runAsUser: 1000
    """

# Render the template and write it next to the notebook.
with open("podsetting_spark.yaml", "w") as file:
    file.write(
        podsetting_template.format(
            env_name=env_name,
            team_name=team_name,
            customname=customname,
            image=image,
        )
    )


In [None]:
# Apply the generated PodSetting manifest in the team namespace.
!kubectl apply -f podsetting_spark.yaml -n {team_name}

### Running container 

Let's run a container using the profile and image we created.

In [None]:
import json

# Compute section: selects the custom podsetting and labels the job with
# `my-jobid` so it can be selected by label afterwards.
compute = {
    "container": {"p_concurrent": "1"},
    "node_type": "ec2",
    "podsetting": customname,
    "labels": {"my-jobid": customname},
}

# Single task: run test-image.ipynb, taking it from the current sample directory.
task = {
    "notebookName": "test-image.ipynb",
    "sourcePath": pwd,
    "targetPath": f"/home/jovyan/shared/regression/notebooks/I-Image/{folder_name}",
    "params": {},
}

run = {"compute": compute, "tasks": [task]}

# Persist the run description for `orbit run notebook`.
with open("run.json", "w") as f:
    json.dump(run, f)

In [None]:
%%time

# Submit the run described in run.json, passing --wait and --tail-logs.
# NOTE(review): the user is hard-coded to "testing" although `user_name` was
# read from the environment earlier - confirm this is intended.
!orbit run notebook --env $env_name --team $team_name --user testing --wait --tail-logs run.json

# Clean up: delete the job(s) carrying the `my-jobid` label set in run.json.
!kubectl delete job -l my-jobid={customname}

# Clean up: delete the PodSetting.
# NOTE(review): the PodSetting was applied with `-n {team_name}` but is deleted
# here with `-n {namespace}` (AWS_ORBIT_USER_SPACE) - confirm the namespace.
!kubectl delete podsetting {customname} -n {namespace}