diff --git a/demos/demos-v1.yaml b/demos/demos-v1.yaml index a9854db9..16e8f3bc 100644 --- a/demos/demos-v1.yaml +++ b/demos/demos-v1.yaml @@ -1,34 +1,23 @@ --- demos: - trino-taxi-data: - description: Demo loading 2.5 years of New York taxi data into S3 bucket, creating a Trino table and a Superset dashboard - documentation: https://docs.stackable.tech/stackablectl/stable/demos/trino-taxi-data.html - stackableStack: trino-superset-s3 + airflow-scheduled-job: + description: Activate a simple Airflow DAG to run continuously at a set interval + stackableStack: airflow labels: - - trino - - superset - - minio - - s3 - - ny-taxi-data + - airflow + - job-scheduling manifests: - - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/trino-taxi-data/load-test-data.yaml - - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/trino-taxi-data/create-table-in-trino.yaml - - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/trino-taxi-data/setup-superset.yaml - kafka-druid-water-level-data: - description: Demo ingesting water level data into Kafka, streaming it into Druid and creating a Superset dashboard - documentation: https://docs.stackable.tech/stackablectl/stable/demos/kafka-druid-water-level-data.html - stackableStack: kafka-druid-superset-s3 + - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/airflow-scheduled-job/enable-and-run-dag.yaml + hbase-hdfs-load-cycling-data: + description: Copy data from S3 bucket to an HBase table + stackableStack: hdfs-hbase labels: - - kafka - - druid - - superset - - minio - - s3 - - water-levels + - hbase + - hdfs + - cycling-tripdata manifests: - - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/kafka-druid-water-level-data/ingest-test-data.yaml - - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/kafka-druid-water-level-data/create-druid-ingestion-job.yaml - - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/kafka-druid-water-level-data/setup-superset.yaml + - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/hbase-hdfs-load-cycling-data/01-distcp-cycling-data.yaml + - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/hbase-hdfs-load-cycling-data/02-create-hfile-and-import-to-hbase.yaml nifi-kafka-druid-earthquake-data: description: Demo ingesting earthquake data into Kafka using NiFi, streaming it into Druid and creating a Superset dashboard documentation: https://docs.stackable.tech/stackablectl/stable/demos/nifi-kafka-druid-earthquake-data.html @@ -45,21 +34,33 @@ demos: - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/nifi-kafka-druid-earthquake-data/create-nifi-ingestion-job.yaml - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/nifi-kafka-druid-earthquake-data/create-druid-ingestion-job.yaml - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/nifi-kafka-druid-earthquake-data/setup-superset.yaml - hbase-hdfs-load-cycling-data: - description: Copy data from S3 bucket to an HBase table - stackableStack: hdfs-hbase + nifi-kafka-druid-water-level-data: + description: Demo ingesting water level data into Kafka using NiFi, streaming it into Druid and creating a Superset dashboard + documentation: https://docs.stackable.tech/stackablectl/stable/demos/nifi-kafka-druid-water-level-data.html + stackableStack: nifi-kafka-druid-superset-s3 labels: - - hbase - - hdfs - - cycling-tripdata + - nifi + - kafka + - druid + - superset + - minio + - s3 + - water-levels manifests: - - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/hbase-hdfs-load-cycling-data/01-distcp-cycling-data.yaml - - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/hbase-hdfs-load-cycling-data/02-create-hfile-and-import-to-hbase.yaml - airflow-scheduled-job: - description: Activate a simple Airflow DAG to run continously at a set interval - stackableStack: airflow + - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/nifi-kafka-druid-water-level-data/create-nifi-ingestion-job.yaml # TODO + - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/nifi-kafka-druid-water-level-data/create-druid-ingestion-job.yaml # TODO + - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/nifi-kafka-druid-water-level-data/setup-superset.yaml # TODO + trino-taxi-data: + description: Demo loading 2.5 years of New York taxi data into S3 bucket, creating a Trino table and a Superset dashboard + documentation: https://docs.stackable.tech/stackablectl/stable/demos/trino-taxi-data.html + stackableStack: trino-superset-s3 labels: - - airflow - - job-scheduling + - trino + - superset + - minio + - s3 + - ny-taxi-data manifests: - - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/airflow-scheduled-job/enable-and-run-dag.yaml \ No newline at end of file + - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/trino-taxi-data/load-test-data.yaml + - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/trino-taxi-data/create-table-in-trino.yaml + - plainYaml: https://raw.githubusercontent.com/stackabletech/stackablectl/main/demos/trino-taxi-data/setup-superset.yaml diff --git a/demos/hbase-hdfs-load-cycling-data/01-distcp-cycling-data.yaml b/demos/hbase-hdfs-load-cycling-data/01-distcp-cycling-data.yaml index 40da3092..4f9a9bd0 100644 --- a/demos/hbase-hdfs-load-cycling-data/01-distcp-cycling-data.yaml +++ b/demos/hbase-hdfs-load-cycling-data/01-distcp-cycling-data.yaml @@ -6,11 +6,6 @@ metadata: spec: template: spec: - restartPolicy: OnFailure - volumes: - - name: config-volume-hdfs - configMap: - name: hdfs containers: - name: distcp-cycling-data image: docker.stackable.tech/stackable/hadoop:3.3.3-stackable0.1.0 @@ -19,10 +14,10 @@ spec: value: "/stackable/conf/hdfs" - name: HADOOP_HOME value: "/stackable/hadoop" - - name: HADOOP_CLASSPATH # no hadoop_classpath env available in container. Need to add classpath + /stackable/hadoop-3.3.3/share/hadoop/tools/lib/hadoop-aws-3.3.3.jar + /stackable/hadoop-3.3.3/share/hadoop/tools/lib/aws-java-sdk-bundle-1.11.1026.jar - value: "/stackable/hadoop/etc/hadoop:/stackable/hadoop/share/hadoop/common/lib/kerby-config-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/jaxb-api-2.2.11.jar:/stackable/hadoop/share/hadoop/common/lib/javax.servlet-api-3.1.0.jar:/stackable/hadoop/share/hadoop/common/lib/commons-daemon-1.0.13.jar:/stackable/hadoop/share/hadoop/common/lib/jackson-jaxrs-1.9.13.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-client-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/reload4j-1.2.18.3.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-http-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/avro-1.7.7.jar:/stackable/hadoop/share/hadoop/common/lib/re2j-1.1.jar:/stackable/hadoop/share/hadoop/common/lib/jsch-0.1.55.jar:/stackable/hadoop/share/hadoop/common/lib/jackson-core-2.13.2.jar:/stackable/hadoop/share/hadoop/common/lib/hadoop-auth-3.3.3.jar:/stackable/hadoop/share/hadoop/common/lib/animal-sniffer-annotations-1.17.jar:/stackable/hadoop/share/hadoop/common/lib/jersey-json-1.19.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-identity-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-simplekdc-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/commons-io-2.8.0.jar:/stackable/hadoop/share/hadoop/common/lib/protobuf-java-2.5.0.jar:/stackable/hadoop/share/hadoop/common/lib/jcip-annotations-1.0-1.jar:/stackable/hadoop/share/hadoop/common/lib/woodstox-core-5.3.0.jar:/stackable/hadoop/share/hadoop/common/lib/jaxb-impl-2.2.3-1.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-server-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/zookeeper-3.5.6.jar:/stackable/hadoop/share/hadoop/common/lib/commons-lang3-3.12.0.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-common-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/jsr311-api-1.1.1.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-crypto-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-util-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/accessors-smart-2.4.7.jar:/stackable/hadoop/share/hadoop/common/lib/commons-logging-1.1.3.jar:/stackable/hadoop/share/hadoop/common/lib/jersey-core-1.19.jar:/stackable/hadoop/share/hadoop/common/lib/paranamer-2.3.jar:/stackable/hadoop/share/hadoop/common/lib/hadoop-annotations-3.3.3.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-security-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/commons-text-1.4.jar:/stackable/hadoop/share/hadoop/common/lib/gson-2.8.9.jar:/stackable/hadoop/share/hadoop/common/lib/asm-5.0.4.jar:/stackable/hadoop/share/hadoop/common/lib/jersey-servlet-1.19.jar:/stackable/hadoop/share/hadoop/common/lib/commons-math3-3.1.1.jar:/stackable/hadoop/share/hadoop/common/lib/listenablefuture-9999.0-empty-to-avoid-conflict-with-guava.jar:/stackable/hadoop/share/hadoop/common/lib/kerby-pkix-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/netty-3.10.6.Final.jar:/stackable/hadoop/share/hadoop/common/lib/jul-to-slf4j-1.7.36.jar:/stackable/hadoop/share/hadoop/common/lib/curator-recipes-4.2.0.jar:/stackable/hadoop/share/hadoop/common/lib/hadoop-shaded-guava-1.1.1.jar:/stackable/hadoop/share/hadoop/common/lib/kerby-xdr-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/httpcore-4.4.13.jar:/stackable/hadoop/share/hadoop/common/lib/jackson-mapper-asl-1.9.13.jar:/stackable/hadoop/share/hadoop/common/lib/curator-client-4.2.0.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-util-ajax-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/kerby-asn1-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/commons-configuration2-2.1.1.jar:/stackable/hadoop/share/hadoop/common/lib/commons-net-3.6.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-servlet-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-xml-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/kerby-util-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-io-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/commons-compress-1.21.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-server-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/commons-collections-3.2.2.jar:/stackable/hadoop/share/hadoop/common/lib/j2objc-annotations-1.1.jar:/stackable/hadoop/share/hadoop/common/lib/jackson-xc-1.9.13.jar:/stackable/hadoop/share/hadoop/common/lib/jersey-server-1.19.jar:/stackable/hadoop/share/hadoop/common/lib/httpclient-4.5.13.jar:/stackable/hadoop/share/hadoop/common/lib/stax2-api-4.2.1.jar:/stackable/hadoop/share/hadoop/common/lib/jettison-1.1.jar:/stackable/hadoop/share/hadoop/common/lib/curator-framework-4.2.0.jar:/stackable/hadoop/share/hadoop/common/lib/guava-27.0-jre.jar:/stackable/hadoop/share/hadoop/common/lib/dnsjava-2.1.7.jar:/stackable/hadoop/share/hadoop/common/lib/jackson-annotations-2.13.2.jar:/stackable/hadoop/share/hadoop/common/lib/commons-beanutils-1.9.4.jar:/stackable/hadoop/share/hadoop/common/lib/audience-annotations-0.5.0.jar:/stackable/hadoop/share/hadoop/common/lib/jackson-databind-2.13.2.2.jar:/stackable/hadoop/share/hadoop/common/lib/failureaccess-1.0.jar:/stackable/hadoop/share/hadoop/common/lib/hadoop-shaded-protobuf_3_7-1.1.1.jar:/stackable/hadoop/share/hadoop/common/lib/json-smart-2.4.7.jar:/stackable/hadoop/share/hadoop/common/lib/snappy-java-1.1.8.2.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-core-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/jakarta.activation-api-1.2.1.jar:/stackable/hadoop/share/hadoop/common/lib/jsr305-3.0.2.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-admin-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/token-provider-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-util-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/slf4j-reload4j-1.7.36.jar:/stackable/hadoop/share/hadoop/common/lib/zookeeper-jute-3.5.6.jar:/stackable/hadoop/share/hadoop/common/lib/nimbus-jose-jwt-9.8.1.jar:/stackable/hadoop/share/hadoop/common/lib/slf4j-api-1.7.36.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-webapp-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/jackson-core-asl-1.9.13.jar:/stackable/hadoop/share/hadoop/common/lib/jsp-api-2.1.jar:/stackable/hadoop/share/hadoop/common/lib/metrics-core-3.2.4.jar:/stackable/hadoop/share/hadoop/common/lib/checker-qual-2.5.2.jar:/stackable/hadoop/share/hadoop/common/lib/commons-codec-1.15.jar:/stackable/hadoop/share/hadoop/common/lib/commons-cli-1.2.jar:/stackable/hadoop/share/hadoop/common/hadoop-nfs-3.3.3.jar:/stackable/hadoop/share/hadoop/common/hadoop-kms-3.3.3.jar:/stackable/hadoop/share/hadoop/common/hadoop-common-3.3.3-tests.jar:/stackable/hadoop/share/hadoop/common/hadoop-common-3.3.3.jar:/stackable/hadoop/share/hadoop/common/hadoop-registry-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs:/stackable/hadoop/share/hadoop/hdfs/lib/kerby-config-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jaxb-api-2.2.11.jar:/stackable/hadoop/share/hadoop/hdfs/lib/javax.servlet-api-3.1.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-daemon-1.0.13.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jackson-jaxrs-1.9.13.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-client-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/reload4j-1.2.18.3.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-http-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/avro-1.7.7.jar:/stackable/hadoop/share/hadoop/hdfs/lib/re2j-1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jsch-0.1.55.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jackson-core-2.13.2.jar:/stackable/hadoop/share/hadoop/hdfs/lib/hadoop-auth-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs/lib/animal-sniffer-annotations-1.17.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jersey-json-1.19.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-identity-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-simplekdc-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-io-2.8.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/protobuf-java-2.5.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jcip-annotations-1.0-1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/okhttp-2.7.5.jar:/stackable/hadoop/share/hadoop/hdfs/lib/woodstox-core-5.3.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jaxb-impl-2.2.3-1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-server-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/zookeeper-3.5.6.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-lang3-3.12.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-common-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jsr311-api-1.1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-crypto-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-util-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/accessors-smart-2.4.7.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-logging-1.1.3.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jersey-core-1.19.jar:/stackable/hadoop/share/hadoop/hdfs/lib/paranamer-2.3.jar:/stackable/hadoop/share/hadoop/hdfs/lib/hadoop-annotations-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-security-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-text-1.4.jar:/stackable/hadoop/share/hadoop/hdfs/lib/gson-2.8.9.jar:/stackable/hadoop/share/hadoop/hdfs/lib/asm-5.0.4.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jersey-servlet-1.19.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-math3-3.1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/listenablefuture-9999.0-empty-to-avoid-conflict-with-guava.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerby-pkix-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/netty-3.10.6.Final.jar:/stackable/hadoop/share/hadoop/hdfs/lib/curator-recipes-4.2.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/hadoop-shaded-guava-1.1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerby-xdr-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/httpcore-4.4.13.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jackson-mapper-asl-1.9.13.jar:/stackable/hadoop/share/hadoop/hdfs/lib/leveldbjni-all-1.8.jar:/stackable/hadoop/share/hadoop/hdfs/lib/curator-client-4.2.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-util-ajax-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerby-asn1-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-configuration2-2.1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-net-3.6.jar:/stackable/hadoop/share/hadoop/hdfs/lib/okio-1.6.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-servlet-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-xml-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerby-util-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-io-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-compress-1.21.jar:/stackable/hadoop/share/hadoop/hdfs/lib/netty-all-4.1.68.Final.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-server-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-collections-3.2.2.jar:/stackable/hadoop/share/hadoop/hdfs/lib/j2objc-annotations-1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jackson-xc-1.9.13.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jersey-server-1.19.jar:/stackable/hadoop/share/hadoop/hdfs/lib/httpclient-4.5.13.jar:/stackable/hadoop/share/hadoop/hdfs/lib/stax2-api-4.2.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jettison-1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/curator-framework-4.2.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/guava-27.0-jre.jar:/stackable/hadoop/share/hadoop/hdfs/lib/dnsjava-2.1.7.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jackson-annotations-2.13.2.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-beanutils-1.9.4.jar:/stackable/hadoop/share/hadoop/hdfs/lib/audience-annotations-0.5.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jackson-databind-2.13.2.2.jar:/stackable/hadoop/share/hadoop/hdfs/lib/json-simple-1.1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/failureaccess-1.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/hadoop-shaded-protobuf_3_7-1.1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/json-smart-2.4.7.jar:/stackable/hadoop/share/hadoop/hdfs/lib/snappy-java-1.1.8.2.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-core-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jakarta.activation-api-1.2.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jsr305-3.0.2.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-admin-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/token-provider-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-util-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/zookeeper-jute-3.5.6.jar:/stackable/hadoop/share/hadoop/hdfs/lib/nimbus-jose-jwt-9.8.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-webapp-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jackson-core-asl-1.9.13.jar:/stackable/hadoop/share/hadoop/hdfs/lib/checker-qual-2.5.2.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-codec-1.15.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-cli-1.2.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-nfs-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-httpfs-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-rbf-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-native-client-3.3.3-tests.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-native-client-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-3.3.3-tests.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-client-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-rbf-3.3.3-tests.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-client-3.3.3-tests.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-jobclient-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-nativetask-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-core-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-shuffle-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-examples-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-jobclient-3.3.3-tests.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-hs-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-hs-plugins-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-app-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-uploader-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-common-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn:/stackable/hadoop/share/hadoop/yarn/lib/jersey-client-1.19.jar:/stackable/hadoop/share/hadoop/yarn/lib/jetty-jndi-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/json-io-2.5.1.jar:/stackable/hadoop/share/hadoop/yarn/lib/jackson-jaxrs-json-provider-2.13.2.jar:/stackable/hadoop/share/hadoop/yarn/lib/snakeyaml-1.26.jar:/stackable/hadoop/share/hadoop/yarn/lib/javax.websocket-api-1.0.jar:/stackable/hadoop/share/hadoop/yarn/lib/swagger-annotations-1.5.4.jar:/stackable/hadoop/share/hadoop/yarn/lib/asm-analysis-9.1.jar:/stackable/hadoop/share/hadoop/yarn/lib/jackson-module-jaxb-annotations-2.13.2.jar:/stackable/hadoop/share/hadoop/yarn/lib/javax-websocket-client-impl-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/jetty-client-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/jakarta.xml.bind-api-2.3.3.jar:/stackable/hadoop/share/hadoop/yarn/lib/fst-2.50.jar:/stackable/hadoop/share/hadoop/yarn/lib/ehcache-3.3.1.jar:/stackable/hadoop/share/hadoop/yarn/lib/objenesis-2.6.jar:/stackable/hadoop/share/hadoop/yarn/lib/websocket-servlet-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/websocket-api-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/bcprov-jdk15on-1.60.jar:/stackable/hadoop/share/hadoop/yarn/lib/bcpkix-jdk15on-1.60.jar:/stackable/hadoop/share/hadoop/yarn/lib/asm-commons-9.1.jar:/stackable/hadoop/share/hadoop/yarn/lib/jetty-plus-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/geronimo-jcache_1.0_spec-1.0-alpha-1.jar:/stackable/hadoop/share/hadoop/yarn/lib/jackson-jaxrs-base-2.13.2.jar:/stackable/hadoop/share/hadoop/yarn/lib/javax.ws.rs-api-2.1.1.jar:/stackable/hadoop/share/hadoop/yarn/lib/HikariCP-java7-2.4.12.jar:/stackable/hadoop/share/hadoop/yarn/lib/jersey-guice-1.19.jar:/stackable/hadoop/share/hadoop/yarn/lib/java-util-1.9.0.jar:/stackable/hadoop/share/hadoop/yarn/lib/asm-tree-9.1.jar:/stackable/hadoop/share/hadoop/yarn/lib/websocket-client-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/jline-3.9.0.jar:/stackable/hadoop/share/hadoop/yarn/lib/guice-4.0.jar:/stackable/hadoop/share/hadoop/yarn/lib/mssql-jdbc-6.2.1.jre7.jar:/stackable/hadoop/share/hadoop/yarn/lib/javax.inject-1.jar:/stackable/hadoop/share/hadoop/yarn/lib/jna-5.2.0.jar:/stackable/hadoop/share/hadoop/yarn/lib/javax-websocket-server-impl-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/websocket-server-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/guice-servlet-4.0.jar:/stackable/hadoop/share/hadoop/yarn/lib/jetty-annotations-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/aopalliance-1.0.jar:/stackable/hadoop/share/hadoop/yarn/lib/javax.websocket-client-api-1.0.jar:/stackable/hadoop/share/hadoop/yarn/lib/metrics-core-3.2.4.jar:/stackable/hadoop/share/hadoop/yarn/lib/websocket-common-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-applications-distributedshell-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-services-core-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-api-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-applications-unmanaged-am-launcher-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-timeline-pluginstorage-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-web-proxy-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-common-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-resourcemanager-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-applications-mawo-core-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-services-api-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-client-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-applicationhistoryservice-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-tests-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-sharedcachemanager-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-router-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-registry-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-common-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-nodemanager-3.3.3.jar:/stackable/hadoop-3.3.3/share/hadoop/tools/lib/hadoop-aws-3.3.3.jar:/stackable/hadoop-3.3.3/share/hadoop/tools/lib/aws-java-sdk-bundle-1.11.1026.jar" - name: HADOOP_USER_NAME value: "stackable" + - name: HADOOP_CLASSPATH # no hadoop_classpath env available in container. Need to add classpath + /stackable/hadoop-3.3.3/share/hadoop/tools/lib/hadoop-aws-3.3.3.jar + /stackable/hadoop-3.3.3/share/hadoop/tools/lib/aws-java-sdk-bundle-1.11.1026.jar + value: "/stackable/hadoop/etc/hadoop:/stackable/hadoop/share/hadoop/common/lib/kerby-config-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/jaxb-api-2.2.11.jar:/stackable/hadoop/share/hadoop/common/lib/javax.servlet-api-3.1.0.jar:/stackable/hadoop/share/hadoop/common/lib/commons-daemon-1.0.13.jar:/stackable/hadoop/share/hadoop/common/lib/jackson-jaxrs-1.9.13.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-client-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/reload4j-1.2.18.3.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-http-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/avro-1.7.7.jar:/stackable/hadoop/share/hadoop/common/lib/re2j-1.1.jar:/stackable/hadoop/share/hadoop/common/lib/jsch-0.1.55.jar:/stackable/hadoop/share/hadoop/common/lib/jackson-core-2.13.2.jar:/stackable/hadoop/share/hadoop/common/lib/hadoop-auth-3.3.3.jar:/stackable/hadoop/share/hadoop/common/lib/animal-sniffer-annotations-1.17.jar:/stackable/hadoop/share/hadoop/common/lib/jersey-json-1.19.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-identity-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-simplekdc-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/commons-io-2.8.0.jar:/stackable/hadoop/share/hadoop/common/lib/protobuf-java-2.5.0.jar:/stackable/hadoop/share/hadoop/common/lib/jcip-annotations-1.0-1.jar:/stackable/hadoop/share/hadoop/common/lib/woodstox-core-5.3.0.jar:/stackable/hadoop/share/hadoop/common/lib/jaxb-impl-2.2.3-1.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-server-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/zookeeper-3.5.6.jar:/stackable/hadoop/share/hadoop/common/lib/commons-lang3-3.12.0.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-common-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/jsr311-api-1.1.1.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-crypto-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-util-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/accessors-smart-2.4.7.jar:/stackable/hadoop/share/hadoop/common/lib/commons-logging-1.1.3.jar:/stackable/hadoop/share/hadoop/common/lib/jersey-core-1.19.jar:/stackable/hadoop/share/hadoop/common/lib/paranamer-2.3.jar:/stackable/hadoop/share/hadoop/common/lib/hadoop-annotations-3.3.3.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-security-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/commons-text-1.4.jar:/stackable/hadoop/share/hadoop/common/lib/gson-2.8.9.jar:/stackable/hadoop/share/hadoop/common/lib/asm-5.0.4.jar:/stackable/hadoop/share/hadoop/common/lib/jersey-servlet-1.19.jar:/stackable/hadoop/share/hadoop/common/lib/commons-math3-3.1.1.jar:/stackable/hadoop/share/hadoop/common/lib/listenablefuture-9999.0-empty-to-avoid-conflict-with-guava.jar:/stackable/hadoop/share/hadoop/common/lib/kerby-pkix-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/netty-3.10.6.Final.jar:/stackable/hadoop/share/hadoop/common/lib/jul-to-slf4j-1.7.36.jar:/stackable/hadoop/share/hadoop/common/lib/curator-recipes-4.2.0.jar:/stackable/hadoop/share/hadoop/common/lib/hadoop-shaded-guava-1.1.1.jar:/stackable/hadoop/share/hadoop/common/lib/kerby-xdr-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/httpcore-4.4.13.jar:/stackable/hadoop/share/hadoop/common/lib/jackson-mapper-asl-1.9.13.jar:/stackable/hadoop/share/hadoop/common/lib/curator-client-4.2.0.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-util-ajax-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/kerby-asn1-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/commons-configuration2-2.1.1.jar:/stackable/hadoop/share/hadoop/common/lib/commons-net-3.6.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-servlet-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-xml-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/kerby-util-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-io-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/commons-compress-1.21.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-server-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/commons-collections-3.2.2.jar:/stackable/hadoop/share/hadoop/common/lib/j2objc-annotations-1.1.jar:/stackable/hadoop/share/hadoop/common/lib/jackson-xc-1.9.13.jar:/stackable/hadoop/share/hadoop/common/lib/jersey-server-1.19.jar:/stackable/hadoop/share/hadoop/common/lib/httpclient-4.5.13.jar:/stackable/hadoop/share/hadoop/common/lib/stax2-api-4.2.1.jar:/stackable/hadoop/share/hadoop/common/lib/jettison-1.1.jar:/stackable/hadoop/share/hadoop/common/lib/curator-framework-4.2.0.jar:/stackable/hadoop/share/hadoop/common/lib/guava-27.0-jre.jar:/stackable/hadoop/share/hadoop/common/lib/dnsjava-2.1.7.jar:/stackable/hadoop/share/hadoop/common/lib/jackson-annotations-2.13.2.jar:/stackable/hadoop/share/hadoop/common/lib/commons-beanutils-1.9.4.jar:/stackable/hadoop/share/hadoop/common/lib/audience-annotations-0.5.0.jar:/stackable/hadoop/share/hadoop/common/lib/jackson-databind-2.13.2.2.jar:/stackable/hadoop/share/hadoop/common/lib/failureaccess-1.0.jar:/stackable/hadoop/share/hadoop/common/lib/hadoop-shaded-protobuf_3_7-1.1.1.jar:/stackable/hadoop/share/hadoop/common/lib/json-smart-2.4.7.jar:/stackable/hadoop/share/hadoop/common/lib/snappy-java-1.1.8.2.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-core-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/jakarta.activation-api-1.2.1.jar:/stackable/hadoop/share/hadoop/common/lib/jsr305-3.0.2.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-admin-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/token-provider-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/kerb-util-1.0.1.jar:/stackable/hadoop/share/hadoop/common/lib/slf4j-reload4j-1.7.36.jar:/stackable/hadoop/share/hadoop/common/lib/zookeeper-jute-3.5.6.jar:/stackable/hadoop/share/hadoop/common/lib/nimbus-jose-jwt-9.8.1.jar:/stackable/hadoop/share/hadoop/common/lib/slf4j-api-1.7.36.jar:/stackable/hadoop/share/hadoop/common/lib/jetty-webapp-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/common/lib/jackson-core-asl-1.9.13.jar:/stackable/hadoop/share/hadoop/common/lib/jsp-api-2.1.jar:/stackable/hadoop/share/hadoop/common/lib/metrics-core-3.2.4.jar:/stackable/hadoop/share/hadoop/common/lib/checker-qual-2.5.2.jar:/stackable/hadoop/share/hadoop/common/lib/commons-codec-1.15.jar:/stackable/hadoop/share/hadoop/common/lib/commons-cli-1.2.jar:/stackable/hadoop/share/hadoop/common/hadoop-nfs-3.3.3.jar:/stackable/hadoop/share/hadoop/common/hadoop-kms-3.3.3.jar:/stackable/hadoop/share/hadoop/common/hadoop-common-3.3.3-tests.jar:/stackable/hadoop/share/hadoop/common/hadoop-common-3.3.3.jar:/stackable/hadoop/share/hadoop/common/hadoop-registry-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs:/stackable/hadoop/share/hadoop/hdfs/lib/kerby-config-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jaxb-api-2.2.11.jar:/stackable/hadoop/share/hadoop/hdfs/lib/javax.servlet-api-3.1.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-daemon-1.0.13.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jackson-jaxrs-1.9.13.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-client-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/reload4j-1.2.18.3.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-http-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/avro-1.7.7.jar:/stackable/hadoop/share/hadoop/hdfs/lib/re2j-1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jsch-0.1.55.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jackson-core-2.13.2.jar:/stackable/hadoop/share/hadoop/hdfs/lib/hadoop-auth-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs/lib/animal-sniffer-annotations-1.17.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jersey-json-1.19.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-identity-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-simplekdc-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-io-2.8.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/protobuf-java-2.5.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jcip-annotations-1.0-1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/okhttp-2.7.5.jar:/stackable/hadoop/share/hadoop/hdfs/lib/woodstox-core-5.3.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jaxb-impl-2.2.3-1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-server-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/zookeeper-3.5.6.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-lang3-3.12.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-common-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jsr311-api-1.1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-crypto-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-util-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/accessors-smart-2.4.7.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-logging-1.1.3.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jersey-core-1.19.jar:/stackable/hadoop/share/hadoop/hdfs/lib/paranamer-2.3.jar:/stackable/hadoop/share/hadoop/hdfs/lib/hadoop-annotations-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-security-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-text-1.4.jar:/stackable/hadoop/share/hadoop/hdfs/lib/gson-2.8.9.jar:/stackable/hadoop/share/hadoop/hdfs/lib/asm-5.0.4.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jersey-servlet-1.19.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-math3-3.1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/listenablefuture-9999.0-empty-to-avoid-conflict-with-guava.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerby-pkix-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/netty-3.10.6.Final.jar:/stackable/hadoop/share/hadoop/hdfs/lib/curator-recipes-4.2.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/hadoop-shaded-guava-1.1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerby-xdr-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/httpcore-4.4.13.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jackson-mapper-asl-1.9.13.jar:/stackable/hadoop/share/hadoop/hdfs/lib/leveldbjni-all-1.8.jar:/stackable/hadoop/share/hadoop/hdfs/lib/curator-client-4.2.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-util-ajax-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerby-asn1-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-configuration2-2.1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-net-3.6.jar:/stackable/hadoop/share/hadoop/hdfs/lib/okio-1.6.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-servlet-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-xml-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerby-util-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-io-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-compress-1.21.jar:/stackable/hadoop/share/hadoop/hdfs/lib/netty-all-4.1.68.Final.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-server-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-collections-3.2.2.jar:/stackable/hadoop/share/hadoop/hdfs/lib/j2objc-annotations-1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jackson-xc-1.9.13.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jersey-server-1.19.jar:/stackable/hadoop/share/hadoop/hdfs/lib/httpclient-4.5.13.jar:/stackable/hadoop/share/hadoop/hdfs/lib/stax2-api-4.2.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jettison-1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/curator-framework-4.2.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/guava-27.0-jre.jar:/stackable/hadoop/share/hadoop/hdfs/lib/dnsjava-2.1.7.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jackson-annotations-2.13.2.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-beanutils-1.9.4.jar:/stackable/hadoop/share/hadoop/hdfs/lib/audience-annotations-0.5.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jackson-databind-2.13.2.2.jar:/stackable/hadoop/share/hadoop/hdfs/lib/json-simple-1.1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/failureaccess-1.0.jar:/stackable/hadoop/share/hadoop/hdfs/lib/hadoop-shaded-protobuf_3_7-1.1.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/json-smart-2.4.7.jar:/stackable/hadoop/share/hadoop/hdfs/lib/snappy-java-1.1.8.2.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-core-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jakarta.activation-api-1.2.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jsr305-3.0.2.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-admin-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/token-provider-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/kerb-util-1.0.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/zookeeper-jute-3.5.6.jar:/stackable/hadoop/share/hadoop/hdfs/lib/nimbus-jose-jwt-9.8.1.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jetty-webapp-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/hdfs/lib/jackson-core-asl-1.9.13.jar:/stackable/hadoop/share/hadoop/hdfs/lib/checker-qual-2.5.2.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-codec-1.15.jar:/stackable/hadoop/share/hadoop/hdfs/lib/commons-cli-1.2.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-nfs-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-httpfs-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-rbf-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-native-client-3.3.3-tests.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-native-client-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-3.3.3-tests.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-client-3.3.3.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-rbf-3.3.3-tests.jar:/stackable/hadoop/share/hadoop/hdfs/hadoop-hdfs-client-3.3.3-tests.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-jobclient-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-nativetask-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-core-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-shuffle-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-examples-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-jobclient-3.3.3-tests.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-hs-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-hs-plugins-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-app-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-uploader-3.3.3.jar:/stackable/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-client-common-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn:/stackable/hadoop/share/hadoop/yarn/lib/jersey-client-1.19.jar:/stackable/hadoop/share/hadoop/yarn/lib/jetty-jndi-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/json-io-2.5.1.jar:/stackable/hadoop/share/hadoop/yarn/lib/jackson-jaxrs-json-provider-2.13.2.jar:/stackable/hadoop/share/hadoop/yarn/lib/snakeyaml-1.26.jar:/stackable/hadoop/share/hadoop/yarn/lib/javax.websocket-api-1.0.jar:/stackable/hadoop/share/hadoop/yarn/lib/swagger-annotations-1.5.4.jar:/stackable/hadoop/share/hadoop/yarn/lib/asm-analysis-9.1.jar:/stackable/hadoop/share/hadoop/yarn/lib/jackson-module-jaxb-annotations-2.13.2.jar:/stackable/hadoop/share/hadoop/yarn/lib/javax-websocket-client-impl-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/jetty-client-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/jakarta.xml.bind-api-2.3.3.jar:/stackable/hadoop/share/hadoop/yarn/lib/fst-2.50.jar:/stackable/hadoop/share/hadoop/yarn/lib/ehcache-3.3.1.jar:/stackable/hadoop/share/hadoop/yarn/lib/objenesis-2.6.jar:/stackable/hadoop/share/hadoop/yarn/lib/websocket-servlet-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/websocket-api-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/bcprov-jdk15on-1.60.jar:/stackable/hadoop/share/hadoop/yarn/lib/bcpkix-jdk15on-1.60.jar:/stackable/hadoop/share/hadoop/yarn/lib/asm-commons-9.1.jar:/stackable/hadoop/share/hadoop/yarn/lib/jetty-plus-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/geronimo-jcache_1.0_spec-1.0-alpha-1.jar:/stackable/hadoop/share/hadoop/yarn/lib/jackson-jaxrs-base-2.13.2.jar:/stackable/hadoop/share/hadoop/yarn/lib/javax.ws.rs-api-2.1.1.jar:/stackable/hadoop/share/hadoop/yarn/lib/HikariCP-java7-2.4.12.jar:/stackable/hadoop/share/hadoop/yarn/lib/jersey-guice-1.19.jar:/stackable/hadoop/share/hadoop/yarn/lib/java-util-1.9.0.jar:/stackable/hadoop/share/hadoop/yarn/lib/asm-tree-9.1.jar:/stackable/hadoop/share/hadoop/yarn/lib/websocket-client-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/jline-3.9.0.jar:/stackable/hadoop/share/hadoop/yarn/lib/guice-4.0.jar:/stackable/hadoop/share/hadoop/yarn/lib/mssql-jdbc-6.2.1.jre7.jar:/stackable/hadoop/share/hadoop/yarn/lib/javax.inject-1.jar:/stackable/hadoop/share/hadoop/yarn/lib/jna-5.2.0.jar:/stackable/hadoop/share/hadoop/yarn/lib/javax-websocket-server-impl-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/websocket-server-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/guice-servlet-4.0.jar:/stackable/hadoop/share/hadoop/yarn/lib/jetty-annotations-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/lib/aopalliance-1.0.jar:/stackable/hadoop/share/hadoop/yarn/lib/javax.websocket-client-api-1.0.jar:/stackable/hadoop/share/hadoop/yarn/lib/metrics-core-3.2.4.jar:/stackable/hadoop/share/hadoop/yarn/lib/websocket-common-9.4.43.v20210629.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-applications-distributedshell-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-services-core-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-api-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-applications-unmanaged-am-launcher-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-timeline-pluginstorage-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-web-proxy-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-common-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-resourcemanager-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-applications-mawo-core-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-services-api-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-client-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-applicationhistoryservice-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-tests-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-sharedcachemanager-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-router-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-registry-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-common-3.3.3.jar:/stackable/hadoop/share/hadoop/yarn/hadoop-yarn-server-nodemanager-3.3.3.jar:/stackable/hadoop-3.3.3/share/hadoop/tools/lib/hadoop-aws-3.3.3.jar:/stackable/hadoop-3.3.3/share/hadoop/tools/lib/aws-java-sdk-bundle-1.11.1026.jar" command: ["bash", "-c", "bin/hdfs dfs -mkdir -p /data/raw \ && bin/hadoop distcp -D fs.s3a.aws.credentials.provider=org.apache.hadoop.fs.s3a.AnonymousAWSCredentialsProvider \ s3a://public-backup-nyc-tlc/cycling-tripdata/demo-cycling-tripdata.csv.gz \ @@ -30,3 +25,9 @@ spec: volumeMounts: - name: config-volume-hdfs mountPath: /stackable/conf/hdfs + volumes: + - name: config-volume-hdfs + configMap: + name: hdfs + restartPolicy: OnFailure + backoffLimit: 50 diff --git a/demos/hbase-hdfs-load-cycling-data/02-create-hfile-and-import-to-hbase.yaml b/demos/hbase-hdfs-load-cycling-data/02-create-hfile-and-import-to-hbase.yaml index 70c89f66..79f625da 100644 --- a/demos/hbase-hdfs-load-cycling-data/02-create-hfile-and-import-to-hbase.yaml +++ b/demos/hbase-hdfs-load-cycling-data/02-create-hfile-and-import-to-hbase.yaml @@ -6,7 +6,6 @@ metadata: spec: template: spec: - restartPolicy: OnFailure containers: - name: create-hfile-and-import-to-hbase image: docker.stackable.tech/stackable/hbase:2.4.12-stackable0.2.0 @@ -43,3 +42,5 @@ spec: - name: config-volume-hdfs configMap: name: hdfs + restartPolicy: OnFailure + backoffLimit: 50 diff --git a/demos/kafka-druid-water-level-data/ingest-test-data.yaml b/demos/kafka-druid-water-level-data/ingest-test-data.yaml deleted file mode 100644 index 848d1ec5..00000000 --- a/demos/kafka-druid-water-level-data/ingest-test-data.yaml +++ /dev/null @@ -1,96 +0,0 @@ ---- -apiVersion: batch/v1 -kind: Job -metadata: - name: ingest-test-data -spec: - template: - spec: - containers: - - name: ingest-test-data - image: docker.stackable.tech/stackable/testing-tools:0.1.0-stackable0.1.0 - command: ["bash", "-c", "python -u /tmp/script/script.py"] - volumeMounts: - - name: script - mountPath: /tmp/script - restartPolicy: OnFailure - volumes: - - name: script - configMap: - name: ingest-test-data-script - restartPolicy: Never - backoffLimit: 50 # It can take some time until Kafka is ready ---- -apiVersion: v1 -kind: ConfigMap -metadata: - name: ingest-test-data-script -data: - script.py: | - import json - from kafka3 import KafkaProducer - import pandas as pd - import time - - HISTORY_DAYS = 31 - # At a maximum scrape once every minute. - # In practice it will take longer than a minute to scrape, so the loop will be busy. - # This will result in a continuos stream of data. - LIVE_UPDATE_INTERVAL_S = 60 - - BOOTSTRAP_SERVERS = "kafka:9092" # For local testing / developing replace it, afterwards change back to kafka:9092 - STATIONS_TOPIC = "stations" - MEASUREMENTS_TOPIC = "measurements" - - print(f"Producing station records to topic {STATIONS_TOPIC} with bootstrap servers {BOOTSTRAP_SERVERS}\n") - producer = KafkaProducer(bootstrap_servers=BOOTSTRAP_SERVERS) - - stations = pd.read_json("https://www.pegelonline.wsv.de/webservices/rest-api/v2/stations.json") - print(f"Stations:\n{stations}") - for station in stations.index: - station_json = stations.loc[station].to_json() - producer.send(STATIONS_TOPIC, str.encode(station_json)) - - print(f"Producing measurement records of the last {HISTORY_DAYS} days to topic {MEASUREMENTS_TOPIC} with bootstrap servers {BOOTSTRAP_SERVERS}\n") - - # Using separate loop to first send stations and the measurements afterwards - for station in stations.index: - station = stations.loc[station] - station_uuid = station["uuid"] - url = f"https://www.pegelonline.wsv.de/webservices/rest-api/v2/stations/{station_uuid}/W/measurements.json?start=P{HISTORY_DAYS}D" - try: - measurements = pd.read_json(url) - except Exception as err: - print(f"[WARN] Could not read measurements for station {station['longname']} ({station_uuid}): {err}") - continue - measurements['station_uuid'] = station_uuid - for measurement in measurements.index: - measurement_json = measurements.loc[measurement].to_json() - producer.send(MEASUREMENTS_TOPIC, str.encode(measurement_json)) - - print(f"Send {len(measurements)} measurements for station {station['longname']}") - - - print(f"Finished loading {HISTORY_DAYS} days of historic data, now starting live streaming") - while True: - starttime = time.time() - measurement_counter = 0 - measurement_failed_counter = 0 - for station_uuid in stations["uuid"]: - url = f"https://www.pegelonline.wsv.de/webservices/rest-api/v2/stations/{station_uuid}/W/currentmeasurement.json" - try: - measurement = pd.read_json(url, typ='series') - except Exception as err: - measurement_failed_counter += 1 - continue - - measurement = { - "timestamp": int(time.time() * 1000), - "value": measurement["value"], - "station_uuid": station_uuid - } - measurement_json = json.dumps(measurement, separators=(',', ':')) - producer.send(MEASUREMENTS_TOPIC, str.encode(measurement_json)) - measurement_counter += 1 - print(f"Send {measurement_counter} measurements in {int(time.time() - starttime)}s ({measurement_failed_counter} failed)") - time.sleep(max(0, LIVE_UPDATE_INTERVAL_S - ((time.time() - starttime)))) diff --git a/demos/nifi-kafka-druid-earthquake-data/create-druid-ingestion-job.yaml b/demos/nifi-kafka-druid-earthquake-data/create-druid-ingestion-job.yaml index 0cb3173a..c1dce1e3 100644 --- a/demos/nifi-kafka-druid-earthquake-data/create-druid-ingestion-job.yaml +++ b/demos/nifi-kafka-druid-earthquake-data/create-druid-ingestion-job.yaml @@ -13,13 +13,12 @@ spec: volumeMounts: - name: ingestion-job-spec mountPath: /tmp/ingestion-job-spec - restartPolicy: OnFailure volumes: - name: ingestion-job-spec configMap: name: create-druid-ingestion-job-spec - restartPolicy: Never - backoffLimit: 50 # It can take some time until Druid is ready + restartPolicy: OnFailure + backoffLimit: 50 --- apiVersion: v1 kind: ConfigMap diff --git a/demos/nifi-kafka-druid-earthquake-data/create-nifi-ingestion-job.yaml b/demos/nifi-kafka-druid-earthquake-data/create-nifi-ingestion-job.yaml index 9f659183..d5abf9da 100644 --- a/demos/nifi-kafka-druid-earthquake-data/create-nifi-ingestion-job.yaml +++ b/demos/nifi-kafka-druid-earthquake-data/create-nifi-ingestion-job.yaml @@ -18,13 +18,12 @@ spec: valueFrom: fieldRef: fieldPath: metadata.namespace - restartPolicy: OnFailure volumes: - name: script configMap: name: create-nifi-ingestion-job-script - restartPolicy: Never - backoffLimit: 50 # It can take some time until NiFI is ready + restartPolicy: OnFailure + backoffLimit: 50 --- apiVersion: v1 kind: ConfigMap diff --git a/demos/nifi-kafka-druid-earthquake-data/setup-superset.yaml b/demos/nifi-kafka-druid-earthquake-data/setup-superset.yaml index ae198611..8dd7ed98 100644 --- a/demos/nifi-kafka-druid-earthquake-data/setup-superset.yaml +++ b/demos/nifi-kafka-druid-earthquake-data/setup-superset.yaml @@ -13,13 +13,12 @@ spec: volumeMounts: - name: script mountPath: /tmp/script - restartPolicy: OnFailure volumes: - name: script configMap: name: setup-superset-script - restartPolicy: Never - backoffLimit: 50 # It can take some time until Superset is ready + restartPolicy: OnFailure + backoffLimit: 50 --- apiVersion: v1 kind: ConfigMap diff --git a/demos/nifi-kafka-druid-water-level-data/IngestWaterLevelsToKafka.xml b/demos/nifi-kafka-druid-water-level-data/IngestWaterLevelsToKafka.xml new file mode 100644 index 00000000..87a599e6 --- /dev/null +++ b/demos/nifi-kafka-druid-water-level-data/IngestWaterLevelsToKafka.xml @@ -0,0 +1,4317 @@ + +