Skip to content

tspannhw/ScyllaFLiPSTheStream

main
Switch branches/tags

Name already in use

A tag already exists with the provided branch name. Many Git commands accept both tag and branch names, so creating this branch may cause unexpected behavior. Are you sure you want to create this branch?
Code

Latest commit

 

Git stats

Files

Permalink
Failed to load latest commit information.
Type
Name
Latest commit message
Commit time
December 12, 2021 15:37
December 12, 2021 15:37
February 7, 2022 07:59
December 17, 2021 16:32
December 14, 2021 10:21
March 15, 2022 14:38
December 14, 2021 09:40
December 13, 2021 15:19
December 14, 2021 10:47
December 13, 2021 09:56
December 14, 2021 10:39
December 14, 2021 21:04
December 14, 2021 10:18

ScyllaFLiPSTheStream

Scylla FLiPS The Stream With Apache Pulsar

Create on Ubuntu

sudo systemctl start docker
docker run --name devscylla --hostname devscylla -d scylladb/scylla --smp 1
docker container restart devscylla
docker ps
docker logs devscylla  | tail
docker exec -it devscylla nodetool status

bin/pulsar-admin sinks stop --name scylla-test-sink --namespace default --tenant public

bin/pulsar-admin sinks delete --tenant public --namespace default --name scylla-test-sink

bin/pulsar-admin topics create persistent://public/default/chatresult2

bin/pulsar-admin sinks create --tenant public --namespace default --name "scylla-test-sink" --sink-type cassandra --sink-config-file conf/scylla.yml --inputs chatresult2


HTML

CSS/JS


<link rel="stylesheet" type="text/css" href="https://cdn.datatables.net/v/dt/jszip-2.5.0/dt-1.11.3/b-2.1.1/b-html5-2.1.1/b-print-2.1.1/cr-1.5.5/date-1.1.1/sc-2.0.5/datatables.min.css"/>
 
<script type="text/javascript" src="https://cdnjs.cloudflare.com/ajax/libs/pdfmake/0.1.36/pdfmake.min.js"></script>
<script type="text/javascript" src="https://cdnjs.cloudflare.com/ajax/libs/pdfmake/0.1.36/vfs_fonts.js"></script>
<script type="text/javascript" src="https://cdn.datatables.net/v/dt/jszip-2.5.0/dt-1.11.3/b-2.1.1/b-html5-2.1.1/b-print-2.1.1/cr-1.5.5/date-1.1.1/sc-2.0.5/datatables.min.js"></script>

Info

bin/pulsar-client consume "persistent://public/default/scyllacdcsource" -s "cdcreader" -n 0

ScyllaDB Queries

docker exec -it devscylla cqlsh

CREATE KEYSPACE pulsar_test_keyspace WITH replication = {'class':'SimpleStrategy', 'replication_factor':1};


use pulsar_test_keyspace;

 CREATE TABLE pulsar_test_table (key text PRIMARY KEY, col text);

desc pulsar_test_keyspace;

cqlsh:pulsar_test_keyspace> select col from pulsar_test_table where key like '%NiFi%' ALLOW FILTERING;

 col
-----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
                                                           {"id": "(10109,17,-1,-1)", "sentiment": "Positive", "userInfo": "StreamNative Blog User 5000", "comment": "Apache Spark, Apache Pulsar, Apache NiFi and Apache Flink are awesome projects.", "contactInfo": "Tim Spann, Developer Advocate @ StreamNative"}
                                                                                                                {"id": "(10109,19,-1,-1)", "sentiment": "Positive", "userInfo": "Tim Spann", "comment": "Apache Spark, Apache Pulsar, Apache NiFi and Apache Flink are awesome projects.", "contactInfo": "tim@spark"}
                                                                                                                {"id": "(10109,22,-1,-1)", "sentiment": "Positive", "userInfo": "Tim Spann", "comment": "Apache Spark, Apache Pulsar, Apache NiFi and Apache Flink are awesome projects.", "contactInfo": "tim@spark"}
  {"id": "(4518,1,-1,-1)", "sentiment": "Positive", "userInfo": "Tim Spann", "comment": "We all know that Apache Pulsar along with Apache Flink, Apache Spark, Apache NiFi and Scylla DB are the best options for modern streaming data applications.", "contactInfo": "Tim Spann, Developer Advocate @ StreamNative"}
                                                                                                                {"id": "(10109,18,-1,-1)", "sentiment": "Positive", "userInfo": "Tim Spann", "comment": "Apache Spark, Apache Pulsar, Apache NiFi and Apache Flink are awesome projects.", "contactInfo": "tim@spark"}
                                                                                                                {"id": "(10109,20,-1,-1)", "sentiment": "Positive", "userInfo": "Tim Spann", "comment": "Apache Spark, Apache Pulsar, Apache NiFi and Apache Flink are awesome projects.", "contactInfo": "tim@spark"}
                                                                                                                           {"id": "(4518,5,-1,-1)", "sentiment": "Positive", "userInfo": "Tim Spann", "comment": "Scylla\nApache Pulsar\nApache Flink\nApache Spark\nApache NiFi", "contactInfo": "NYC Pulsar Meetup"}
 {"id": "(4518,2,-1,-1)", "sentiment": "Positive", "userInfo": "Tim Spann", "comment": "We all know that Apache Pulsar along with Apache Flink, Apache Spark, Apache NiFi and Scylla DB are the best options for modern streaming data applications.", "contactInfo": "Tim Spann - Developer Advocate @ StreamNative"}
                                                                                                                {"id": "(10109,21,-1,-1)", "sentiment": "Positive", "userInfo": "Tim Spann", "comment": "Apache Spark, Apache Pulsar, Apache NiFi and Apache Flink are awesome projects.", "contactInfo": "tim@spark"}
  {"id": "(4518,0,-1,-1)", "sentiment": "Positive", "userInfo": "Tim Spann", "comment": "We all know that Apache Pulsar along with Apache Flink, Apache Spark, Apache NiFi and Scylla DB are the best options for modern streaming data applications.", "contactInfo": "Tim Spann, Developer Advocate @ StreamNative"}
                                                           {"id": "(10109,16,-1,-1)", "sentiment": "Positive", "userInfo": "StreamNative Blog User 5000", "comment": "Apache Spark, Apache Pulsar, Apache NiFi and Apache Flink are awesome projects.", "contactInfo": "Tim Spann, Developer Advocate @ StreamNative"}

---MORE--- 
(11 rows)
cqlsh:pulsar_test_keyspace> select col from pulsar_test_table where key like '%matrix%' ALLOW FILTERING;

 col
------------------------------------------------------------------------------------------------------------------------------
 {"id": "(10109,23,-1,-1)", "sentiment": "Neutral", "userInfo": "Tim Spann", "comment": "matrix", "contactInfo": "tim@spark"}

---MORE--- 

cqlsh:pulsar_test_keyspace> desc pulsar_test_table;

CREATE TABLE pulsar_test_keyspace.pulsar_test_table (
    key text PRIMARY KEY,
    col text
) WITH bloom_filter_fp_chance = 0.01
    AND caching = {'keys': 'ALL', 'rows_per_partition': 'ALL'}
    AND comment = ''
    AND compaction = {'class': 'SizeTieredCompactionStrategy'}
    AND compression = {'sstable_compression': 'org.apache.cassandra.io.compress.LZ4Compressor'}
    AND crc_check_chance = 1.0
    AND dclocal_read_repair_chance = 0.0
    AND default_time_to_live = 0
    AND gc_grace_seconds = 864000
    AND max_index_interval = 2048
    AND memtable_flush_period_in_ms = 0
    AND min_index_interval = 128
    AND read_repair_chance = 0.0
    AND speculative_retry = '99.0PERCENTILE';
CREATE INDEX pulsar_test_table_col_idx ON pulsar_test_keyspace.pulsar_test_table (col);

CREATE MATERIALIZED VIEW pulsar_test_keyspace.pulsar_test_table_col_idx_index AS
    SELECT col, idx_token, key
    FROM pulsar_test_keyspace.pulsar_test_table
    WHERE col IS NOT NULL
    PRIMARY KEY (col, idx_token, key)
    WITH CLUSTERING ORDER BY (idx_token ASC, key ASC)
    AND bloom_filter_fp_chance = 0.01
    AND caching = {'keys': 'ALL', 'rows_per_partition': 'ALL'}
    AND comment = ''
    AND compaction = {'class': 'SizeTieredCompactionStrategy'}
    AND compression = {'sstable_compression': 'org.apache.cassandra.io.compress.LZ4Compressor'}
    AND crc_check_chance = 1.0
    AND dclocal_read_repair_chance = 0.0
    AND default_time_to_live = 0
    AND gc_grace_seconds = 864000
    AND max_index_interval = 2048
    AND memtable_flush_period_in_ms = 0
    AND min_index_interval = 128
    AND read_repair_chance = 0.0
    AND speculative_retry = '99.0PERCENTILE';

ALTER TABLE pulsar_test_keyspace.pulsar_test_table WITH cdc = {'postimage': 'false', 'preimage': 'false', 'ttl': '86400', 'enabled': 'true', 'delta': 'full'};

Reference

About

Scylla FLiPS The Stream With Apache Pulsar

Resources

License

Stars

Watchers

Forks

Releases

No releases published

Packages

No packages published