# Sintetic Software Used  To Analysis of Cassandra's Performance

## Imports

In [1]:
from cassandra.cluster import Cluster
from cassandra.auth import PlainTextAuthProvider
import time

## Database configuration

### Database Structure
<pre>+-----------------------+ 
|        table          |
+-----------------------+
| A0 | UUID        |    |
| A1 | INT         | PK |
| A2 | BIGINT      |    |
| A3 | DOUBLE      |    |
| A4 | VARCHAR(26) |    |
| A5 | TEXT        |    |
| A6 | DATE        |    |
| A7 | TIMESTAMP   |    |
+-----------------------+</pre>

In [2]:
cluster = Cluster(['localhost'], auth_provider=PlainTextAuthProvider('cassandra', 'cassandra'))
session = cluster.connect()

# Set User
# session.execute('ALTER USER cassandra WITH PASSWORD \'cassandra\'')

# Create KeySpace
session.execute('CREATE KEYSPACE IF NOT EXISTS analysis WITH replication = {\'class\': \'SimpleStrategy\', \'replication_factor\': 1}')

# Use KeySpace created
session.set_keyspace('analysis')

# Create Table
session.execute("CREATE TABLE IF NOT EXISTS \"table\" ("+
                "A0 uuid, "+
                "A1 int PRIMARY KEY, "+
                "A2 bigint, "+
                "A3 double, "+
                "A4 varchar, "+
                "A5 text, "+
                "A6 date, "+
                "A7 timestamp )")
rows = session.execute('select * from system_schema.columns')
print('+----------------------------------+')
print('|              table               |')
print('+----------------------------------+')
for row in rows:
    if row.table_name == 'table':
        print('|', row.column_name, '|', row.type, ' '*(9-len(row.type)), '|',  row.kind, ' '*(13-len(row.kind)), '|')
print('+----------------------------------+')

+----------------------------------+
|              table               |
+----------------------------------+
| a0 | uuid       | regular        |
| a1 | int        | partition_key  |
| a2 | bigint     | regular        |
| a3 | double     | regular        |
| a4 | text       | regular        |
| a5 | text       | regular        |
| a6 | date       | regular        |
| a7 | timestamp  | regular        |
+----------------------------------+


## Meta data

* R is the number of iterations <br />
* BI is the size of a block of insertions<br />
* BU is the size of a block of updates<br />
* BS is the size of a block of selections<br />

In [3]:
R = 60
BI = BU = BS = 500000
control = 1

## Definition of functions

In [4]:
def insert(control):
    initialTime = time.time()
    for i in range(BI):
        session.execute('INSERT INTO "table" (A0, A1, A2, A3, A4, A5, A6, A7) VALUES ('+
                        'uuid(), '+
                        str(control)+', '+
                        '9223372036854775807, '+
                        '1.2, '+
                        '\'abcdefghijklmnopqrstuvwxy\', '+
                        '\'Lorem ipsum dolor sit amet, consectetur adipiscing elit. Integer ultricies lorem metus, vel finibus risus convallis sit amet. Nam auctor ex et ipsum euismod, vel consectetur eros blandit. Sed sit amet enim vitae nisi varius molestie. Maecenas in tortor sem. Ut sit amet lobortis erat, ac egestas libero. Nunc id purus sodales, dictum massa gravida, condimentum diam. Maecenas eu vulputate nunc, vitae tempor odio. Orci varius natoque penatibus et magnis dis parturient montes, nascetur ridiculus mus. Duis vitae turpis quam. Maecenas at dui at justo vehicula scelerisque eu in eros. Sed volutpat, magna nec pretium tincidunt, risus nibh posuere mauris, quis feugiat augue lorem ut nunc. Lorem ipsum dolor sit amet, consectetur adipiscing elit. In eu tellus nec nulla ultricies efficitur. Interdum et malesuada fames ac ante ipsum primis in faucibus. \', '+
                        'toDate(dateof(now())), '+
                        'dateof(now())'+
                        ')')
        control += 1
    return (time.time() - initialTime), control

In [5]:
def update(control):
    initialTime = time.time()
    for i in range(BI):
        session.execute('UPDATE "table" SET '+
                        'A2 = 9223372036854775800, '+
                        'A3 = 1.3, '+
                        'A4 = \'abbdefghijklmnopqrstuvwxy\', '+
                        'A5 = \'Lorem ipsum dolor site amet, consectetur adipiscing elit. Integer ultricies lorem metus, vel finibus risus convallis sit amet. Nam auctor ex et ipsum euismod, vel consectetur eros blandit. Sed sit amet enim vitae nisi varius molestie. Maecenas in tortor sem. Ut sit amet lobortis erat, ac egestas libero. Nunc id purus sodales, dictum massa gravida, condimentum diam. Maecenas eu vulputate nunc, vitae tempor odio. Orci varius natoque penatibus et magnis dis parturient montes, nascetur ridiculus mus. Duis vitae turpis quam. Maecenas at dui at justo vehicula scelerisque eu in eros. Sed volutpat, magna nec pretium tincidunt, risus nibh posuere mauris, quis feugiat augue lorem ut nunc. Lorem ipsum dolor sit amet, consectetur adipiscing elit. In eu tellus nec nulla ultricies efficitur. Interdum et malesuada fames ac ante ipsum primis in faucibus. \', '+
                        'A6 = toDate(dateof(now())), '+
                        'A7 = dateof(now())'+
                        'WHERE A1 = '+str(control))
        control += 1
    return (time.time() - initialTime), control

In [6]:
def select(control):
    initialTime = time.time()
    for i in range(BI):
        session.execute('SELECT * FROM "table" WHERE A1 = '+str(control))
        control += 1
    return (time.time() - initialTime), control

## Storage

In [7]:
insertTimes = []
updateTimes = []
selectTimes = []

## DO IT

In [8]:
for j in range(R):
    t, control = insert(control)
    insertTimes.append(t)
    print('Insert', insertTimes)
for j in range(R):
    t, control = update(control)
    updateTimes.append(t)
    print('Update', updateTimes)
for j in range(R):
    t, control = select(control)
    selectTimes.append(t)
    print('Select', selectTimes)

UnboundLocalError: local variable 'control' referenced before assignment

## Insert Times

In [None]:
print(insertTimes)

## Update Times

In [None]:
print(updateTimes)

## Select Times

In [None]:
print(selectTimes)