In [1]:
# Import required packages
import pymongo
from pymongo import MongoClient
import pandas as pd
from pprint import pprint
from time import sleep
from json import dumps
from kafka import KafkaProducer
import random
import datetime as dt

In [2]:
# Load the TERRA hotspot records that the producer samples from.
# The path is relative, so the CSV is resolved against the current working directory.
hotspotTERRA = pd.read_csv(filepath_or_buffer='hotspot_TERRA_streaming.csv')

In [3]:
def publish_message(producer_instance, topic_name, data, timeout=10):
    """Send one record to a Kafka topic and report the outcome on stdout.

    Parameters
    ----------
    producer_instance : object
        Producer whose ``send(topic, value=...)`` returns a future-like
        object exposing ``get(timeout=...)`` (as ``KafkaProducer`` does).
    topic_name : str
        Topic the record is published to.
    data : object
        Payload handed to the producer as the record value.
    timeout : float, optional
        Seconds to wait for the delivery result before treating the publish
        as failed. Defaults to 10.

    Returns
    -------
    None
        Success or failure is only printed; exceptions are not re-raised.
    """
    try:
        pending = producer_instance.send(topic_name, value=data)
        # send() only queues the record. Waiting on the future makes delivery
        # errors surface here instead of a premature success message.
        pending.get(timeout=timeout)
        print('Message published successfully. Data: ' + str(data))
    except Exception as ex:
        print('Exception in publishing message.')
        print(str(ex))

In [4]:
def connect_kafka_producer(bootstrap_servers=None):
    """Create a Kafka producer that JSON-encodes record values.

    Parameters
    ----------
    bootstrap_servers : list of str, optional
        Broker addresses passed to ``KafkaProducer``. When omitted,
        ``['localhost:9092']`` is used.

    Returns
    -------
    KafkaProducer or None
        The producer, or ``None`` when construction raised an ``Exception``
        (the error text is printed rather than re-raised).
    """
    if bootstrap_servers is None:
        bootstrap_servers = ['localhost:9092']
    try:
        # Values are serialised with json.dumps, whose default output is
        # ASCII-only, so the 'ascii' encode cannot fail on non-ASCII text.
        return KafkaProducer(bootstrap_servers=bootstrap_servers,
                             value_serializer=lambda x: dumps(x).encode('ascii'),
                             api_version=(0, 10))
    except Exception as ex:
        print('Exception while connecting Kafka.')
        print(str(ex))
        # Deliberately not returning from a ``finally`` clause: that would
        # also swallow KeyboardInterrupt / SystemExit raised while connecting.
        return None

In [None]:
if __name__ == '__main__':
    # Kafka topic the simulated hotspot readings are published to
    topic = 'hotspot_TERRA_streaming'

    print('Publishing records..')
    producer = connect_kafka_producer()
    if producer is None:
        # Without a producer every publish attempt would fail, and the loop
        # below would just print the same error every 10-30 seconds forever.
        print('No Kafka producer available; nothing will be published.')
    else:
        try:
            while True:
                # Select a random row
                row_index = random.randrange(hotspotTERRA.shape[0])
                # Get current time (strftime already returns a str)
                created_time = dt.datetime.now().strftime("%d/%m/%Y %H-%M-%S")
                # Turn the row into a dictionary of floats
                message = hotspotTERRA.iloc[row_index].astype('float').to_dict()
                # Add sender ID to dictionary
                message["sender_id"] = 3
                # Add current time information to the dictionary
                message["created_time"] = created_time
                # Publish message
                publish_message(producer, topic, message)
                # Stream every 10-30 seconds
                sleep(random.randint(10, 30))
        except KeyboardInterrupt:
            # Interrupting the kernel is the intended way to stop streaming
            print('stop publishing records')
        finally:
            # Close the producer on any exit path so it is not left open
            # after an interrupt or an unexpected error.
            producer.close()

Publishing records..
Message published successfully. Data: {'sender_id': 3, 'latitude': -36.7771, 'surface_temperature_celcius': 54.0, 'longitude': 143.5148, 'confidence': 81.0, 'created_time': '23/05/2019 22-15-28'}
Message published successfully. Data: {'sender_id': 3, 'latitude': -36.3452, 'surface_temperature_celcius': 42.0, 'longitude': 145.8969, 'confidence': 64.0, 'created_time': '23/05/2019 22-15-57'}
Message published successfully. Data: {'sender_id': 3, 'latitude': -37.5949, 'surface_temperature_celcius': 98.0, 'longitude': 142.6857, 'confidence': 100.0, 'created_time': '23/05/2019 22-16-11'}
Message published successfully. Data: {'sender_id': 3, 'latitude': -35.2464, 'surface_temperature_celcius': 45.0, 'longitude': 141.1143, 'confidence': 98.0, 'created_time': '23/05/2019 22-16-23'}
Message published successfully. Data: {'sender_id': 3, 'latitude': -36.995, 'surface_temperature_celcius': 37.0, 'longitude': 148.268, 'confidence': 56.0, 'created_time': '23/05/2019 22-16-33'}


Message published successfully. Data: {'sender_id': 3, 'latitude': -37.4786, 'surface_temperature_celcius': 45.0, 'longitude': 141.4578, 'confidence': 70.0, 'created_time': '23/05/2019 22-30-10'}
Message published successfully. Data: {'sender_id': 3, 'latitude': -37.9625, 'surface_temperature_celcius': 58.0, 'longitude': 143.5474, 'confidence': 84.0, 'created_time': '23/05/2019 22-30-29'}
Message published successfully. Data: {'sender_id': 3, 'latitude': -36.6599, 'surface_temperature_celcius': 44.0, 'longitude': 144.6129, 'confidence': 68.0, 'created_time': '23/05/2019 22-30-56'}
Message published successfully. Data: {'sender_id': 3, 'latitude': -37.6745, 'surface_temperature_celcius': 48.0, 'longitude': 142.9848, 'confidence': 75.0, 'created_time': '23/05/2019 22-31-18'}
Message published successfully. Data: {'sender_id': 3, 'latitude': -37.0856, 'surface_temperature_celcius': 45.0, 'longitude': 143.8728, 'confidence': 71.0, 'created_time': '23/05/2019 22-31-28'}
Message published su