This Python script reads a tab-delimited `*.txt` file of the top 4600 Spotify songs of 2024 and adds each song's title, album, artist, release date, ranking, and stream count to a SQLite database as three tables (`Artist`, `Album`, and `Track`). Note that splitting on `'\t'` results in cleaner DB output than splitting on `','` from a `*.csv` file. [Source data here](https://www.kaggle.com/datasets/nelgiriyewithana/most-streamed-spotify-songs-2024?select=Most+Streamed+Spotify+Songs+2024.csv)

In [1]:
import sqlite3

# Schema for the three tables, rebuilt from scratch on every run: any
# existing Artist/Album/Track tables are dropped before being recreated.
# Artist.name, Album.title and Track.title are each declared UNIQUE; the
# loader's INSERT OR IGNORE / INSERT OR REPLACE statements rely on those
# constraints to de-duplicate rows.
# NOTE(review): Album.title and Track.title are unique on their own, so two
# artists cannot each own an album (or track) with the same title -- confirm
# that this is intended.
SCHEMA_SQL = '''
DROP TABLE IF EXISTS Artist;
DROP TABLE IF EXISTS Album;
DROP TABLE IF EXISTS Track;

CREATE TABLE Artist (
    id  INTEGER NOT NULL PRIMARY KEY AUTOINCREMENT UNIQUE,
    name    TEXT UNIQUE
);

CREATE TABLE Album (
    id  INTEGER NOT NULL PRIMARY KEY AUTOINCREMENT UNIQUE,
    artist_id  INTEGER,
    title   TEXT UNIQUE
);

CREATE TABLE Track (
    id  INTEGER NOT NULL PRIMARY KEY 
        AUTOINCREMENT UNIQUE,
    title TEXT  UNIQUE,
    album_id  INTEGER,
    release_date TEXT, rank_2024 INTEGER, spotify_streams INTEGER
);
'''

# Open the database file (SQLite creates it if it does not exist yet) and
# get the cursor that the rest of the script issues its statements through.
conn = sqlite3.connect('trackdb.sqlite')
cur = conn.cursor()

# executescript() runs every statement of the schema in a single call.
cur.executescript(SCHEMA_SQL)

def _to_int(text):
    """Parse a numeric field from the export into an int.

    Surrounding whitespace, surrounding double quotes and thousands
    separators are removed first, so '"1,234"' becomes 1234. Without this,
    SQLite keeps such values as TEXT even in an INTEGER column, because
    '1,234' is not a well-formed number.

    Returns None for a blank field (stored as NULL), the int when the field
    is a whole number, and the original text unchanged otherwise so that no
    data is silently discarded.
    """
    cleaned = text.strip().strip('"').replace(',', '')
    if not cleaned:
        return None
    try:
        return int(cleaned)
    except ValueError:
        return text


# The highest column index read below is 7, so a usable row needs at least
# eight tab-separated fields.
MIN_FIELDS = 8

# Load every row of the tab-delimited export into Artist, Album and Track.
# The file is opened with the platform's default text encoding, as before.
with open('spotify2024.txt') as handle:
    for line_number, line in enumerate(handle, start=1):
        # Remove only the line terminator. A bare strip() would also remove
        # leading/trailing tabs and shift the columns whenever the first or
        # last field of a row is empty.
        pieces = [piece.strip() for piece in line.rstrip('\r\n').split('\t')]
        if len(pieces) < MIN_FIELDS:
            continue  # blank or truncated line

        # Column positions in the export; columns 4 and 6 are not used.
        track = pieces[0]
        album = pieces[1]
        artist = pieces[2]
        release_date = pieces[3]
        rank_2024 = _to_int(pieces[5])
        spotify_streams = _to_int(pieces[7])

        # A first line whose rank is not a number is treated as the column
        # header row and is not loaded as a track.
        if line_number == 1 and not isinstance(rank_2024, int):
            continue

        print(track, album, artist, release_date, rank_2024, spotify_streams)

        # Insert the artist if new, then read back its id either way.
        cur.execute('''INSERT OR IGNORE INTO Artist (name) 
            VALUES ( ? )''', (artist,))
        cur.execute('SELECT id FROM Artist WHERE name = ? ', (artist,))
        artist_id = cur.fetchone()[0]

        # NOTE(review): Album.title is UNIQUE on its own, so an album title
        # already stored for another artist is reused here as-is.
        cur.execute('''INSERT OR IGNORE INTO Album (title, artist_id) 
            VALUES ( ?, ? )''', (album, artist_id))
        cur.execute('SELECT id FROM Album WHERE title = ? ', (album,))
        album_id = cur.fetchone()[0]

        # NOTE(review): Track.title is UNIQUE, so a later row with the same
        # title replaces the earlier one.
        cur.execute('''INSERT OR REPLACE INTO Track
            (title, album_id, release_date, rank_2024, spotify_streams) 
            VALUES ( ?, ?, ?, ?, ? )''',
            (track, album_id, release_date, rank_2024, spotify_streams))

# Commit once for the whole load instead of once per row. The connection is
# left open in case code that follows still queries it.
conn.commit()
   