# Master Discogs Database

In [2]:
## Basic stuff
%load_ext autoreload
%autoreload
from IPython.core.display import display, HTML
display(HTML("<style>.container { width:100% !important; }</style>"))
display(HTML("""<style>div.output_area{max-height:10000px;overflow:scroll;}</style>"""))

## Python Version
import sys
print("Python: {0}".format(sys.version))


################################################################################
## General Stuff
################################################################################
from ioUtils import saveJoblib, loadJoblib, saveFile, getFile
import urllib
from urllib.parse import quote
from collections import Counter
from artist import artist
from searchUtils import findExt, findSubExt, findPatternExt, findNearest
from timeUtils import clock, elapsed
from fsUtils import moveFile, setFile, setDir, setSubDir, isFile, isDir, mkDir
from fileUtils import getFileBasics, getBasename
from time import sleep


################################################################################
## Music Stuff
################################################################################

### MultiArtist
from multiArtist import multiartist

### My Music DB
from myMusicDBMap import myMusicDBMap

### Master DB code
from masterdb import discConv, isKnownAlbum, directoryName
from masterdb import getSlimArtistDB, getArtistNameToIDMap
from masterdb import getMusicData, getRowByIndex

### General
from discogsBase import discogs

### Discogs
from artistsDC import artistsDC
from artistDC import artistDC
from discogsUtils import discogsUtils
from albums import albums
from album import album, albumURLInfo

### AllMusic
from artistsAM import artistsAM
from artistAM import artistAM
from discogsUtils import allmusicUtils

### MusicBrainz
from artistsMB import artistsMB
from artistMB import artistMB
from discogsUtils import musicbrainzUtils

## AceBootlegs
from artistAB import artistAB
from artistsAB import artistsAB
from discogsUtils import acebootlegsUtils

## RateYourMusic
from artistRM import artistRM
from artistsRM import artistsRM
from discogsUtils import rateyourmusicUtils

## LastFM
from artistLM import artistLM
from artistsLM import artistsLM
from discogsUtils import lastfmUtils

## DatPiff
from artistDP import artistDP
from artistsDP import artistsDP
from discogsUtils import datpiffUtils

## RockCorner
from artistRC import artistRC
from artistsRC import artistsRC
from discogsUtils import rockcornerUtils

## CDandLP
from artistCL import artistCL
from artistsCL import artistsCL
from discogsUtils import cdandlpUtils

## MusicStack
from artistMS import artistMS
from artistsMS import artistsMS
from discogsUtils import musicstackUtils

## MetalStorm
from artistMT import artistMT
from artistsMT import artistsMT
from discogsUtils import metalstormUtils


import datetime as dt
# Capture when this setup cell ran so the saved notebook shows its last execution time.
start = dt.datetime.now()
print("Notebook Last Run Initiated: {0}".format(start))

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload


Python: 3.7.3 (default, Mar 27 2019, 16:54:48) 
[Clang 4.0.1 (tags/RELEASE_401/final)]
Notebook Last Run Initiated: 2020-04-11 19:21:13.601657


In [9]:
%load_ext autoreload
%autoreload

discAM   = discogs('allmusic')
artsAM   = artistsAM(discAM)
dutilsAM = allmusicUtils()

discDC   = discogs('discogs')
artsDC   = artistsDC(discDC)
dutilsDC = discogsUtils()

discMB   = discogs('musicbrainz')
artsMB   = artistsMB(discMB)
dutilsMB = musicbrainzUtils()

discAB   = discogs('acebootlegs')
artsAB   = artistsAB(discAB)
dutilsAB = acebootlegsUtils()

discRM   = discogs('rateyourmusic')
artsRM   = artistsRM(discRM)
dutilsRM = rateyourmusicUtils()

discLM   = discogs('lastfm')
artsLM   = artistsLM(discLM)
dutilsLM = lastfmUtils()

discDP   = discogs('datpiff')
artsDP   = artistsDP(discDP)
dutilsDP = datpiffUtils()

discRC   = discogs('rockcorner')
artsRC   = artistsRC(discRC)
dutilsRC = rockcornerUtils()

discCL   = discogs('cdandlp')
artsCL   = artistsRC(discCL)
dutilsCL = cdandlpUtils()

discMS   = discogs('musicstack')
artsMS   = artistsMS(discMS)
dutilsMS = musicstackUtils()

discMT   = discogs('metalstorm')
artsMT   = artistsMT(discMT)
dutilsMT = metalstormUtils()

_, _ = clock("Last Run")

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
Current Time is Sun Apr 12, 2020 12:53:13 for Last Run


# Create Dictionary Lookup Files

## Artist ID --> Ref and Name

#### AllMusic

In [10]:
%load_ext autoreload
%autoreload

####################################################################################################
## Create Artist ID Lookup
####################################################################################################
from lookup import createArtistIDMap
createArtistIDMap(discAM)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getSlimArtistDB
discSlimArtistAMDB = getSlimArtistDB(discAM, force=True)
discSlimArtistAMDB.head()


####################################################################################################
## Create Artist ID to Album ID Lookup
####################################################################################################
from lookup import createArtistAlbumIDMap
createArtistAlbumIDMap(discAM)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getArtistAlbumsDB
discArtistAMAlbumsDB = getArtistAlbumsDB(discAM, force=True)
discArtistAMAlbumsDB.head()

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
Current Time is Sun Apr 12, 2020 12:53:15 for Creating Artist DBs
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/0-Metadata.p  	0 382
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/1-Metadata.p  	1 746
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/10-Metadata.p  	2 1163
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/11-Metadata.p  	3 1537
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/12-Metadata.p  	4 1941
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/13-Metadata.p  	5 2323
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/14-Metadata.p  	6 2682
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/15-Metadata.p  	7 3040
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/16-Metadata.p  	8 3433
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/17-Metadata.p  	9 3824
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/18-Metadata.p  	10 4188
/Volumes/Biggy/Discog/artists-allmu

  --> This file is 836.3kB.
Saved data to /Volumes/Biggy/Discog/db-allmusic/ArtistIDToVariations.p
  --> This file is 836.3kB.
Current Time is Sun Apr 12, 2020 12:53:19 for Done with Creating Artist DBs
Process [Done with Creating Artist DBs] took 4 seconds.
Current Time is Sun Apr 12, 2020 12:53:19 for 
Loading ArtistID Data
Creating Pandas DataFrame for 38716 Artists
	Shape --> (38716, 1)
  Finding Real Artist Name
	Shape --> (38716, 3)
  Removing None Artist
	Shape --> (38716, 3)
  Finding Disc Artist Name
	Shape --> (38716, 4)
DataFrame Shape is (38716, 4)
Current Time is Sun Apr 12, 2020 12:53:20 for Done with 
Process [Done with 
Saving Master Artist DB File
  --> This file is 2.9MB.
Current Time is Sun Apr 12, 2020 12:53:21 for Creating Artist DBs
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/0-MediaMetadata.p 	382       1782      4706      
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/1-MediaMetadata.p 	746       3460      9524      
/Volumes/Biggy/Discog/artists-all

/Volumes/Biggy/Discog/artists-allmusic-db/metadata/73-MediaMetadata.p 	27831     126075    349241    
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/74-MediaMetadata.p 	28220     127729    354038    
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/75-MediaMetadata.p 	28620     130030    360255    
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/76-MediaMetadata.p 	29016     132580    366469    
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/77-MediaMetadata.p 	29400     134287    371279    
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/78-MediaMetadata.p 	29781     135665    375734    
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/79-MediaMetadata.p 	30159     137647    380203    
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/8-MediaMetadata.p 	30556     139627    385139    
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/80-MediaMetadata.p 	30976     142245    391236    
/Volumes/Biggy/Discog/artists-allmusic-db/metadata/81-MediaMetadata.p 	31376     14

Unnamed: 0,Albums
3100,"{'Albums': {'0000476912': 'Ohla Quem Chega', '..."
3500,"{'Albums': {}, 'Single/EP': {'0000934205': 'Ge..."
6000,{'Albums': {'0000237785': 'Eyes of the Basilis...
7300,"{'Albums': {}, 'Album': {'0000089708': 'Motiva..."
15100,"{'Albums': {'0000597370': 'Life Rays', '000035..."


#### MusicBrainz

In [11]:
%load_ext autoreload
%autoreload

####################################################################################################
## Create Artist ID Lookup
####################################################################################################
from lookup import createArtistIDMap
createArtistIDMap(discMB)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getSlimArtistDB
discSlimArtistMBDB = getSlimArtistDB(discMB, force=True)
discSlimArtistMBDB.head()


####################################################################################################
## Create Artist ID to Album ID Lookup
####################################################################################################
from lookup import createArtistAlbumIDMap
createArtistAlbumIDMap(discMB)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getArtistAlbumsDB
discArtistMBAlbumsDB = getArtistAlbumsDB(discMB, force=True)
discArtistMBAlbumsDB.head()

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
Current Time is Sun Apr 12, 2020 12:54:07 for Creating Artist DBs
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/0-Metadata.p  	0 557
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/1-Metadata.p  	1 1107
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/10-Metadata.p  	2 1680
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/11-Metadata.p  	3 2256
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/12-Metadata.p  	4 2795
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/13-Metadata.p  	5 3377
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/14-Metadata.p  	6 3909
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/15-Metadata.p  	7 4459
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/16-Metadata.p  	8 5020
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/17-Metadata.p  	9 5568
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/18-Metadata.p  	10 6099
/

  --> This file is 2.8MB.
Saved data to /Volumes/Biggy/Discog/db-musicbrainz/ArtistIDToRef.p
  --> This file is 2.8MB.
Saving 55519 entries to /Volumes/Biggy/Discog/db-musicbrainz/ArtistIDToName.p

Saving data to /Volumes/Biggy/Discog/db-musicbrainz/ArtistIDToName.p
  --> This file is 2.0MB.
Saved data to /Volumes/Biggy/Discog/db-musicbrainz/ArtistIDToName.p
  --> This file is 2.0MB.
Saving 55519 entries to /Volumes/Biggy/Discog/db-musicbrainz/ArtistIDToVariations.p

Saving data to /Volumes/Biggy/Discog/db-musicbrainz/ArtistIDToVariations.p
  --> This file is 2.2MB.
Saved data to /Volumes/Biggy/Discog/db-musicbrainz/ArtistIDToVariations.p
  --> This file is 2.2MB.
Current Time is Sun Apr 12, 2020 12:54:12 for Done with Creating Artist DBs
Process [Done with Creating Artist DBs] took 5 seconds.
Current Time is Sun Apr 12, 2020 12:54:12 for 
Loading ArtistID Data
Creating Pandas DataFrame for 55519 Artists
	Shape --> (55519, 1)
  Finding Real Artist Name
	Shape --> (55519, 3)
  Removing 

/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/67-MediaMetadata.p 	36125     0         210517    
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/68-MediaMetadata.p 	36713     0         214132    
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/69-MediaMetadata.p 	37260     0         217408    
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/7-MediaMetadata.p 	37809     0         220782    
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/70-MediaMetadata.p 	38351     0         224137    
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/71-MediaMetadata.p 	38909     0         227525    
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/72-MediaMetadata.p 	39467     0         230722    
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/73-MediaMetadata.p 	40033     0         234354    
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/74-MediaMetadata.p 	40551     0         237026    
/Volumes/Biggy/Discog/artists-musicbrainz-db/metadata/75

Unnamed: 0,Albums
100442956818207492535169252608810699800,{'Album': {27770537760962693970507350008002514...
100547417529436851599898351146314554400,{}
101067819862970238038942897476434995600,{'Album': {10822236411089444077640107176594516...
102601962926749501316989527386285051500,{'Album': {30058500140618681019331294204264380...
102930867198372774019969168577092619200,{'Album': {16944562643412015066836422387591452...


In [12]:
# Tally, per media-type label, the total number of entries across every artist
# in the MusicBrainz artist -> albums frame.
cntr = Counter()
for mediaByType in discArtistMBAlbumsDB["Albums"].to_dict().values():
    # Each value maps a media-type label to a sized collection of releases.
    cntr.update({mediaType: len(releases) for mediaType, releases in mediaByType.items()})
cntr.most_common()

[('Album', 129996),
 ('Album + Compilation', 63783),
 ('Single', 57958),
 ('EP', 19758),
 ('Album + Live', 13578),
 ('Album + Soundtrack', 7798),
 ('Unspecified type', 4913),
 ('Other', 3772),
 ('Album + Compilation + DJ-mix', 2674),
 ('Single + Remix', 2610),
 ('Other + Audiobook', 2511),
 ('Album + Mixtape/Street', 2503),
 ('Album + Remix', 1771),
 ('Other + Audio drama', 1231),
 ('Compilation', 924),
 ('Album + Audiobook', 672),
 ('EP + Live', 617),
 ('EP + Remix', 561),
 ('Album + Compilation + Live', 554),
 ('Single + Soundtrack', 537),
 ('Other + Spokenword', 537),
 ('Live', 498),
 ('Album + DJ-mix', 386),
 ('Single + Live', 374),
 ('EP + Demo', 314),
 ('Remix', 290),
 ('EP + Compilation', 281),
 ('Album + Demo', 245),
 ('Album + Compilation + Soundtrack', 243),
 ('Other + Compilation', 228),
 ('Broadcast', 223),
 ('Album + Compilation + Remix', 183),
 ('Audiobook', 178),
 ('Album + Spokenword', 147),
 ('Other + Live', 144),
 ('EP + Soundtrack', 142),
 ('Album + Audio drama', 142

In [13]:
if False:
    # Disabled scratch code: lists the media-type labels from `cntr` that are not
    # yet assigned to any of the four groups.
    # NOTE(review): primary/secondary/tertiary/fourth are not defined in the visible
    # part of this notebook - define them before enabling this block.
    import json
    assignedGroups = (primary, secondary, tertiary, fourth)
    keys = [label for label, count in cntr.most_common()
            if not any(label in group for group in assignedGroups)]
    #tertiary = [x for x in keys if x.startswith("Single") or x.startswith("EP")]
    #print(json.dumps(fourth))
    #json.dumps(tertiary)
    #secondary = [x for x in keys if x.find("Compilation") != -1]
    #json.dumps(keys)
    #keys

#### Discogs

In [14]:
%load_ext autoreload
%autoreload

####################################################################################################
## Create Artist ID Lookup
####################################################################################################
from lookup import createArtistIDMap
createArtistIDMap(discDC)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getSlimArtistDB
discSlimArtistDCDB = getSlimArtistDB(discDC, force=True)
discSlimArtistDCDB.head()


####################################################################################################
## Create Artist ID to Album ID Lookup
####################################################################################################
from lookup import createArtistAlbumIDMap
createArtistAlbumIDMap(discDC)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getArtistAlbumsDB
discArtistDCAlbumsDB = getArtistAlbumsDB(discDC, force=True)
discArtistDCAlbumsDB.head()

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
Current Time is Sun Apr 12, 2020 12:54:45 for Creating Artist DBs
/Volumes/Biggy/Discog/artists-discogs-db/metadata/0-Metadata.p  	0 7119
/Volumes/Biggy/Discog/artists-discogs-db/metadata/1-Metadata.p  	1 14504
/Volumes/Biggy/Discog/artists-discogs-db/metadata/10-Metadata.p  	2 21675
/Volumes/Biggy/Discog/artists-discogs-db/metadata/11-Metadata.p  	3 28931
/Volumes/Biggy/Discog/artists-discogs-db/metadata/12-Metadata.p  	4 36208
/Volumes/Biggy/Discog/artists-discogs-db/metadata/13-Metadata.p  	5 43542
/Volumes/Biggy/Discog/artists-discogs-db/metadata/14-Metadata.p  	6 50620
/Volumes/Biggy/Discog/artists-discogs-db/metadata/15-Metadata.p  	7 57829
/Volumes/Biggy/Discog/artists-discogs-db/metadata/16-Metadata.p  	8 64960
/Volumes/Biggy/Discog/artists-discogs-db/metadata/17-Metadata.p  	9 72189
/Volumes/Biggy/Discog/artists-discogs-db/metadata/18-Metadata.p  	10 79415
/Volumes/Biggy/Discog/artists-disc

  --> This file is 26.9MB.
Saved data to /Volumes/Biggy/Discog/db-discogs/ArtistIDToVariations.p
  --> This file is 26.9MB.
Current Time is Sun Apr 12, 2020 12:56:02 for Done with Creating Artist DBs
Process [Done with Creating Artist DBs] took 1.3 minutes.
Current Time is Sun Apr 12, 2020 12:56:02 for 
Loading ArtistID Data
Creating Pandas DataFrame for 718816 Artists
	Shape --> (718816, 1)
  Finding Real Artist Name
	Shape --> (718816, 3)
  Removing None Artist
	Shape --> (718816, 3)
  Finding Disc Artist Name
	Shape --> (718816, 4)
DataFrame Shape is (718816, 4)
Current Time is Sun Apr 12, 2020 12:56:19 for Done with 
Process [Done with 
Saving Master Artist DB File
  --> This file is 57.6MB.
Current Time is Sun Apr 12, 2020 12:56:25 for Creating Artist DBs
/Volumes/Biggy/Discog/artists-discogs-db/metadata/0-MediaMetadata.p 	7119      16153     65892     
/Volumes/Biggy/Discog/artists-discogs-db/metadata/1-MediaMetadata.p 	14504     34086     137874    
/Volumes/Biggy/Discog/artists

/Volumes/Biggy/Discog/artists-discogs-db/metadata/72-MediaMetadata.p 	509679    1152631   4807376   
/Volumes/Biggy/Discog/artists-discogs-db/metadata/73-MediaMetadata.p 	516832    1168877   4875289   
/Volumes/Biggy/Discog/artists-discogs-db/metadata/74-MediaMetadata.p 	524045    1186081   4943204   
/Volumes/Biggy/Discog/artists-discogs-db/metadata/75-MediaMetadata.p 	531195    1201907   5007249   
/Volumes/Biggy/Discog/artists-discogs-db/metadata/76-MediaMetadata.p 	538359    1217729   5076719   
/Volumes/Biggy/Discog/artists-discogs-db/metadata/77-MediaMetadata.p 	545490    1234201   5146528   
/Volumes/Biggy/Discog/artists-discogs-db/metadata/78-MediaMetadata.p 	552784    1250429   5215826   
/Volumes/Biggy/Discog/artists-discogs-db/metadata/79-MediaMetadata.p 	559984    1266464   5280393   
/Volumes/Biggy/Discog/artists-discogs-db/metadata/8-MediaMetadata.p 	567213    1282352   5350485   
/Volumes/Biggy/Discog/artists-discogs-db/metadata/80-MediaMetadata.p 	574439    1300335   54

Unnamed: 0,Albums
1000,"{'Albums': {'44815': 'Archive One', '44831': '..."
1000500,{'Miscellaneous': {'1178875': 'Peak Controller'}}
100200,"{'Albums': {'50511': 'PottpÃ¼ree'}, 'Singles &..."
1002000,{'Instruments & Performance': {'1002108': 'Are...
1002600,{'Vocals': {'1180905': 'Quiero'}}


#### AceBootlegs

In [15]:
%load_ext autoreload
%autoreload

####################################################################################################
## Create Artist ID Lookup
####################################################################################################
from lookup import createArtistIDMap
createArtistIDMap(discAB)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getSlimArtistDB
discSlimArtistABDB = getSlimArtistDB(discAB, force=True)
discSlimArtistABDB.head()


####################################################################################################
## Create Artist ID to Album ID Lookup
####################################################################################################
from lookup import createArtistAlbumIDMap
createArtistAlbumIDMap(discAB)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getArtistAlbumsDB
discArtistABAlbumsDB = getArtistAlbumsDB(discAB, force=True)
discArtistABAlbumsDB.head()

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
Current Time is Sun Apr 12, 2020 13:10:33 for Creating Artist DBs
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/0-Metadata.p  	0 2
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/10-Metadata.p  	1 3
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/11-Metadata.p  	2 5
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/12-Metadata.p  	3 14
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/13-Metadata.p  	4 16
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/14-Metadata.p  	5 20
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/15-Metadata.p  	6 21
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/16-Metadata.p  	7 24
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/17-Metadata.p  	8 27
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/18-Metadata.p  	9 32
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/19-Metadata.p  	10 33
/Volumes/Biggy/Discog/ar

/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/40-MediaMetadata.p 	113       0         1281      
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/41-MediaMetadata.p 	116       0         1319      
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/42-MediaMetadata.p 	118       0         1340      
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/43-MediaMetadata.p 	121       0         1360      
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/44-MediaMetadata.p 	128       0         1390      
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/45-MediaMetadata.p 	130       0         1422      
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/46-MediaMetadata.p 	131       0         1430      
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/47-MediaMetadata.p 	137       0         1449      
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/48-MediaMetadata.p 	140       0         1483      
/Volumes/Biggy/Discog/artists-acebootlegs-db/metadata/4

Unnamed: 0,Albums
808801813200,"{'Bootleg': {'10753': 'Warning The Audience', ..."
393858009400,{'Bootleg': {'27966': 'Live Trash'}}
98803225010,{'Bootleg': {'26358': '14 September 1978 El Mo...
363272091111,{'Bootleg': {'19772': 'Live In France'}}
872005022711,{'Bootleg': {'20735': 'Live At The Greek Theat...


#### RateYourMusic

In [16]:
%load_ext autoreload
%autoreload

####################################################################################################
## Create Artist ID Lookup
####################################################################################################
from lookup import createArtistIDMap
createArtistIDMap(discRM)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getSlimArtistDB
discSlimArtistRMDB = getSlimArtistDB(discRM, force=True)
discSlimArtistRMDB.head()


####################################################################################################
## Create Artist ID to Album ID Lookup
####################################################################################################
from lookup import createArtistAlbumIDMap
createArtistAlbumIDMap(discRM)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getArtistAlbumsDB
discArtistRMAlbumsDB = getArtistAlbumsDB(discRM, force=True)
discArtistRMAlbumsDB.head()

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
Current Time is Sun Apr 12, 2020 13:10:34 for Creating Artist DBs
/Volumes/Biggy/Discog/artists-rateyourmusic-db/metadata/0-Metadata.p  	0 1
/Volumes/Biggy/Discog/artists-rateyourmusic-db/metadata/16-Metadata.p  	1 3
/Volumes/Biggy/Discog/artists-rateyourmusic-db/metadata/19-Metadata.p  	2 4
/Volumes/Biggy/Discog/artists-rateyourmusic-db/metadata/20-Metadata.p  	3 5
/Volumes/Biggy/Discog/artists-rateyourmusic-db/metadata/22-Metadata.p  	4 6
/Volumes/Biggy/Discog/artists-rateyourmusic-db/metadata/23-Metadata.p  	5 7
/Volumes/Biggy/Discog/artists-rateyourmusic-db/metadata/27-Metadata.p  	6 8
/Volumes/Biggy/Discog/artists-rateyourmusic-db/metadata/28-Metadata.p  	7 10
/Volumes/Biggy/Discog/artists-rateyourmusic-db/metadata/33-Metadata.p  	8 11
/Volumes/Biggy/Discog/artists-rateyourmusic-db/metadata/41-Metadata.p  	9 12
/Volumes/Biggy/Discog/artists-rateyourmusic-db/metadata/45-Metadata.p  	10 15
/Volum

  --> This file is 68.9kB.
Current Time is Sun Apr 12, 2020 13:10:34 for Done with 
Process [Done with 


Unnamed: 0,Albums
8700,"{'Album': {'493633': 'Duppy or Gunman', '32919..."
416,{'Album': {'6364': 'Peter Green's Fleetwood Ma...
417216,"{'Mixtape': {'2617766': 'Motion Picture', '464..."
146419,{'Single': {'613366': 'Johnny Runs for Paregor...
1090320,"{'Album': {'6238923': 'Great Pine', '9905730':..."


#### LastFM

In [17]:
%load_ext autoreload
%autoreload

####################################################################################################
## Create Artist ID Lookup
####################################################################################################
from lookup import createArtistIDMap
createArtistIDMap(discLM)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getSlimArtistDB
discSlimArtistLMDB = getSlimArtistDB(discLM, force=True)
discSlimArtistLMDB.head()


####################################################################################################
## Create Artist ID to Album ID Lookup
####################################################################################################
from lookup import createArtistAlbumIDMap
createArtistAlbumIDMap(discLM)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getArtistAlbumsDB
discArtistLMAlbumsDB = getArtistAlbumsDB(discLM, force=True)
discArtistLMAlbumsDB.head()

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
Current Time is Sun Apr 12, 2020 13:10:34 for Creating Artist DBs
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/0-Metadata.p  	0 453
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/1-Metadata.p  	1 917
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/10-Metadata.p  	2 1411
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/11-Metadata.p  	3 1884
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/12-Metadata.p  	4 2381
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/13-Metadata.p  	5 2899
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/14-Metadata.p  	6 3376
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/15-Metadata.p  	7 3856
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/16-Metadata.p  	8 4349
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/17-Metadata.p  	9 4794
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/18-Metadata.p  	10 5258
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/19-Metad

  --> This file is 1.6MB.
Saved data to /Volumes/Biggy/Discog/db-lastfm/ArtistIDToVariations.p
  --> This file is 1.6MB.
Current Time is Sun Apr 12, 2020 13:10:40 for Done with Creating Artist DBs
Process [Done with Creating Artist DBs] took 5 seconds.
Current Time is Sun Apr 12, 2020 13:10:40 for 
Loading ArtistID Data
Creating Pandas DataFrame for 48223 Artists
	Shape --> (48223, 1)
  Finding Real Artist Name
	Shape --> (48223, 3)
  Removing None Artist
	Shape --> (48223, 3)
  Finding Disc Artist Name
	Shape --> (48223, 4)
DataFrame Shape is (48223, 4)
Current Time is Sun Apr 12, 2020 13:10:41 for Done with 
Process [Done with 
Saving Master Artist DB File
  --> This file is 6.2MB.
Current Time is Sun Apr 12, 2020 13:10:42 for Creating Artist DBs
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/0-MediaMetadata.p 	453       712       712       
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/1-MediaMetadata.p 	917       1350      1350      
/Volumes/Biggy/Discog/artists-lastfm-db/met

/Volumes/Biggy/Discog/artists-lastfm-db/metadata/77-MediaMetadata.p 	36635     56467     56467     
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/78-MediaMetadata.p 	37117     57423     57423     
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/79-MediaMetadata.p 	37604     58101     58101     
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/8-MediaMetadata.p 	38079     58907     58907     
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/80-MediaMetadata.p 	38574     59755     59755     
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/81-MediaMetadata.p 	39034     60194     60194     
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/82-MediaMetadata.p 	39560     60794     60794     
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/83-MediaMetadata.p 	40027     61412     61412     
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/84-MediaMetadata.p 	40542     62227     62227     
/Volumes/Biggy/Discog/artists-lastfm-db/metadata/85-MediaMetadata.p 	41059     62816     62816     
/

Unnamed: 0,Albums
10074300700,{'Albums': {}}
10197954100,{'Albums': {}}
10588500900,{'Albums': {}}
10998118200,{'Albums': {}}
11060537400,{'Albums': {}}


#### DatPiff

In [18]:
%load_ext autoreload
%autoreload

####################################################################################################
## Create Artist ID Lookup
####################################################################################################
from lookup import createArtistIDMap
createArtistIDMap(discDP)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getSlimArtistDB
discSlimArtistDPDB = getSlimArtistDB(discDP, force=True)
discSlimArtistDPDB.head()


####################################################################################################
## Create Artist ID to Album ID Lookup
####################################################################################################
from lookup import createArtistAlbumIDMap
createArtistAlbumIDMap(discDP)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getArtistAlbumsDB
discArtistDPAlbumsDB = getArtistAlbumsDB(discDP, force=True)
discArtistDPAlbumsDB.head()

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
Current Time is Sun Apr 12, 2020 13:10:58 for Creating Artist DBs
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/0-Metadata.p  	0 410
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/1-Metadata.p  	1 830
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/10-Metadata.p  	2 1276
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/11-Metadata.p  	3 1749
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/12-Metadata.p  	4 2197
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/13-Metadata.p  	5 2621
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/14-Metadata.p  	6 3071
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/15-Metadata.p  	7 3509
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/16-Metadata.p  	8 3952
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/17-Metadata.p  	9 4379
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/18-Metadata.p  	10 4783
/Volumes/Biggy/Discog/artists-datpiff-db/metad

  --> This file is 955.7kB.
Saved data to /Volumes/Biggy/Discog/db-datpiff/ArtistIDToVariations.p
  --> This file is 955.7kB.
Current Time is Sun Apr 12, 2020 13:11:02 for Done with Creating Artist DBs
Process [Done with Creating Artist DBs] took 3 seconds.
Current Time is Sun Apr 12, 2020 13:11:02 for 
Loading ArtistID Data
Creating Pandas DataFrame for 44170 Artists
	Shape --> (44170, 1)
  Finding Real Artist Name
	Shape --> (44170, 3)
  Removing None Artist
	Shape --> (44170, 3)
  Finding Disc Artist Name
	Shape --> (44170, 4)
DataFrame Shape is (44170, 4)
Current Time is Sun Apr 12, 2020 13:11:03 for Done with 
Process [Done with 
Saving Master Artist DB File
  --> This file is 3.1MB.
Current Time is Sun Apr 12, 2020 13:11:03 for Creating Artist DBs
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/0-MediaMetadata.p 	410       0         2820      
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/1-MediaMetadata.p 	830       0         3740      
/Volumes/Biggy/Discog/artists-datpif

/Volumes/Biggy/Discog/artists-datpiff-db/metadata/75-MediaMetadata.p 	32653     0         94021     
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/76-MediaMetadata.p 	33071     0         95028     
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/77-MediaMetadata.p 	33512     0         95971     
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/78-MediaMetadata.p 	33932     0         96911     
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/79-MediaMetadata.p 	34383     0         98043     
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/8-MediaMetadata.p 	34782     0         99040     
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/80-MediaMetadata.p 	35216     0         100261    
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/81-MediaMetadata.p 	35641     0         102058    
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/82-MediaMetadata.p 	36092     0         103108    
/Volumes/Biggy/Discog/artists-datpiff-db/metadata/83-MediaMetadata.p 	36528     0         10

Unnamed: 0,Albums
1863800,{'MixTape': {'8370019': 'Coast 2 Coast Mixtape...
6695000,{'MixTape': {'1289055': 'Movies On Demand 2'}}
6537000,{'MixTape': {'9658322': 'Domino Mothafucka! Re...
9285900,{'MixTape': {'8355863': 'Mr5torm Presents: Pro...
1931900,{'MixTape': {'6282725': 'Jacking For Beats Vol...


#### RockCorner

In [19]:
%load_ext autoreload
%autoreload

####################################################################################################
## Create Artist ID Lookup
####################################################################################################
from lookup import createArtistIDMap
createArtistIDMap(discRC)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getSlimArtistDB
discSlimArtistRCDB = getSlimArtistDB(discRC, force=True)
discSlimArtistRCDB.head()


####################################################################################################
## Create Artist ID to Album ID Lookup
####################################################################################################
from lookup import createArtistAlbumIDMap
createArtistAlbumIDMap(discRC)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getArtistAlbumsDB
discArtistRCAlbumsDB = getArtistAlbumsDB(discRC, force=True)
discArtistRCAlbumsDB.head()

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
Current Time is Sun Apr 12, 2020 13:11:18 for Creating Artist DBs
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/0-Metadata.p  	0 19
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/1-Metadata.p  	1 30
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/10-Metadata.p  	2 45
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/11-Metadata.p  	3 59
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/12-Metadata.p  	4 72
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/13-Metadata.p  	5 83
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/14-Metadata.p  	6 93
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/15-Metadata.p  	7 104
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/16-Metadata.p  	8 114
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/17-Metadata.p  	9 123
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/18-Metadata.p  	10 132
/Volumes/Biggy/Discog/artists

  --> This file is 25.9kB.
Saved data to /Volumes/Biggy/Discog/db-rockcorner/ArtistIDToName.p
  --> This file is 25.9kB.
Saving 1251 entries to /Volumes/Biggy/Discog/db-rockcorner/ArtistIDToVariations.p

Saving data to /Volumes/Biggy/Discog/db-rockcorner/ArtistIDToVariations.p
  --> This file is 30.0kB.
Saved data to /Volumes/Biggy/Discog/db-rockcorner/ArtistIDToVariations.p
  --> This file is 30.0kB.
Current Time is Sun Apr 12, 2020 13:11:19 for Done with Creating Artist DBs
Process [Done with Creating Artist DBs] took 389.0 millseconds.
Current Time is Sun Apr 12, 2020 13:11:19 for 
Loading ArtistID Data
Creating Pandas DataFrame for 1251 Artists
	Shape --> (1251, 1)
  Finding Real Artist Name
	Shape --> (1251, 3)
  Removing None Artist
	Shape --> (1251, 3)
  Finding Disc Artist Name
	Shape --> (1251, 4)
DataFrame Shape is (1251, 4)
Current Time is Sun Apr 12, 2020 13:11:19 for Done with 
Process [Done with 
Saving Master Artist DB File
  --> This file is 41.9kB.
Current Time is Sun 

/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/77-MediaMetadata.p 	959       10957     66777     
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/78-MediaMetadata.p 	970       11102     67452     
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/79-MediaMetadata.p 	984       11281     68462     
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/8-MediaMetadata.p 	989       11318     68755     
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/80-MediaMetadata.p 	1000      11403     69469     
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/81-MediaMetadata.p 	1017      11622     70647     
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/82-MediaMetadata.p 	1026      11731     71268     
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/83-MediaMetadata.p 	1037      11893     71988     
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/84-MediaMetadata.p 	1053      12138     73210     
/Volumes/Biggy/Discog/artists-rockcorner-db/metadata/85-MediaMeta

Unnamed: 0,Albums
114396000,"{'Albums': {'799619505': 'Hell To Pay', '57489..."
150110900,"{'Albums': {'985030875': 'Some Nights', '49644..."
153352100,"{'Albums': {'190618332': 'The CBS Recordings, ..."
214126900,{'Albums': {'959493591': 'The Green Car Motel'...
257073300,{'Albums': {'383248847': 'Dimmi cosa succede s...


#### CDandLP

In [20]:
%load_ext autoreload
%autoreload

####################################################################################################
## Create Artist ID Lookup
####################################################################################################
from lookup import createArtistIDMap
createArtistIDMap(discCL)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getSlimArtistDB
discSlimArtistCLDB = getSlimArtistDB(discCL, force=True)
discSlimArtistCLDB.head()


####################################################################################################
## Create Artist ID to Album ID Lookup
####################################################################################################
from lookup import createArtistAlbumIDMap
createArtistAlbumIDMap(discCL)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getArtistAlbumsDB
discArtistCLAlbumsDB = getArtistAlbumsDB(discCL, force=True)
discArtistCLAlbumsDB.head()

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
Current Time is Sun Apr 12, 2020 13:11:25 for Creating Artist DBs
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/0-Metadata.p  	0 10
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/1-Metadata.p  	1 20
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/10-Metadata.p  	2 28
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/11-Metadata.p  	3 38
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/12-Metadata.p  	4 43
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/13-Metadata.p  	5 50
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/15-Metadata.p  	6 58
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/16-Metadata.p  	7 64
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/17-Metadata.p  	8 67
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/18-Metadata.p  	9 75
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/19-Metadata.p  	10 84
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/2-Metadata.p  	1

/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/1-MediaMetadata.p 	20        115       115       
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/10-MediaMetadata.p 	28        153       153       
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/11-MediaMetadata.p 	38        199       199       
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/12-MediaMetadata.p 	43        208       208       
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/13-MediaMetadata.p 	50        270       270       
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/15-MediaMetadata.p 	58        313       313       
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/16-MediaMetadata.p 	64        369       369       
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/17-MediaMetadata.p 	67        397       397       
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/18-MediaMetadata.p 	75        427       427       
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/19-MediaMetadata.p 	84        499       49

/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/90-MediaMetadata.p 	519       3684      3684      
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/91-MediaMetadata.p 	527       3731      3731      
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/92-MediaMetadata.p 	532       3755      3755      
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/93-MediaMetadata.p 	536       3763      3763      
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/94-MediaMetadata.p 	540       3801      3801      
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/95-MediaMetadata.p 	545       3837      3837      
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/96-MediaMetadata.p 	550       3907      3907      
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/97-MediaMetadata.p 	557       3954      3954      
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/98-MediaMetadata.p 	563       4002      4002      
/Volumes/Biggy/Discog/artists-cdandlp-db/metadata/99-MediaMetadata.p 	568       4046      4

Unnamed: 0,Albums
10164083958400,"{'Albums': {'90322725707033': 'Damn E.P.', '67..."
14949541170200,{'Albums': {'13109527179712': 'So Strong (Remi...
18432190263200,{'Albums': {'43304212049028': 'Down In The Boo...
25622009416200,{'Albums': {'69575693315202': 'Retro Failure'}}
52956743695400,"{'Albums': {'40355153279759': 'Inquire', '8153..."


#### MusicStack

In [21]:
%load_ext autoreload
%autoreload

####################################################################################################
## Create Artist ID Lookup
####################################################################################################
from lookup import createArtistIDMap
createArtistIDMap(discMS)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getSlimArtistDB
discSlimArtistMSDB = getSlimArtistDB(discMS, force=True)
discSlimArtistMSDB.head()


####################################################################################################
## Create Artist ID to Album ID Lookup
####################################################################################################
from lookup import createArtistAlbumIDMap
createArtistAlbumIDMap(discMS)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getArtistAlbumsDB
discArtistMSAlbumsDB = getArtistAlbumsDB(discMS, force=True)
discArtistMSAlbumsDB.head()

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
Current Time is Sun Apr 12, 2020 13:11:26 for Creating Artist DBs
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/0-Metadata.p  	0 2
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/1-Metadata.p  	1 3
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/10-Metadata.p  	2 7
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/11-Metadata.p  	3 12
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/12-Metadata.p  	4 13
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/13-Metadata.p  	5 16
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/16-Metadata.p  	6 17
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/17-Metadata.p  	7 18
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/18-Metadata.p  	8 21
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/19-Metadata.p  	9 23
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/2-Metadata.p  	10 26
/Volumes/Biggy/Discog/artists-musicst

/Volumes/Biggy/Discog/artists-musicstack-db/metadata/21-MediaMetadata.p 	29        0         72        
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/23-MediaMetadata.p 	34        0         83        
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/24-MediaMetadata.p 	38        0         90        
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/25-MediaMetadata.p 	40        0         92        
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/26-MediaMetadata.p 	41        0         93        
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/27-MediaMetadata.p 	44        0         96        
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/28-MediaMetadata.p 	47        0         100       
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/29-MediaMetadata.p 	50        0         106       
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/30-MediaMetadata.p 	52        0         114       
/Volumes/Biggy/Discog/artists-musicstack-db/metadata/31-MediaMet

  --> This file is 16.8kB.
Current Time is Sun Apr 12, 2020 13:11:27 for Done with 
Process [Done with 


Unnamed: 0,Albums
574300,{'MixTape': {'5653704': 'Pierced Pussy Lips'}}
8962700,"{'MixTape': {'6636854': 'Commando Of Love', '4..."
9790801,"{'MixTape': {'7790478': 'Jesus, He Brings Me J..."
7623910,{'MixTape': {'7814021': 'Analia Y Los Accesori...
5562310,{'MixTape': {'7161584': 'Supersloop'}}


#### MetalStorm

In [8]:
%load_ext autoreload
%autoreload

####################################################################################################
## Create Artist ID Lookup
####################################################################################################
from lookup import createArtistIDMap
createArtistIDMap(discMT)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getSlimArtistDB
discSlimArtistMTDB = getSlimArtistDB(discMT, force=True)
discSlimArtistMTDB.head()


####################################################################################################
## Create Artist ID to Album ID Lookup
####################################################################################################
from lookup import createArtistAlbumIDMap
createArtistAlbumIDMap(discMT)


####################################################################################################
## Create Artist ID Pandas DataFrame
####################################################################################################
from masterdb import getArtistAlbumsDB
discArtistMTAlbumsDB = getArtistAlbumsDB(discMT, force=True)
discArtistMTAlbumsDB.head()

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
Current Time is Sat Apr 11, 2020 19:22:46 for Creating Artist DBs
/Volumes/Biggy/Discog/artists-metalstorm-db/metadata/0-Metadata.p  	0 11



Saving 11 entries to /Volumes/Biggy/Discog/db-metalstorm/ArtistIDToRef.p

Saving data to /Volumes/Biggy/Discog/db-metalstorm/ArtistIDToRef.p
  --> This file is 195B.
Saved data to /Volumes/Biggy/Discog/db-metalstorm/ArtistIDToRef.p
  --> This file is 195B.
Saving 11 entries to /Volumes/Biggy/Discog/db-metalstorm/ArtistIDToName.p

Saving data to /Volumes/Biggy/Discog/db-metalstorm/ArtistIDToName.p
  --> This file is 251B.
Saved data to /Volumes/Biggy/Discog/db-metalstorm/ArtistIDToName.p
  --> This file is 251B.
Saving 11 entries to /Volumes/Biggy/Discog/db-metalstorm/ArtistIDToVariations.p

Saving data to /Volumes/Biggy/Discog/db-metalstorm/ArtistIDToVariations.p
  --> This file is 283B.
Saved data to /Volumes/Biggy/Discog/db-metalstorm/ArtistIDToVariations.p


Unnamed: 0,Albums
10100,{'Album': {'94150': 'A Misanthrope's Guide To ...
10400,"{'EP': {'96928': 'Horizons', '96927': 'Cénotap..."
11400,{'Album': {'107463': 'Before The Gates Of Gomo...
1500,"{'EP': {'6208': 'Bloodridden Disease'}, 'Album..."
2500,{'Album': {'18430': 'Bloody Tales Of Disgraced...


***
***
***

## Artist ID --> Genre, Style, Artists Lookup Table

In [None]:
## Build the artist metadata lookup for `discAM` (presumably the AllMusic source -- confirm).
## `discAM` must already exist from an earlier cell.
%load_ext autoreload
%autoreload
from lookup import createArtistMetadataMap
createArtistMetadataMap(discAM)

In [None]:
## Build the artist metadata lookup for `discDC` (presumably the Discogs source -- confirm).
## `discDC` must already exist from an earlier cell.
%load_ext autoreload
%autoreload
from lookup import createArtistMetadataMap
createArtistMetadataMap(discDC)

## Album ID --> Name, Ref, Artists Lookup Table

In [None]:
## Build the album-ID lookup for `disc`.
## NOTE(review): `disc` is not defined in this part of the notebook -- confirm which source it
## refers to before running.
%load_ext autoreload
%autoreload
from lookup import createAlbumIDMap
createAlbumIDMap(disc)

# Master Lookup Tests

In [None]:
## Run the lookup-map checks from the `lookup` module against `disc`.
## Presumably expects the lookup maps for `disc` to have been created already -- confirm.
%load_ext autoreload
%autoreload
from lookup import testLookupMaps
testLookupMaps(disc)

In [None]:

# NOTE(review): the result is stored under an "LM" name but is built from `discRM`. The
# per-source cells in this notebook pair matching tags (e.g. discDP -> discArtistDPAlbumsDB),
# so confirm whether `discRM` is the intended source or a copy-paste slip.
# Relies on `getArtistAlbumsDB` having been imported by an earlier cell.
discArtistLMAlbumsDB = getArtistAlbumsDB(discRM, force=False)

In [None]:
from collections import Counter

# Tally how many artists carry each top-level key in their "Albums" entry
# (presumably the keys are media types such as 'Albums' or 'MixTape' -- confirm).
cntr = Counter()
for artistData in discArtistLMAlbumsDB["Albums"]:
    # Counter.update adds one per element of the iterable, i.e. one per key.
    cntr.update(artistData.keys())
cntr

# Pandas DB

## Slim Artist DB

In [None]:
# Get the slim artist DataFrame for `disc` and preview its first rows.
# `disc` must already exist from an earlier cell; `force` is left at its default here.
from masterdb import getSlimArtistDB
discSlimArtistDB = getSlimArtistDB(disc)
discSlimArtistDB.head()

## Artist DB

In [None]:
from masterdb import getArtistDB

In [None]:
# Get the artist DB for `disc` and preview its first rows.
# Needs `getArtistDB` (imported in the previous cell) and `disc` from an earlier cell.
discArtistDB = getArtistDB(disc)
discArtistDB.head()

## Artist Metadata DB

In [None]:
from masterdb import getArtistMetadataDB

In [None]:
# Get the artist metadata DB for `disc` and preview its first rows.
# Needs `getArtistMetadataDB` (imported in the previous cell) and `disc` from an earlier cell.
discArtistMetadataDB = getArtistMetadataDB(disc)
discArtistMetadataDB.head()

## Artist Albums DB

In [None]:
from masterdb import getArtistAlbumsDB

In [None]:
# Get the artist-albums DB for `disc` with force=False and preview its first rows.
# Presumably force=False reuses a previously saved copy when one exists -- confirm in masterdb.
discArtistAlbumsDB = getArtistAlbumsDB(disc, force=False)
discArtistAlbumsDB.head()

In [None]:
# Same call as the cell that passes force=False, but with `force` left at its default.
# This rebinds `discArtistAlbumsDB`, so whichever of the two cells ran last determines the value
# that later cells see.
# NOTE(review): confirm the default of `force` and whether both cells are still needed.
discArtistAlbumsDB = getArtistAlbumsDB(disc)
discArtistAlbumsDB.head()

## Albums DB

In [None]:
from masterdb import getAlbumDB

In [None]:
# Get the albums DB for `disc` and preview its first rows.
# Needs `getAlbumDB` (imported in the previous cell) and `disc` from an earlier cell.
discAlbumDB = getAlbumDB(disc)
discAlbumDB.head()

## Artist Album ID --> Known Albums

In [None]:
from masterdb import getArtistAlbumKnownDB

In [None]:
# Combine the albums DB and the artist-albums DB into the known-albums DB and preview it.
# Both inputs are produced by earlier cells (`discAlbumDB`, `discArtistAlbumsDB`), so those
# cells must have been run first.
discArtistAlbumKnownDB = getArtistAlbumKnownDB(discAlbumDB, discArtistAlbumsDB)
discArtistAlbumKnownDB.head()

# Joining Artist ID DataFrame

In [None]:
from masterdb import createMasterDB

In [None]:
# Build the master DB from the artist, artist-metadata and known-albums frames created above.
# All four arguments come from earlier cells; the return value (if any) is not captured.
createMasterDB(disc, discArtistDB, discArtistMetadataDB, discArtistAlbumKnownDB)

In [None]:
from random import random