# Similarity experiment 2: comparing performance of FONN similarity tools across three tune families.


# Extract all tune titles for target tune family:

In [11]:
import pandas as pd


# Load the ground-truth table for the target tune family and list its member tunes.
# NOTE(review): root_dir is an absolute, machine-specific path -- adjust it when running elsewhere.
root_dir = '/Users/dannydiamond/NUIG/Polifonia/thesession/test_corpus/tune_fams_ground_truth'
tune_family = 'blackbird'

# Announce the read *before* it starts, so the message is still shown if the read fails.
print("Reading input data...")
# The first CSV column is used as the row index; the 'title' column is read below.
input_data = pd.read_csv(f'{root_dir}/{tune_family}.csv', index_col=0)
print(input_data.head())

# Flatten the 'title' column into a plain list; the experiment loop iterates over it.
tune_family_members = input_data['title'].tolist()
print(f"\n\nTune family to be tested: {tune_family.capitalize()}")
for tune in tune_family_members:
    print(tune)

print(f"Number of tunes in family: {len(tune_family_members)}")






Reading input data...
               title
0   BlackbirdThe1104
1  BlackbirdThe14355
2  BlackbirdThe14356
3  BlackbirdThe14357
4  BlackbirdThe15415


Tune family to be tested: Blackbird
BlackbirdThe1104
BlackbirdThe14355
BlackbirdThe14356
BlackbirdThe14357
BlackbirdThe15415
BlackbirdThe17110
BlackbirdThe17111
BlackbirdThe17112
BlackbirdThe1996
BlackbirdThe24050
BlackbirdThe26494
BlackbirdThe27198
BlackbirdThe28174
BlackbirdThe28821
BlackbirdThe31201
BlackbirdThe32399
BlackbirdThe34225
BlackbirdThe36690
BlackbirdThe39782
BlackbirdThe4101
BlackbirdThe4508
QueenOfTheEarthChildOfTheSkies27066
Number of tunes in family: 22


# Set up an instance of the similarity experiment:


In [12]:
from similarity_search import PatternSimilarity

# Create the experiment object from the n-gram pattern corpus file, then have it
# calculate tune lengths from the accent-level feature sequence corpus.
print('Initializing experimental instance...')

inpath = '/Users/dannydiamond/NUIG/Polifonia/thesession/3_7gram_pattern_corpus/pitch_class_accent_ngrams.pkl'
feat_seq_path = '/Users/dannydiamond/NUIG/Polifonia/thesession/feat_seq_corpus/feat_seq_accents'

similarity_experiment = PatternSimilarity(inpath)
similarity_experiment.calculate_tune_lengths(feat_seq_path=feat_seq_path)

print("Experiment successfully initialized.")

Initializing experimental instance...
Calculating tune lengths:
MrsJamesMacInnesEdinburgh36755:
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe20663  \
length                        33               62               32   

        WellAllLieTogether19130  LInconnuDeLimoise17950  MerryReapersThe35815  \
length                       48                      29                    64   

        GanAinm7377  ...  OlympusMons41569  MineAinHoose36350  PulletThe8003  \
length           64  ...                96                 18             65   

        SilverTipThe42437  BumperSquireJones2623  CatInTheCornerThe36729  \
length                 32                     17                      64   

        AnUglyCustomer32800  RustyGulleyThe30917  HuntThe29171  \
length                   32                   16            81 

# Set up inputs, outputs, and parameters, then run the experiment:

In [13]:
# Experimental parameters: the two alternative pattern extraction methods,
# 'idx' (index) and 'max' (maximum tf-idf).
modes = ['idx', 'max']
# Maps the normalize flag handed to the calc_* methods onto the label used in the
# output path, so that both normalized and raw results are written.
norm = {True: 'norm', False: 'raw'}

# Set output paths, printing each one to confirm.
results_root_dir = f"/Users/dannydiamond/NUIG/Polifonia/thesession/similarity_results/similarity_experiment_2ii/{tune_family}"
print("Paths for pattern results output files:")
for tune in tune_family_members:
    print(tune)
    for m in modes:
        # Raw pattern similarity results are stored here:
        similarity_experiment.pattern_results_path = f"{results_root_dir}/{tune}/patterns/{m}/"
        for n in norm.items():
            normalize_flag, norm_label = n
            # Tune similarity results (presence and frequency count) share one output path:
            out_path = f"{results_root_dir}/{tune}/results/fonn/{m}/{norm_label}"
            similarity_experiment.presence_results_path = out_path
            similarity_experiment.freq_count_results_path = out_path
            print(similarity_experiment.presence_results_path)
            # Run experiment.
            # NOTE(review): the next three calls do not take the normalize flag, so they
            # repeat for each entry of `norm`; hoisting them out of this inner loop looks
            # possible but depends on PatternSimilarity internals -- confirm before changing.
            similarity_experiment.extract_candidate_patterns(title=tune, mode=m, indices=[0], n=6)
            similarity_experiment.find_similar_patterns(edit_dist_threshold=1)
            similarity_experiment.find_similar_tunes()
            similarity_experiment.calc_pattern_presence_results(normalize=normalize_flag)
            similarity_experiment.calc_freq_count_results(normalize=normalize_flag)

Paths for pattern results output files:
BlackbirdThe1104
/Users/dannydiamond/NUIG/Polifonia/thesession/similarity_results/similarity_experiment_2ii/blackbird/BlackbirdThe1104/results/fonn/idx/norm
Reading input data...
       ngram   freq  doc_freq      idf  BoysOfPatstaiThe4772  \
0  (0, 0, 7)  21543      9215  4.40013                     0   
1  (0, 0, 0)  27778      8647  4.46300                     0   
2  (2, 0, 0)  20765      8411  4.49035                     0   
3  (0, 7, 0)  22462      8327  4.50028                     0   
4  (7, 0, 0)  19956      8075  4.53067                     0   

   MouldyPintThe7496  LongfordCollectorThe24745  BraesOfTulliemetThe23904  \
0                  4                          0                         0   
1                  8                          4                         0   
2                  0                          7                         2   
3                  2                          0                         0   
4          

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1792826.09it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe1104:
(0, 4, 4, 7, 4, 5)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 423772.29it/s]



72 Similar patterns detected:
                    ngram  DL distance
28     (0, 4, 4, 7, 4, 5)          0.0
0         (0, 4, 4, 7, 4)          1.0
50  (0, 4, 4, 7, 4, 5, 5)          1.0
49  (0, 4, 4, 7, 4, 5, 9)          1.0
48  (0, 4, 4, 7, 4, 5, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
TouristThe24037                  2
TouristThe29507                  3
CarmelMahoneyMulhaire15948       1
Zamora42034                      2
OffToPuckFair16187               1
                                ..
CarmelMahoneyMulhaire33772       1
BigJohns34647                    1
SmithsAGallantFiremanThe17303    1
LizaLynn15920                    1
FrancisOConnors29682             2
Name: pattern presence, Length: 761, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

       

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2201658.69it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe1104:
(0, 4, 4, 7, 4, 5)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 454894.23it/s]



72 Similar patterns detected:
                    ngram  DL distance
28     (0, 4, 4, 7, 4, 5)          0.0
0         (0, 4, 4, 7, 4)          1.0
50  (0, 4, 4, 7, 4, 5, 5)          1.0
49  (0, 4, 4, 7, 4, 5, 9)          1.0
48  (0, 4, 4, 7, 4, 5, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
TouristThe24037                  2
TouristThe29507                  3
CarmelMahoneyMulhaire15948       1
Zamora42034                      2
OffToPuckFair16187               1
                                ..
CarmelMahoneyMulhaire33772       1
BigJohns34647                    1
SmithsAGallantFiremanThe17303    1
LizaLynn15920                    1
FrancisOConnors29682             2
Name: pattern presence, Length: 761, dtype: int64
Similarity results for BlackbirdThe1104 (pattern presence):
                 title  pattern presence
0     BlackbirdThe1104                 7
1   LaGrandeChaine3489                 7
2  LaGrandeChaine26064                

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2059278.39it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 429288.61it/s]



72 Similar patterns detected:
                    ngram  DL distance
28     (0, 4, 4, 7, 4, 5)          0.0
0         (0, 4, 4, 7, 4)          1.0
50  (0, 4, 4, 7, 4, 5, 5)          1.0
49  (0, 4, 4, 7, 4, 5, 9)          1.0
48  (0, 4, 4, 7, 4, 5, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
TouristThe24037                  2
TouristThe29507                  3
CarmelMahoneyMulhaire15948       1
Zamora42034                      2
OffToPuckFair16187               1
                                ..
CarmelMahoneyMulhaire33772       1
BigJohns34647                    1
SmithsAGallantFiremanThe17303    1
LizaLynn15920                    1
FrancisOConnors29682             2
Name: pattern presence, Length: 761, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

       

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1936730.48it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 433453.41it/s]



72 Similar patterns detected:
                    ngram  DL distance
28     (0, 4, 4, 7, 4, 5)          0.0
0         (0, 4, 4, 7, 4)          1.0
50  (0, 4, 4, 7, 4, 5, 5)          1.0
49  (0, 4, 4, 7, 4, 5, 9)          1.0
48  (0, 4, 4, 7, 4, 5, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
TouristThe24037                  2
TouristThe29507                  3
CarmelMahoneyMulhaire15948       1
Zamora42034                      2
OffToPuckFair16187               1
                                ..
CarmelMahoneyMulhaire33772       1
BigJohns34647                    1
SmithsAGallantFiremanThe17303    1
LizaLynn15920                    1
FrancisOConnors29682             2
Name: pattern presence, Length: 761, dtype: int64
Similarity results for BlackbirdThe1104 (pattern presence):
                 title  pattern presence
0     BlackbirdThe1104                 7
1   LaGrandeChaine3489                 7
2  LaGrandeChaine26064                

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1981645.66it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe14355:
(7, 11, 11, 2, 11, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:02<00:00, 356300.55it/s]



50 Similar patterns detected:
                    ngram  DL distance
8   (7, 11, 11, 2, 11, 0)          0.0
0       (7, 11, 2, 11, 0)          1.0
27   (7, 11, 0, 2, 11, 0)          1.0
28  (7, 11, 11, 0, 11, 0)          1.0
29   (7, 11, 11, 2, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
DublinLadsThe4994           1
Vallafield8987              1
Bagpipe19817                1
YoungScotty8357             1
BunkerHill29203             1
                           ..
ShelburneThe23777           1
RockingTheCradle11617       1
HakketoneSchottische2676    1
GanAinm38701                3
CalCallaghans36448          1
Name: pattern presence, Length: 155, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe2

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1902126.48it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe14355:
(7, 11, 11, 2, 11, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 437676.35it/s]



50 Similar patterns detected:
                    ngram  DL distance
8   (7, 11, 11, 2, 11, 0)          0.0
0       (7, 11, 2, 11, 0)          1.0
27   (7, 11, 0, 2, 11, 0)          1.0
28  (7, 11, 11, 0, 11, 0)          1.0
29   (7, 11, 11, 2, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
DublinLadsThe4994           1
Vallafield8987              1
Bagpipe19817                1
YoungScotty8357             1
BunkerHill29203             1
                           ..
ShelburneThe23777           1
RockingTheCradle11617       1
HakketoneSchottische2676    1
GanAinm38701                3
CalCallaghans36448          1
Name: pattern presence, Length: 155, dtype: int64
Similarity results for BlackbirdThe14355 (pattern presence):
               title  pattern presence
0  BlackbirdThe14357                 8
1  BlackbirdThe34225                 8
2  BlackbirdThe14355                 7
3  BlackbirdThe14356                 7
4      DerryThe19062

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2074293.14it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 435732.87it/s]



50 Similar patterns detected:
                    ngram  DL distance
8   (7, 11, 11, 2, 11, 0)          0.0
0       (7, 11, 2, 11, 0)          1.0
27   (7, 11, 0, 2, 11, 0)          1.0
28  (7, 11, 11, 0, 11, 0)          1.0
29   (7, 11, 11, 2, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
DublinLadsThe4994           1
Vallafield8987              1
Bagpipe19817                1
YoungScotty8357             1
BunkerHill29203             1
                           ..
ShelburneThe23777           1
RockingTheCradle11617       1
HakketoneSchottische2676    1
GanAinm38701                3
CalCallaghans36448          1
Name: pattern presence, Length: 155, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe2

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1895212.77it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 392221.50it/s]



50 Similar patterns detected:
                    ngram  DL distance
8   (7, 11, 11, 2, 11, 0)          0.0
0       (7, 11, 2, 11, 0)          1.0
27   (7, 11, 0, 2, 11, 0)          1.0
28  (7, 11, 11, 0, 11, 0)          1.0
29   (7, 11, 11, 2, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
DublinLadsThe4994           1
Vallafield8987              1
Bagpipe19817                1
YoungScotty8357             1
BunkerHill29203             1
                           ..
ShelburneThe23777           1
RockingTheCradle11617       1
HakketoneSchottische2676    1
GanAinm38701                3
CalCallaghans36448          1
Name: pattern presence, Length: 155, dtype: int64
Similarity results for BlackbirdThe14355 (pattern presence):
               title  pattern presence
0  BlackbirdThe14357                 8
1  BlackbirdThe34225                 8
2  BlackbirdThe14355                 7
3  BlackbirdThe14356                 7
4      DerryThe19062

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2114715.82it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe14356:
(7, 11, 11, 2, 11, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:02<00:00, 369601.18it/s]



50 Similar patterns detected:
                    ngram  DL distance
8   (7, 11, 11, 2, 11, 0)          0.0
0       (7, 11, 2, 11, 0)          1.0
27   (7, 11, 0, 2, 11, 0)          1.0
28  (7, 11, 11, 0, 11, 0)          1.0
29   (7, 11, 11, 2, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
DublinLadsThe4994           1
Vallafield8987              1
Bagpipe19817                1
YoungScotty8357             1
BunkerHill29203             1
                           ..
ShelburneThe23777           1
RockingTheCradle11617       1
HakketoneSchottische2676    1
GanAinm38701                3
CalCallaghans36448          1
Name: pattern presence, Length: 155, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe2

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2161950.20it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe14356:
(7, 11, 11, 2, 11, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 446504.91it/s]



50 Similar patterns detected:
                    ngram  DL distance
8   (7, 11, 11, 2, 11, 0)          0.0
0       (7, 11, 2, 11, 0)          1.0
27   (7, 11, 0, 2, 11, 0)          1.0
28  (7, 11, 11, 0, 11, 0)          1.0
29   (7, 11, 11, 2, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
DublinLadsThe4994           1
Vallafield8987              1
Bagpipe19817                1
YoungScotty8357             1
BunkerHill29203             1
                           ..
ShelburneThe23777           1
RockingTheCradle11617       1
HakketoneSchottische2676    1
GanAinm38701                3
CalCallaghans36448          1
Name: pattern presence, Length: 155, dtype: int64
Similarity results for BlackbirdThe14356 (pattern presence):
               title  pattern presence
0  BlackbirdThe14357                 8
1  BlackbirdThe34225                 8
2  BlackbirdThe14355                 7
3  BlackbirdThe14356                 7
4      DerryThe19062

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1999312.46it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 440070.67it/s]



50 Similar patterns detected:
                    ngram  DL distance
8   (7, 11, 11, 2, 11, 0)          0.0
0       (7, 11, 2, 11, 0)          1.0
27   (7, 11, 0, 2, 11, 0)          1.0
28  (7, 11, 11, 0, 11, 0)          1.0
29   (7, 11, 11, 2, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
DublinLadsThe4994           1
Vallafield8987              1
Bagpipe19817                1
YoungScotty8357             1
BunkerHill29203             1
                           ..
ShelburneThe23777           1
RockingTheCradle11617       1
HakketoneSchottische2676    1
GanAinm38701                3
CalCallaghans36448          1
Name: pattern presence, Length: 155, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe2

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2119079.52it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 455132.50it/s]



50 Similar patterns detected:
                    ngram  DL distance
8   (7, 11, 11, 2, 11, 0)          0.0
0       (7, 11, 2, 11, 0)          1.0
27   (7, 11, 0, 2, 11, 0)          1.0
28  (7, 11, 11, 0, 11, 0)          1.0
29   (7, 11, 11, 2, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
DublinLadsThe4994           1
Vallafield8987              1
Bagpipe19817                1
YoungScotty8357             1
BunkerHill29203             1
                           ..
ShelburneThe23777           1
RockingTheCradle11617       1
HakketoneSchottische2676    1
GanAinm38701                3
CalCallaghans36448          1
Name: pattern presence, Length: 155, dtype: int64
Similarity results for BlackbirdThe14356 (pattern presence):
               title  pattern presence
0  BlackbirdThe14357                 8
1  BlackbirdThe34225                 8
2  BlackbirdThe14355                 7
3  BlackbirdThe14356                 7
4      DerryThe19062

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2174960.71it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe14357:
(7, 11, 11, 2, 11, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 418760.96it/s]



50 Similar patterns detected:
                    ngram  DL distance
8   (7, 11, 11, 2, 11, 0)          0.0
0       (7, 11, 2, 11, 0)          1.0
27   (7, 11, 0, 2, 11, 0)          1.0
28  (7, 11, 11, 0, 11, 0)          1.0
29   (7, 11, 11, 2, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
DublinLadsThe4994           1
Vallafield8987              1
Bagpipe19817                1
YoungScotty8357             1
BunkerHill29203             1
                           ..
ShelburneThe23777           1
RockingTheCradle11617       1
HakketoneSchottische2676    1
GanAinm38701                3
CalCallaghans36448          1
Name: pattern presence, Length: 155, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe2

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1978805.12it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe14357:
(7, 11, 11, 2, 11, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 456463.36it/s]



50 Similar patterns detected:
                    ngram  DL distance
8   (7, 11, 11, 2, 11, 0)          0.0
0       (7, 11, 2, 11, 0)          1.0
27   (7, 11, 0, 2, 11, 0)          1.0
28  (7, 11, 11, 0, 11, 0)          1.0
29   (7, 11, 11, 2, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
DublinLadsThe4994           1
Vallafield8987              1
Bagpipe19817                1
YoungScotty8357             1
BunkerHill29203             1
                           ..
ShelburneThe23777           1
RockingTheCradle11617       1
HakketoneSchottische2676    1
GanAinm38701                3
CalCallaghans36448          1
Name: pattern presence, Length: 155, dtype: int64
Similarity results for BlackbirdThe14357 (pattern presence):
               title  pattern presence
0  BlackbirdThe14357                 8
1  BlackbirdThe34225                 8
2  BlackbirdThe14355                 7
3  BlackbirdThe14356                 7
4      DerryThe19062

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1979409.80it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 444661.26it/s]



50 Similar patterns detected:
                    ngram  DL distance
8   (7, 11, 11, 2, 11, 0)          0.0
0       (7, 11, 2, 11, 0)          1.0
27   (7, 11, 0, 2, 11, 0)          1.0
28  (7, 11, 11, 0, 11, 0)          1.0
29   (7, 11, 11, 2, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
DublinLadsThe4994           1
Vallafield8987              1
Bagpipe19817                1
YoungScotty8357             1
BunkerHill29203             1
                           ..
ShelburneThe23777           1
RockingTheCradle11617       1
HakketoneSchottische2676    1
GanAinm38701                3
CalCallaghans36448          1
Name: pattern presence, Length: 155, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe2

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2136065.48it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 440696.66it/s]



50 Similar patterns detected:
                    ngram  DL distance
8   (7, 11, 11, 2, 11, 0)          0.0
0       (7, 11, 2, 11, 0)          1.0
27   (7, 11, 0, 2, 11, 0)          1.0
28  (7, 11, 11, 0, 11, 0)          1.0
29   (7, 11, 11, 2, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
DublinLadsThe4994           1
Vallafield8987              1
Bagpipe19817                1
YoungScotty8357             1
BunkerHill29203             1
                           ..
ShelburneThe23777           1
RockingTheCradle11617       1
HakketoneSchottische2676    1
GanAinm38701                3
CalCallaghans36448          1
Name: pattern presence, Length: 155, dtype: int64
Similarity results for BlackbirdThe14357 (pattern presence):
               title  pattern presence
0  BlackbirdThe14357                 8
1  BlackbirdThe34225                 8
2  BlackbirdThe14355                 7
3  BlackbirdThe14356                 7
4      DerryThe19062

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1868758.06it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe15415:
(4, 11, 9, 4, 2, 7)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 395246.08it/s]



51 Similar patterns detected:
                   ngram  DL distance
14   (4, 11, 9, 4, 2, 7)          0.0
0        (4, 9, 4, 2, 7)          1.0
28  (4, 11, 9, 4, 11, 7)          1.0
29   (4, 11, 9, 2, 2, 7)          1.0
30   (4, 11, 9, 4, 2, 4)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
GreenMountainThe33664                  1
RollingWavesThe30078                   2
SimonsWart9663                         1
LuachrachnsThe1851                     2
Newmarket331                           1
                                      ..
SeamusThompsons40888                   1
DiplodocusThe22648                     1
TolkaThe35403                          1
NielGowsLamentForHisSecondWife35334    1
LilyBobs41351                          2
Name: pattern presence, Length: 261, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1994033.73it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe15415:
(4, 11, 9, 4, 2, 7)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 409451.69it/s]



51 Similar patterns detected:
                   ngram  DL distance
14   (4, 11, 9, 4, 2, 7)          0.0
0        (4, 9, 4, 2, 7)          1.0
28  (4, 11, 9, 4, 11, 7)          1.0
29   (4, 11, 9, 2, 2, 7)          1.0
30   (4, 11, 9, 4, 2, 4)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
GreenMountainThe33664                  1
RollingWavesThe30078                   2
SimonsWart9663                         1
LuachrachnsThe1851                     2
Newmarket331                           1
                                      ..
SeamusThompsons40888                   1
DiplodocusThe22648                     1
TolkaThe35403                          1
NielGowsLamentForHisSecondWife35334    1
LilyBobs41351                          2
Name: pattern presence, Length: 261, dtype: int64
Similarity results for BlackbirdThe15415 (pattern presence):
                        title  pattern presence
0  FirstFlightOfGeeseThe36738                 5
1   

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1857607.02it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:02<00:00, 351254.00it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:02<00:00, 359235.76it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 425774.75it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 431351.99it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:02<00:00, 360504.01it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 371516.84it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 397183.33it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 393051.93it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:02<00:00, 355812.91it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 371808.44it/s]
Calculating pattern similarity...: 100%|██████████


1167 Similar patterns detected:
                      ngram  DL distance  (9, 4, 2, 0, 9, 4)  \
43       (4, 2, 7, 0, 4, 2)          0.0                 4.0   
1130     (4, 2, 1, 0, 4, 2)          1.0                 4.0   
122      (4, 2, 7, 0, 4, 0)          1.0                 4.0   
1120  (4, 2, 7, 4, 0, 4, 2)          1.0                 5.0   
120      (0, 2, 7, 0, 4, 2)          1.0                 5.0   

      (9, 0, 0, 7, 0, 9)  (2, 9, 0, 0, 7, 0)  (2, 7, 0, 4, 2, 0)  \
43                   5.0                 5.0                 2.0   
1130                 6.0                 5.0                 3.0   
122                  5.0                 4.0                 2.0   
1120                 6.0                 5.0                 3.0   
120                  4.0                 5.0                 2.0   

      (7, 0, 4, 2, 0, 9)  (9, 9, 4, 2, 0, 9)  (0, 9, 9, 4, 2, 0)  \
43                   4.0                 5.0                 5.0   
1130                 5.0             

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2136526.14it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 438590.02it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 442065.31it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 471211.10it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 448467.49it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 442452.80it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 413217.27it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 446750.26it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 388773.49it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 411064.51it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 389794.36it/s]
Calculating pattern similarity...: 100%|██████████


1167 Similar patterns detected:
                      ngram  DL distance  (9, 4, 2, 0, 9, 4)  \
43       (4, 2, 7, 0, 4, 2)          0.0                 4.0   
1130     (4, 2, 1, 0, 4, 2)          1.0                 4.0   
122      (4, 2, 7, 0, 4, 0)          1.0                 4.0   
1120  (4, 2, 7, 4, 0, 4, 2)          1.0                 5.0   
120      (0, 2, 7, 0, 4, 2)          1.0                 5.0   

      (9, 0, 0, 7, 0, 9)  (2, 9, 0, 0, 7, 0)  (2, 7, 0, 4, 2, 0)  \
43                   5.0                 5.0                 2.0   
1130                 6.0                 5.0                 3.0   
122                  5.0                 4.0                 2.0   
1120                 6.0                 5.0                 3.0   
120                  4.0                 5.0                 2.0   

      (7, 0, 4, 2, 0, 9)  (9, 9, 4, 2, 0, 9)  (0, 9, 9, 4, 2, 0)  \
43                   4.0                 5.0                 5.0   
1130                 5.0             

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1866335.14it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe17110:
(0, 4, 4, 5, 4, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 430077.43it/s]



81 Similar patterns detected:
                     ngram  DL distance
27      (0, 4, 4, 5, 4, 0)          0.0
0          (0, 4, 4, 4, 0)          1.0
57  (0, 4, 4, 5, 11, 4, 0)          1.0
56   (0, 9, 4, 4, 5, 4, 0)          1.0
55      (0, 4, 4, 4, 5, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
JudiqueHall12085        3
KansasCity30048         1
LuckyInLove39389        1
SoundAsATrout9610       1
FatherKellys6899        1
                       ..
EarlOfSpaceThe36462     1
PlanxtyJoeBurke28157    1
AnotherDay37522         1
Erins39725              1
FrancisOConnors29682    1
Name: pattern presence, Length: 1035, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe20663  \
length                       

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2063390.79it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe17110:
(0, 4, 4, 5, 4, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 471079.12it/s]



81 Similar patterns detected:
                     ngram  DL distance
27      (0, 4, 4, 5, 4, 0)          0.0
0          (0, 4, 4, 4, 0)          1.0
57  (0, 4, 4, 5, 11, 4, 0)          1.0
56   (0, 9, 4, 4, 5, 4, 0)          1.0
55      (0, 4, 4, 4, 5, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
JudiqueHall12085        3
KansasCity30048         1
LuckyInLove39389        1
SoundAsATrout9610       1
FatherKellys6899        1
                       ..
EarlOfSpaceThe36462     1
PlanxtyJoeBurke28157    1
AnotherDay37522         1
Erins39725              1
FrancisOConnors29682    1
Name: pattern presence, Length: 1035, dtype: int64
Similarity results for BlackbirdThe17110 (pattern presence):
                    title  pattern presence
0          CliffsThe33580                 7
1       BlackbirdThe17110                 7
2       BlackbirdThe17111                 7
3  ChampionOfTheSeas41964                 6
4    FarleyBridgeThe23757       

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2054104.51it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 475202.37it/s]



81 Similar patterns detected:
                     ngram  DL distance
27      (0, 4, 4, 5, 4, 0)          0.0
0          (0, 4, 4, 4, 0)          1.0
57  (0, 4, 4, 5, 11, 4, 0)          1.0
56   (0, 9, 4, 4, 5, 4, 0)          1.0
55      (0, 4, 4, 4, 5, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
JudiqueHall12085        3
KansasCity30048         1
LuckyInLove39389        1
SoundAsATrout9610       1
FatherKellys6899        1
                       ..
EarlOfSpaceThe36462     1
PlanxtyJoeBurke28157    1
AnotherDay37522         1
Erins39725              1
FrancisOConnors29682    1
Name: pattern presence, Length: 1035, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe20663  \
length                       

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2177576.00it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 480135.24it/s]



81 Similar patterns detected:
                     ngram  DL distance
27      (0, 4, 4, 5, 4, 0)          0.0
0          (0, 4, 4, 4, 0)          1.0
57  (0, 4, 4, 5, 11, 4, 0)          1.0
56   (0, 9, 4, 4, 5, 4, 0)          1.0
55      (0, 4, 4, 4, 5, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
JudiqueHall12085        3
KansasCity30048         1
LuckyInLove39389        1
SoundAsATrout9610       1
FatherKellys6899        1
                       ..
EarlOfSpaceThe36462     1
PlanxtyJoeBurke28157    1
AnotherDay37522         1
Erins39725              1
FrancisOConnors29682    1
Name: pattern presence, Length: 1035, dtype: int64
Similarity results for BlackbirdThe17110 (pattern presence):
                    title  pattern presence
0          CliffsThe33580                 7
1       BlackbirdThe17110                 7
2       BlackbirdThe17111                 7
3  ChampionOfTheSeas41964                 6
4    FarleyBridgeThe23757       

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2083763.27it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe17111:
(0, 4, 4, 5, 4, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 408188.47it/s]



81 Similar patterns detected:
                     ngram  DL distance
27      (0, 4, 4, 5, 4, 0)          0.0
0          (0, 4, 4, 4, 0)          1.0
57  (0, 4, 4, 5, 11, 4, 0)          1.0
56   (0, 9, 4, 4, 5, 4, 0)          1.0
55      (0, 4, 4, 4, 5, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
JudiqueHall12085        3
KansasCity30048         1
LuckyInLove39389        1
SoundAsATrout9610       1
FatherKellys6899        1
                       ..
EarlOfSpaceThe36462     1
PlanxtyJoeBurke28157    1
AnotherDay37522         1
Erins39725              1
FrancisOConnors29682    1
Name: pattern presence, Length: 1035, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe20663  \
length                       

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2128802.52it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe17111:
(0, 4, 4, 5, 4, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 472228.22it/s]



81 Similar patterns detected:
                     ngram  DL distance
27      (0, 4, 4, 5, 4, 0)          0.0
0          (0, 4, 4, 4, 0)          1.0
57  (0, 4, 4, 5, 11, 4, 0)          1.0
56   (0, 9, 4, 4, 5, 4, 0)          1.0
55      (0, 4, 4, 4, 5, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
JudiqueHall12085        3
KansasCity30048         1
LuckyInLove39389        1
SoundAsATrout9610       1
FatherKellys6899        1
                       ..
EarlOfSpaceThe36462     1
PlanxtyJoeBurke28157    1
AnotherDay37522         1
Erins39725              1
FrancisOConnors29682    1
Name: pattern presence, Length: 1035, dtype: int64
Similarity results for BlackbirdThe17111 (pattern presence):
                    title  pattern presence
0          CliffsThe33580                 7
1       BlackbirdThe17110                 7
2       BlackbirdThe17111                 7
3  ChampionOfTheSeas41964                 6
4    FarleyBridgeThe23757       

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2413800.22it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 467825.56it/s]



81 Similar patterns detected:
                     ngram  DL distance
27      (0, 4, 4, 5, 4, 0)          0.0
0          (0, 4, 4, 4, 0)          1.0
57  (0, 4, 4, 5, 11, 4, 0)          1.0
56   (0, 9, 4, 4, 5, 4, 0)          1.0
55      (0, 4, 4, 4, 5, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
JudiqueHall12085        3
KansasCity30048         1
LuckyInLove39389        1
SoundAsATrout9610       1
FatherKellys6899        1
                       ..
EarlOfSpaceThe36462     1
PlanxtyJoeBurke28157    1
AnotherDay37522         1
Erins39725              1
FrancisOConnors29682    1
Name: pattern presence, Length: 1035, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe20663  \
length                       

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2142342.11it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 477679.18it/s]



81 Similar patterns detected:
                     ngram  DL distance
27      (0, 4, 4, 5, 4, 0)          0.0
0          (0, 4, 4, 4, 0)          1.0
57  (0, 4, 4, 5, 11, 4, 0)          1.0
56   (0, 9, 4, 4, 5, 4, 0)          1.0
55      (0, 4, 4, 4, 5, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
JudiqueHall12085        3
KansasCity30048         1
LuckyInLove39389        1
SoundAsATrout9610       1
FatherKellys6899        1
                       ..
EarlOfSpaceThe36462     1
PlanxtyJoeBurke28157    1
AnotherDay37522         1
Erins39725              1
FrancisOConnors29682    1
Name: pattern presence, Length: 1035, dtype: int64
Similarity results for BlackbirdThe17111 (pattern presence):
                    title  pattern presence
0          CliffsThe33580                 7
1       BlackbirdThe17110                 7
2       BlackbirdThe17111                 7
3  ChampionOfTheSeas41964                 6
4    FarleyBridgeThe23757       

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2041258.11it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe17112:
(7, 0, 9, 11, 11, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 398099.53it/s]



58 Similar patterns detected:
                   ngram  DL distance
41  (7, 0, 9, 11, 11, 0)          0.0
0       (7, 0, 9, 11, 0)          1.0
31   (7, 0, 9, 0, 11, 0)          1.0
32   (7, 0, 9, 11, 5, 0)          1.0
33  (7, 0, 2, 11, 11, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
MissRowanDavies31729          2
NathanielGowsQuickstep9143    2
ODriscollsFavourite5735       1
BallyoranThe39611             1
MoleCatchersThe26053          1
                             ..
ShelburneThe23777             1
ImWaitingForYou3615           1
RosinTheBow24014              1
Jeans255                      1
SwingingOnTheGate12939        2
Name: pattern presence, Length: 425, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1890065.68it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe17112:
(7, 0, 9, 11, 11, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 391215.99it/s]



58 Similar patterns detected:
                   ngram  DL distance
41  (7, 0, 9, 11, 11, 0)          0.0
0       (7, 0, 9, 11, 0)          1.0
31   (7, 0, 9, 0, 11, 0)          1.0
32   (7, 0, 9, 11, 5, 0)          1.0
33  (7, 0, 2, 11, 11, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
MissRowanDavies31729          2
NathanielGowsQuickstep9143    2
ODriscollsFavourite5735       1
BallyoranThe39611             1
MoleCatchersThe26053          1
                             ..
ShelburneThe23777             1
ImWaitingForYou3615           1
RosinTheBow24014              1
Jeans255                      1
SwingingOnTheGate12939        2
Name: pattern presence, Length: 425, dtype: int64
Similarity results for BlackbirdThe17112 (pattern presence):
                   title  pattern presence
0      BlackbirdThe17112                 5
1  ReturnOfSpringThe6645                 5
2  KilfenoraLassThe32439                 4
3        OffSheGoes14399   

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2119612.91it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 445609.14it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 461107.32it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 457209.27it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 455778.25it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 455868.98it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 451095.30it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 445768.89it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 466761.01it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 450348.91it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 458041.93it/s]
Calculating pattern similarity...: 100%|██████████


1132 Similar patterns detected:
                        ngram  DL distance  (2, 7, 11, 7, 7, 0)  \
127      (7, 11, 5, 2, 7, 11)          0.0                  4.0   
1097  (5, 7, 11, 5, 2, 7, 11)          1.0                  4.0   
143      (7, 11, 9, 2, 7, 11)          1.0                  4.0   
933       (7, 11, 5, 2, 7, 5)          1.0                  4.0   
932       (7, 11, 5, 2, 7, 9)          1.0                  4.0   

      (11, 5, 2, 7, 11, 7)  (7, 11, 7, 7, 0, 9)  (2, 7, 11, 5, 2, 7)  \
127                    2.0                  4.0                  2.0   
1097                   3.0                  5.0                  2.0   
143                    3.0                  4.0                  3.0   
933                    3.0                  4.0                  2.0   
932                    3.0                  3.0                  2.0   

      (0, 11, 7, 2, 7, 11)  (5, 2, 7, 11, 7, 7)  (11, 11, 0, 11, 7, 2)  \
127                    2.0                  4.0          

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2135496.70it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 445764.54it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 456352.77it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 452108.83it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 462062.43it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 451841.94it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 455414.49it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 448957.92it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 471402.53it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 466337.98it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 455999.86it/s]
Calculating pattern similarity...: 100%|██████████


1132 Similar patterns detected:
                        ngram  DL distance  (2, 7, 11, 7, 7, 0)  \
127      (7, 11, 5, 2, 7, 11)          0.0                  4.0   
1097  (5, 7, 11, 5, 2, 7, 11)          1.0                  4.0   
143      (7, 11, 9, 2, 7, 11)          1.0                  4.0   
933       (7, 11, 5, 2, 7, 5)          1.0                  4.0   
932       (7, 11, 5, 2, 7, 9)          1.0                  4.0   

      (11, 5, 2, 7, 11, 7)  (7, 11, 7, 7, 0, 9)  (2, 7, 11, 5, 2, 7)  \
127                    2.0                  4.0                  2.0   
1097                   3.0                  5.0                  2.0   
143                    3.0                  4.0                  3.0   
933                    3.0                  4.0                  2.0   
932                    3.0                  3.0                  2.0   

      (0, 11, 7, 2, 7, 11)  (5, 2, 7, 11, 7, 7)  (11, 11, 0, 11, 7, 2)  \
127                    2.0                  4.0          

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2027643.33it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe1996:
(4, 11, 9, 4, 2, 7)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:02<00:00, 341689.72it/s]



51 Similar patterns detected:
                   ngram  DL distance
14   (4, 11, 9, 4, 2, 7)          0.0
0        (4, 9, 4, 2, 7)          1.0
28  (4, 11, 9, 4, 11, 7)          1.0
29   (4, 11, 9, 2, 2, 7)          1.0
30   (4, 11, 9, 4, 2, 4)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
GreenMountainThe33664                  1
RollingWavesThe30078                   2
SimonsWart9663                         1
LuachrachnsThe1851                     2
Newmarket331                           1
                                      ..
SeamusThompsons40888                   1
DiplodocusThe22648                     1
TolkaThe35403                          1
NielGowsLamentForHisSecondWife35334    1
LilyBobs41351                          2
Name: pattern presence, Length: 261, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2058623.94it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe1996:
(4, 11, 9, 4, 2, 7)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 390942.01it/s]



51 Similar patterns detected:
                   ngram  DL distance
14   (4, 11, 9, 4, 2, 7)          0.0
0        (4, 9, 4, 2, 7)          1.0
28  (4, 11, 9, 4, 11, 7)          1.0
29   (4, 11, 9, 2, 2, 7)          1.0
30   (4, 11, 9, 4, 2, 4)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
GreenMountainThe33664                  1
RollingWavesThe30078                   2
SimonsWart9663                         1
LuachrachnsThe1851                     2
Newmarket331                           1
                                      ..
SeamusThompsons40888                   1
DiplodocusThe22648                     1
TolkaThe35403                          1
NielGowsLamentForHisSecondWife35334    1
LilyBobs41351                          2
Name: pattern presence, Length: 261, dtype: int64
Similarity results for BlackbirdThe1996 (pattern presence):
                        title  pattern presence
0  FirstFlightOfGeeseThe36738                 5
1    

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1367307.35it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 394736.62it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 441511.20it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:02<00:00, 363170.67it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 438158.57it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 392211.56it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:02<00:00, 342616.32it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 415254.47it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 426815.49it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 392663.20it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 377864.28it/s]
Calculating pattern similarity...: 100%|█████████


1167 Similar patterns detected:
                      ngram  DL distance  (9, 4, 2, 0, 9, 4)  \
43       (4, 2, 7, 0, 4, 2)          0.0                 4.0   
1130     (4, 2, 1, 0, 4, 2)          1.0                 4.0   
122      (4, 2, 7, 0, 4, 0)          1.0                 4.0   
1120  (4, 2, 7, 4, 0, 4, 2)          1.0                 5.0   
120      (0, 2, 7, 0, 4, 2)          1.0                 5.0   

      (9, 0, 0, 7, 0, 9)  (2, 9, 0, 0, 7, 0)  (2, 7, 0, 4, 2, 0)  \
43                   5.0                 5.0                 2.0   
1130                 6.0                 5.0                 3.0   
122                  5.0                 4.0                 2.0   
1120                 6.0                 5.0                 3.0   
120                  4.0                 5.0                 2.0   

      (7, 0, 4, 2, 0, 9)  (9, 9, 4, 2, 0, 9)  (0, 9, 9, 4, 2, 0)  \
43                   4.0                 5.0                 5.0   
1130                 5.0             

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2108599.79it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 443426.87it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 453158.62it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 465191.59it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 440180.61it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 436891.59it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 416850.99it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 456695.02it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 439278.36it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 378257.01it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 398007.62it/s]
Calculating pattern similarity...: 100%|██████████


1167 Similar patterns detected:
                      ngram  DL distance  (9, 4, 2, 0, 9, 4)  \
43       (4, 2, 7, 0, 4, 2)          0.0                 4.0   
1130     (4, 2, 1, 0, 4, 2)          1.0                 4.0   
122      (4, 2, 7, 0, 4, 0)          1.0                 4.0   
1120  (4, 2, 7, 4, 0, 4, 2)          1.0                 5.0   
120      (0, 2, 7, 0, 4, 2)          1.0                 5.0   

      (9, 0, 0, 7, 0, 9)  (2, 9, 0, 0, 7, 0)  (2, 7, 0, 4, 2, 0)  \
43                   5.0                 5.0                 2.0   
1130                 6.0                 5.0                 3.0   
122                  5.0                 4.0                 2.0   
1120                 6.0                 5.0                 3.0   
120                  4.0                 5.0                 2.0   

      (7, 0, 4, 2, 0, 9)  (9, 9, 4, 2, 0, 9)  (0, 9, 9, 4, 2, 0)  \
43                   4.0                 5.0                 5.0   
1130                 5.0             

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2093424.36it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe24050:
(5, 2, 9, 0, 0, 7)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 400869.76it/s]



77 Similar patterns detected:
                     ngram  DL distance
14      (5, 2, 9, 0, 0, 7)          0.0
0          (5, 2, 0, 0, 7)          1.0
55     (5, 2, 9, 0, 0, 11)          1.0
54   (5, 2, 9, 0, 0, 7, 4)          1.0
53  (5, 2, 11, 9, 0, 0, 7)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
BraesOfTulliemetThe23904         1
Franks30966                      3
LadyOfTheLake32782               2
RoseOfDrishaneThe2844            1
Portobello39482                  1
                                ..
DickHarmons12731                 1
PaddyCarter27207                 1
SmithsAGallantFiremanThe17303    7
GrahamAndJillysWedding6129       2
WoodcroftLane39745               1
Name: pattern presence, Length: 931, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

 

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2165341.32it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe24050:
(5, 2, 9, 0, 0, 7)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 417093.41it/s]



77 Similar patterns detected:
                     ngram  DL distance
14      (5, 2, 9, 0, 0, 7)          0.0
0          (5, 2, 0, 0, 7)          1.0
55     (5, 2, 9, 0, 0, 11)          1.0
54   (5, 2, 9, 0, 0, 7, 4)          1.0
53  (5, 2, 11, 9, 0, 0, 7)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
BraesOfTulliemetThe23904         1
Franks30966                      3
LadyOfTheLake32782               2
RoseOfDrishaneThe2844            1
Portobello39482                  1
                                ..
DickHarmons12731                 1
PaddyCarter27207                 1
SmithsAGallantFiremanThe17303    7
GrahamAndJillysWedding6129       2
WoodcroftLane39745               1
Name: pattern presence, Length: 931, dtype: int64
Similarity results for BlackbirdThe24050 (pattern presence):
                           title  pattern presence
0  SmithsAGallantFiremanThe17303                 7
1               CatOnALeash28126                 7
2

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2160203.21it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 476689.10it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 449959.12it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 428824.41it/s]



255 Similar patterns detected:
                     ngram  DL distance  (2, 9, 0, 0, 7, 0)  \
23      (9, 0, 0, 7, 0, 9)          0.0                 2.0   
138  (9, 0, 0, 7, 9, 0, 9)          1.0                 3.0   
69      (9, 0, 0, 7, 9, 9)          1.0                 3.0   
68      (9, 0, 0, 4, 0, 9)          1.0                 3.0   
67      (9, 0, 0, 0, 7, 9)          1.0                 3.0   

     (5, 2, 9, 0, 0, 7)  
23                  4.0  
138                 5.0  
69                  4.0  
68                  5.0  
67                  4.0  

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
BraesOfTulliemetThe23904      1
ErikaDamianis5812             2
AnneFraserMacKenzie21588      2
PalmSunday30320               3
Franks30966                   4
                             ..
GrahamAndJillysWedding6129    5
WoodcroftLane39745            4
CherishTheLadies25984         1
RectorAtTheFeis17764          1
ValseDesPoeles11589           2
Na

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2127457.97it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 458883.05it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 437097.85it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:02<00:00, 326073.52it/s]



255 Similar patterns detected:
                     ngram  DL distance  (2, 9, 0, 0, 7, 0)  \
23      (9, 0, 0, 7, 0, 9)          0.0                 2.0   
138  (9, 0, 0, 7, 9, 0, 9)          1.0                 3.0   
69      (9, 0, 0, 7, 9, 9)          1.0                 3.0   
68      (9, 0, 0, 4, 0, 9)          1.0                 3.0   
67      (9, 0, 0, 0, 7, 9)          1.0                 3.0   

     (5, 2, 9, 0, 0, 7)  
23                  4.0  
138                 5.0  
69                  4.0  
68                  5.0  
67                  4.0  

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
BraesOfTulliemetThe23904      1
ErikaDamianis5812             2
AnneFraserMacKenzie21588      2
PalmSunday30320               3
Franks30966                   4
                             ..
GrahamAndJillysWedding6129    5
WoodcroftLane39745            4
CherishTheLadies25984         1
RectorAtTheFeis17764          1
ValseDesPoeles11589           2
Na

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2175297.82it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe26494:
(0, 0, 2, 0, 2, 5)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 430023.32it/s]



93 Similar patterns detected:
                    ngram  DL distance
14     (0, 0, 2, 0, 2, 5)          0.0
0         (0, 0, 2, 0, 2)          1.0
67  (0, 0, 3, 2, 0, 2, 5)          1.0
66  (0, 0, 0, 2, 0, 2, 5)          1.0
65  (0, 0, 2, 0, 0, 2, 5)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
BraesOfTulliemetThe23904      1
TailgatingTheMinister27264    2
FarewellToGurteen1733         1
WrenThe16036                  5
QueenEsthers30451             2
                             ..
DowdsFavourite229             1
CeolSaBhaile39052             1
MunsterLassThe1132            2
FrostIsAllOverThe5199         1
RustyGulleyThe30917           2
Name: pattern presence, Length: 965, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  Camowe

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2098249.36it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe26494:
(0, 0, 2, 0, 2, 5)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 470633.84it/s]



93 Similar patterns detected:
                    ngram  DL distance
14     (0, 0, 2, 0, 2, 5)          0.0
0         (0, 0, 2, 0, 2)          1.0
67  (0, 0, 3, 2, 0, 2, 5)          1.0
66  (0, 0, 0, 2, 0, 2, 5)          1.0
65  (0, 0, 2, 0, 0, 2, 5)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
BraesOfTulliemetThe23904      1
TailgatingTheMinister27264    2
FarewellToGurteen1733         1
WrenThe16036                  5
QueenEsthers30451             2
                             ..
DowdsFavourite229             1
CeolSaBhaile39052             1
MunsterLassThe1132            2
FrostIsAllOverThe5199         1
RustyGulleyThe30917           2
Name: pattern presence, Length: 965, dtype: int64
Similarity results for BlackbirdThe26494 (pattern presence):
                     title  pattern presence
0             WrenThe16037                 9
1  KeepingUpWithCalum27965                 7
2                EnDro5289                 6
3            

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2107491.59it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 488292.78it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 474223.17it/s]



189 Similar patterns detected:
                    ngram  DL distance  (0, 2, 0, 2, 5, 0)
30     (0, 0, 2, 0, 2, 5)          0.0                 2.0
53     (0, 0, 2, 5, 2, 5)          1.0                 3.0
74     (0, 0, 2, 7, 2, 5)          1.0                 3.0
73  (0, 0, 2, 0, 7, 2, 5)          1.0                 3.0
72     (0, 0, 9, 0, 2, 5)          1.0                 3.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
BraesOfTulliemetThe23904                       1
TailgatingTheMinister27264                     2
ItWasAMagicMistThatPutMeAstrayOneNight31391    1
DevilInTheWoodpileThe7351                      2
BiddyMcGhee28793                               1
                                              ..
EarlsChairThe12904                             1
CeolSaBhaile39052                              1
MunsterLassThe1132                             3
FrostIsAllOverThe5199                          2
RustyGulleyThe30917                          

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2103490.66it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 489151.90it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 484003.70it/s]



189 Similar patterns detected:
                    ngram  DL distance  (0, 2, 0, 2, 5, 0)
30     (0, 0, 2, 0, 2, 5)          0.0                 2.0
53     (0, 0, 2, 5, 2, 5)          1.0                 3.0
74     (0, 0, 2, 7, 2, 5)          1.0                 3.0
73  (0, 0, 2, 0, 7, 2, 5)          1.0                 3.0
72     (0, 0, 9, 0, 2, 5)          1.0                 3.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
BraesOfTulliemetThe23904                       1
TailgatingTheMinister27264                     2
ItWasAMagicMistThatPutMeAstrayOneNight31391    1
DevilInTheWoodpileThe7351                      2
BiddyMcGhee28793                               1
                                              ..
EarlsChairThe12904                             1
CeolSaBhaile39052                              1
MunsterLassThe1132                             3
FrostIsAllOverThe5199                          2
RustyGulleyThe30917                          

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2072327.83it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe27198:
(2, 10, 0, 5, 2, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:02<00:00, 353755.23it/s]



43 Similar patterns detected:
                     ngram  DL distance
22     (2, 10, 0, 5, 2, 0)          0.0
0          (2, 0, 5, 2, 0)          1.0
23  (2, 10, 0, 5, 2, 0, 0)          1.0
24     (2, 10, 7, 5, 2, 0)          1.0
25  (2, 10, 0, 5, 2, 0, 7)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
MikeCooneysFancy3481     2
ReelAroundTheSun11046    1
MartinWynnes40960        1
NewBobThe27291           1
BlackbirdThe39782        1
                        ..
LaMalAimable35779        1
AnGriann2554             1
SleeplessInSyros29504    1
DancingInAllihies8863    2
HoMoChaileagan32246      2
Name: pattern presence, Length: 292, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe20663  \
length             

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2175438.31it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe27198:
(2, 10, 0, 5, 2, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 457525.54it/s]



43 Similar patterns detected:
                     ngram  DL distance
22     (2, 10, 0, 5, 2, 0)          0.0
0          (2, 0, 5, 2, 0)          1.0
23  (2, 10, 0, 5, 2, 0, 0)          1.0
24     (2, 10, 7, 5, 2, 0)          1.0
25  (2, 10, 0, 5, 2, 0, 7)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
MikeCooneysFancy3481     2
ReelAroundTheSun11046    1
MartinWynnes40960        1
NewBobThe27291           1
BlackbirdThe39782        1
                        ..
LaMalAimable35779        1
AnGriann2554             1
SleeplessInSyros29504    1
DancingInAllihies8863    2
HoMoChaileagan32246      2
Name: pattern presence, Length: 292, dtype: int64
Similarity results for BlackbirdThe27198 (pattern presence):
                 title  pattern presence
0   WeSawYouComing5187                 6
1    TommyPeoples14349                 6
2    BlackbirdThe27198                 5
3      IntoTheWay29865                 4
4  KolevsKopanitsa3159               

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2084072.70it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 378497.92it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 439354.45it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 457264.53it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 446314.59it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 453780.10it/s]



266 Similar patterns detected:
                     ngram  DL distance  (0, 5, 2, 10, 0, 5)  \
59      (0, 4, 0, 5, 4, 0)          0.0                  5.0   
117  (7, 0, 4, 0, 5, 4, 0)          1.0                  6.0   
115  (0, 4, 0, 5, 4, 0, 7)          1.0                  5.0   
113  (0, 5, 4, 0, 5, 4, 0)          1.0                  4.0   
108    (0, 4, 0, 5, 4, 11)          1.0                  5.0   

     (10, 0, 5, 2, 0, 0)  (5, 2, 10, 0, 5, 2)  (2, 10, 0, 5, 2, 0)  
59                   4.0                  5.0                  3.0  
117                  5.0                  5.0                  4.0  
115                  4.0                  6.0                  4.0  
113                  4.0                  5.0                  4.0  
108                  5.0                  5.0                  4.0  

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
JudiqueHall12085            1
EarlOfMansfieldsThe21885    2
TomBriggs35343              1


Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1918288.79it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 471661.41it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 455528.43it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 458197.35it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 449538.49it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 454063.21it/s]



266 Similar patterns detected:
                     ngram  DL distance  (0, 5, 2, 10, 0, 5)  \
59      (0, 4, 0, 5, 4, 0)          0.0                  5.0   
117  (7, 0, 4, 0, 5, 4, 0)          1.0                  6.0   
115  (0, 4, 0, 5, 4, 0, 7)          1.0                  5.0   
113  (0, 5, 4, 0, 5, 4, 0)          1.0                  4.0   
108    (0, 4, 0, 5, 4, 11)          1.0                  5.0   

     (10, 0, 5, 2, 0, 0)  (5, 2, 10, 0, 5, 2)  (2, 10, 0, 5, 2, 0)  
59                   4.0                  5.0                  3.0  
117                  5.0                  5.0                  4.0  
115                  4.0                  6.0                  4.0  
113                  4.0                  5.0                  4.0  
108                  5.0                  5.0                  4.0  

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
JudiqueHall12085            1
EarlOfMansfieldsThe21885    2
TomBriggs35343              1


Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2073833.38it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe28174:
(0, 4, 0, 5, 4, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 439210.68it/s]



93 Similar patterns detected:
                     ngram  DL distance
31      (0, 4, 0, 5, 4, 0)          0.0
0          (0, 4, 0, 4, 0)          1.0
66   (0, 4, 0, 5, 4, 0, 4)          1.0
65   (0, 4, 0, 5, 4, 0, 0)          1.0
64  (0, 4, 0, 5, 4, 11, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
JudiqueHall12085            1
EarlOfMansfieldsThe21885    2
TomBriggs35343              1
MyTwoFeet40561              2
LuckyInLove39389            1
                           ..
McDonaghs25486              3
PlanxtyJoeBurke28157        1
Erins39725                  1
CeolSaBhaile39052           1
MineAinHoose36350           1
Name: pattern presence, Length: 1601, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  Quim

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1796919.56it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe28174:
(0, 4, 0, 5, 4, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 454297.76it/s]



93 Similar patterns detected:
                     ngram  DL distance
31      (0, 4, 0, 5, 4, 0)          0.0
0          (0, 4, 0, 4, 0)          1.0
66   (0, 4, 0, 5, 4, 0, 4)          1.0
65   (0, 4, 0, 5, 4, 0, 0)          1.0
64  (0, 4, 0, 5, 4, 11, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
JudiqueHall12085            1
EarlOfMansfieldsThe21885    2
TomBriggs35343              1
MyTwoFeet40561              2
LuckyInLove39389            1
                           ..
McDonaghs25486              3
PlanxtyJoeBurke28157        1
Erins39725                  1
CeolSaBhaile39052           1
MineAinHoose36350           1
Name: pattern presence, Length: 1601, dtype: int64
Similarity results for BlackbirdThe28174 (pattern presence):
                      title  pattern presence
0           ScholarThe24085                 9
1       ClumsyLoverThe29450                 8
2         BlackbirdThe28174                 7
3  HandMeDownTheTackle36

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1904277.19it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 451917.38it/s]



93 Similar patterns detected:
                     ngram  DL distance
31      (0, 4, 0, 5, 4, 0)          0.0
0          (0, 4, 0, 4, 0)          1.0
66   (0, 4, 0, 5, 4, 0, 4)          1.0
65   (0, 4, 0, 5, 4, 0, 0)          1.0
64  (0, 4, 0, 5, 4, 11, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
JudiqueHall12085            1
EarlOfMansfieldsThe21885    2
TomBriggs35343              1
MyTwoFeet40561              2
LuckyInLove39389            1
                           ..
McDonaghs25486              3
PlanxtyJoeBurke28157        1
Erins39725                  1
CeolSaBhaile39052           1
MineAinHoose36350           1
Name: pattern presence, Length: 1601, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  Quim

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2000903.91it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 460863.72it/s]



93 Similar patterns detected:
                     ngram  DL distance
31      (0, 4, 0, 5, 4, 0)          0.0
0          (0, 4, 0, 4, 0)          1.0
66   (0, 4, 0, 5, 4, 0, 4)          1.0
65   (0, 4, 0, 5, 4, 0, 0)          1.0
64  (0, 4, 0, 5, 4, 11, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
JudiqueHall12085            1
EarlOfMansfieldsThe21885    2
TomBriggs35343              1
MyTwoFeet40561              2
LuckyInLove39389            1
                           ..
McDonaghs25486              3
PlanxtyJoeBurke28157        1
Erins39725                  1
CeolSaBhaile39052           1
MineAinHoose36350           1
Name: pattern presence, Length: 1601, dtype: int64
Similarity results for BlackbirdThe28174 (pattern presence):
                      title  pattern presence
0           ScholarThe24085                 9
1       ClumsyLoverThe29450                 8
2         BlackbirdThe28174                 7
3  HandMeDownTheTackle36

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1824206.95it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe28821:
(2, 0, 11, 7, 2, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:02<00:00, 363523.58it/s]



88 Similar patterns detected:
                     ngram  DL distance
14     (2, 0, 11, 7, 2, 0)          0.0
0          (2, 0, 7, 2, 0)          1.0
63    (2, 11, 11, 7, 2, 0)          1.0
62  (2, 0, 11, 7, 7, 2, 0)          1.0
61  (2, 0, 11, 7, 2, 0, 6)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
WellAllLieTogether19130    1
JoeyBeatons12157           1
RollingWavesThe30078       1
DrowsyMaggie35491          1
MysteryThe18576            1
                          ..
Vinden29915                2
MunsterLassThe1132         1
FrancisOConnors29682       1
WellAllLieTogether19129    1
SilverTipThe42437          2
Name: pattern presence, Length: 1229, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe20663

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2100002.28it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe28821:
(2, 0, 11, 7, 2, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 448486.51it/s]



88 Similar patterns detected:
                     ngram  DL distance
14     (2, 0, 11, 7, 2, 0)          0.0
0          (2, 0, 7, 2, 0)          1.0
63    (2, 11, 11, 7, 2, 0)          1.0
62  (2, 0, 11, 7, 7, 2, 0)          1.0
61  (2, 0, 11, 7, 2, 0, 6)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
WellAllLieTogether19130    1
JoeyBeatons12157           1
RollingWavesThe30078       1
DrowsyMaggie35491          1
MysteryThe18576            1
                          ..
Vinden29915                2
MunsterLassThe1132         1
FrancisOConnors29682       1
WellAllLieTogether19129    1
SilverTipThe42437          2
Name: pattern presence, Length: 1229, dtype: int64
Similarity results for BlackbirdThe28821 (pattern presence):
                         title  pattern presence
0  FatherDollardsFavourite2333                 9
1  MichaelGallaghersFancy11282                 8
2          MuineiraDeCasu31754                 7
3          WhenTheCatIs

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2510405.48it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 388353.78it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 396665.32it/s]



164 Similar patterns detected:
                  ngram  DL distance  (0, 11, 7, 2, 0, 11)
23  (2, 0, 11, 7, 2, 0)          0.0                   2.0
0       (2, 0, 7, 2, 0)          1.0                   3.0
97  (2, 0, 10, 7, 2, 0)          1.0                   3.0
96  (2, 2, 11, 7, 2, 0)          1.0                   3.0
95  (2, 0, 11, 7, 2, 9)          1.0                   3.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
WellAllLieTogether19130     1
MorganAndersensForet5881    2
JoeyBeatons12157            1
Quinns27487                 1
RollingWavesThe30078        1
                           ..
Vinden29915                 2
MunsterLassThe1132          1
FrancisOConnors29682        1
WellAllLieTogether19129     1
SilverTipThe42437           2
Name: pattern presence, Length: 1619, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length             

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2136770.10it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 444312.48it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 437994.36it/s]



164 Similar patterns detected:
                  ngram  DL distance  (0, 11, 7, 2, 0, 11)
23  (2, 0, 11, 7, 2, 0)          0.0                   2.0
0       (2, 0, 7, 2, 0)          1.0                   3.0
97  (2, 0, 10, 7, 2, 0)          1.0                   3.0
96  (2, 2, 11, 7, 2, 0)          1.0                   3.0
95  (2, 0, 11, 7, 2, 9)          1.0                   3.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
WellAllLieTogether19130     1
MorganAndersensForet5881    2
JoeyBeatons12157            1
Quinns27487                 1
RollingWavesThe30078        1
                           ..
Vinden29915                 2
MunsterLassThe1132          1
FrancisOConnors29682        1
WellAllLieTogether19129     1
SilverTipThe42437           2
Name: pattern presence, Length: 1619, dtype: int64
Similarity results for BlackbirdThe28821 (pattern presence):
                         title  pattern presence
0  FatherDollardsFavourite2333              

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1811414.59it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe31201:
(5, 5, 4, 5, 4, 5)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 482855.12it/s]



72 Similar patterns detected:
                    ngram  DL distance
9      (5, 5, 4, 5, 4, 5)          0.0
0         (5, 4, 5, 4, 5)          1.0
51  (9, 5, 5, 4, 5, 4, 5)          1.0
50     (5, 5, 4, 5, 2, 5)          1.0
49  (5, 5, 4, 5, 4, 2, 5)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
JudiqueHall12085            3
Fishers14045                2
Lochanside24182             4
Stumpie42230                2
ChristmasThe24592           1
                           ..
TwentyOneHighland20345      2
KickTheWorldBeforeMe6436    4
Fishers14048                2
JimmyDoyles19753            2
RectorAtTheFeis17764        1
Name: pattern presence, Length: 473, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe2

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2099086.21it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe31201:
(5, 5, 4, 5, 4, 5)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 461451.68it/s]



72 Similar patterns detected:
                    ngram  DL distance
9      (5, 5, 4, 5, 4, 5)          0.0
0         (5, 4, 5, 4, 5)          1.0
51  (9, 5, 5, 4, 5, 4, 5)          1.0
50     (5, 5, 4, 5, 2, 5)          1.0
49  (5, 5, 4, 5, 4, 2, 5)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
JudiqueHall12085            3
Fishers14045                2
Lochanside24182             4
Stumpie42230                2
ChristmasThe24592           1
                           ..
TwentyOneHighland20345      2
KickTheWorldBeforeMe6436    4
Fishers14048                2
JimmyDoyles19753            2
RectorAtTheFeis17764        1
Name: pattern presence, Length: 473, dtype: int64
Similarity results for BlackbirdThe31201 (pattern presence):
                 title  pattern presence
0  BobMacPhersons36595                 9
1  BobMacPhersons36557                 9
2     PeterStreet10147                 7
3     PeterStreet20231                 7
4       AB

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2547042.37it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 435361.14it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 437706.84it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 395168.33it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 461148.21it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 428911.17it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 407042.90it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 450125.00it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 450031.01it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 459186.19it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 487000.97it/s]
Calculating pattern similarity...: 100%|██████████


2001 Similar patterns detected:
                      ngram  DL distance  (0, 0, 7, 5, 4, 0)  \
86       (7, 5, 4, 0, 7, 5)          0.0                 4.0   
1582  (7, 5, 4, 0, 7, 4, 5)          1.0                 5.0   
880      (7, 5, 4, 0, 2, 5)          1.0                 4.0   
879   (7, 5, 4, 0, 0, 7, 5)          1.0                 5.0   
419      (7, 4, 4, 0, 7, 5)          1.0                 5.0   

      (4, 7, 5, 4, 2, 7)  (5, 0, 0, 7, 5, 4)  (7, 5, 4, 2, 7, 4)  \
86                   3.0                 3.0                 2.0   
1582                 4.0                 3.0                 2.0   
880                  3.0                 4.0                 3.0   
879                  4.0                 3.0                 3.0   
419                  4.0                 4.0                 3.0   

      (7, 4, 0, 4, 7, 5)  (7, 5, 0, 4, 7, 5)  (5, 4, 0, 7, 5, 0)  \
86                   2.0                 1.0                 2.0   
1582                 2.0             

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2034649.14it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 440291.29it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 432544.76it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 448750.35it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 410622.27it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 424353.09it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 426448.52it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 411080.54it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 389694.38it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 438902.30it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 487729.38it/s]
Calculating pattern similarity...: 100%|██████████


2001 Similar patterns detected:
                      ngram  DL distance  (0, 0, 7, 5, 4, 0)  \
86       (7, 5, 4, 0, 7, 5)          0.0                 4.0   
1582  (7, 5, 4, 0, 7, 4, 5)          1.0                 5.0   
880      (7, 5, 4, 0, 2, 5)          1.0                 4.0   
879   (7, 5, 4, 0, 0, 7, 5)          1.0                 5.0   
419      (7, 4, 4, 0, 7, 5)          1.0                 5.0   

      (4, 7, 5, 4, 2, 7)  (5, 0, 0, 7, 5, 4)  (7, 5, 4, 2, 7, 4)  \
86                   3.0                 3.0                 2.0   
1582                 4.0                 3.0                 2.0   
880                  3.0                 4.0                 3.0   
879                  4.0                 3.0                 3.0   
419                  4.0                 4.0                 3.0   

      (7, 4, 0, 4, 7, 5)  (7, 5, 0, 4, 7, 5)  (5, 4, 0, 7, 5, 0)  \
86                   2.0                 1.0                 2.0   
1582                 2.0             

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2181581.38it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe32399:
(4, 2, 7, 4, 7, 4)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 434932.37it/s]



92 Similar patterns detected:
                    ngram  DL distance
8      (4, 2, 7, 4, 7, 4)          0.0
0         (4, 7, 4, 7, 4)          1.0
66  (4, 2, 7, 2, 4, 7, 4)          1.0
65  (4, 2, 7, 4, 7, 2, 4)          1.0
64  (4, 2, 7, 4, 7, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
LarkinsBeehives28212            1
BalcomieHouse32723              2
BlackRogueThe37609              1
PaddyOBriensReturnToErin2925    1
CatInTheCornerThe21264          2
                               ..
FareWell20241                   1
GanAinm5551                     1
LilyBobs41351                   2
PatDonald9454                   1
KevinMcHughs24967               1
Name: pattern presence, Length: 1525, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTu

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2198009.51it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe32399:
(4, 2, 7, 4, 7, 4)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 470390.81it/s]



92 Similar patterns detected:
                    ngram  DL distance
8      (4, 2, 7, 4, 7, 4)          0.0
0         (4, 7, 4, 7, 4)          1.0
66  (4, 2, 7, 2, 4, 7, 4)          1.0
65  (4, 2, 7, 4, 7, 2, 4)          1.0
64  (4, 2, 7, 4, 7, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
LarkinsBeehives28212            1
BalcomieHouse32723              2
BlackRogueThe37609              1
PaddyOBriensReturnToErin2925    1
CatInTheCornerThe21264          2
                               ..
FareWell20241                   1
GanAinm5551                     1
LilyBobs41351                   2
PatDonald9454                   1
KevinMcHughs24967               1
Name: pattern presence, Length: 1525, dtype: int64
Similarity results for BlackbirdThe32399 (pattern presence):
                         title  pattern presence
0            JamesMurrays37504                10
1                    MAndM9818                 9
2             JamesMurr

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2188100.34it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:02<00:00, 343184.25it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 473822.82it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 459758.60it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 462309.51it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 458526.29it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 451452.58it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 489820.48it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 497925.60it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 444922.79it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 481457.39it/s]
Calculating pattern similarity...: 100%|██████████


2038 Similar patterns detected:
                  ngram  DL distance  (2, 7, 4, 7, 4, 7)  (0, 0, 7, 5, 4, 0)  \
90   (7, 5, 4, 0, 7, 5)          0.0                 5.0                 4.0   
791  (7, 4, 5, 0, 7, 5)          1.0                 4.0                 5.0   
552  (7, 5, 4, 0, 9, 5)          1.0                 5.0                 4.0   
553  (7, 5, 4, 0, 4, 5)          1.0                 4.0                 4.0   
588  (7, 9, 4, 0, 7, 5)          1.0                 5.0                 5.0   

     (4, 7, 5, 4, 2, 7)  (5, 0, 0, 7, 5, 4)  (7, 5, 4, 2, 7, 4)  \
90                  3.0                 3.0                 2.0   
791                 4.0                 4.0                 3.0   
552                 4.0                 4.0                 3.0   
553                 4.0                 4.0                 3.0   
588                 4.0                 4.0                 3.0   

     (4, 2, 7, 4, 7, 4)  (7, 4, 7, 4, 7, 5)  (7, 5, 0, 4, 7, 5)  ...  \
90         

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2119186.17it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 441259.24it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 473053.78it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 458373.28it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 459477.58it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 446641.05it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 445583.41it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 483366.06it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 481946.17it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 445144.67it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 497008.96it/s]
Calculating pattern similarity...: 100%|██████████


2038 Similar patterns detected:
                  ngram  DL distance  (2, 7, 4, 7, 4, 7)  (0, 0, 7, 5, 4, 0)  \
90   (7, 5, 4, 0, 7, 5)          0.0                 5.0                 4.0   
791  (7, 4, 5, 0, 7, 5)          1.0                 4.0                 5.0   
552  (7, 5, 4, 0, 9, 5)          1.0                 5.0                 4.0   
553  (7, 5, 4, 0, 4, 5)          1.0                 4.0                 4.0   
588  (7, 9, 4, 0, 7, 5)          1.0                 5.0                 5.0   

     (4, 7, 5, 4, 2, 7)  (5, 0, 0, 7, 5, 4)  (7, 5, 4, 2, 7, 4)  \
90                  3.0                 3.0                 2.0   
791                 4.0                 4.0                 3.0   
552                 4.0                 4.0                 3.0   
553                 4.0                 4.0                 3.0   
588                 4.0                 4.0                 3.0   

     (4, 2, 7, 4, 7, 4)  (7, 4, 7, 4, 7, 5)  (7, 5, 0, 4, 7, 5)  ...  \
90         

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1989487.59it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe34225:
(7, 11, 11, 2, 11, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 429505.97it/s]



50 Similar patterns detected:
                    ngram  DL distance
8   (7, 11, 11, 2, 11, 0)          0.0
0       (7, 11, 2, 11, 0)          1.0
27   (7, 11, 0, 2, 11, 0)          1.0
28  (7, 11, 11, 0, 11, 0)          1.0
29   (7, 11, 11, 2, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
DublinLadsThe4994           1
Vallafield8987              1
Bagpipe19817                1
YoungScotty8357             1
BunkerHill29203             1
                           ..
ShelburneThe23777           1
RockingTheCradle11617       1
HakketoneSchottische2676    1
GanAinm38701                3
CalCallaghans36448          1
Name: pattern presence, Length: 155, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe2

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2185488.09it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe34225:
(7, 11, 11, 2, 11, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 459534.27it/s]



50 Similar patterns detected:
                    ngram  DL distance
8   (7, 11, 11, 2, 11, 0)          0.0
0       (7, 11, 2, 11, 0)          1.0
27   (7, 11, 0, 2, 11, 0)          1.0
28  (7, 11, 11, 0, 11, 0)          1.0
29   (7, 11, 11, 2, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
DublinLadsThe4994           1
Vallafield8987              1
Bagpipe19817                1
YoungScotty8357             1
BunkerHill29203             1
                           ..
ShelburneThe23777           1
RockingTheCradle11617       1
HakketoneSchottische2676    1
GanAinm38701                3
CalCallaghans36448          1
Name: pattern presence, Length: 155, dtype: int64
Similarity results for BlackbirdThe34225 (pattern presence):
               title  pattern presence
0  BlackbirdThe14357                 8
1  BlackbirdThe34225                 8
2  BlackbirdThe14355                 7
3  BlackbirdThe14356                 7
4      DerryThe19062

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2084717.63it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 450270.73it/s]



50 Similar patterns detected:
                    ngram  DL distance
8   (7, 11, 11, 2, 11, 0)          0.0
0       (7, 11, 2, 11, 0)          1.0
27   (7, 11, 0, 2, 11, 0)          1.0
28  (7, 11, 11, 0, 11, 0)          1.0
29   (7, 11, 11, 2, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
DublinLadsThe4994           1
Vallafield8987              1
Bagpipe19817                1
YoungScotty8357             1
BunkerHill29203             1
                           ..
ShelburneThe23777           1
RockingTheCradle11617       1
HakketoneSchottische2676    1
GanAinm38701                3
CalCallaghans36448          1
Name: pattern presence, Length: 155, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe2

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2135415.47it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 450991.22it/s]



50 Similar patterns detected:
                    ngram  DL distance
8   (7, 11, 11, 2, 11, 0)          0.0
0       (7, 11, 2, 11, 0)          1.0
27   (7, 11, 0, 2, 11, 0)          1.0
28  (7, 11, 11, 0, 11, 0)          1.0
29   (7, 11, 11, 2, 4, 0)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
DublinLadsThe4994           1
Vallafield8987              1
Bagpipe19817                1
YoungScotty8357             1
BunkerHill29203             1
                           ..
ShelburneThe23777           1
RockingTheCradle11617       1
HakketoneSchottische2676    1
GanAinm38701                3
CalCallaghans36448          1
Name: pattern presence, Length: 155, dtype: int64
Similarity results for BlackbirdThe34225 (pattern presence):
               title  pattern presence
0  BlackbirdThe14357                 8
1  BlackbirdThe34225                 8
2  BlackbirdThe14355                 7
3  BlackbirdThe14356                 7
4      DerryThe19062

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2062178.07it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe36690:
(2, 7, 0, 2, 11, 7)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 403108.05it/s]



80 Similar patterns detected:
                     ngram  DL distance
23     (2, 7, 0, 2, 11, 7)          0.0
0          (2, 7, 0, 2, 7)          1.0
56  (2, 7, 0, 2, 11, 7, 5)          1.0
55  (2, 7, 0, 2, 11, 9, 7)          1.0
54  (2, 7, 0, 4, 2, 11, 7)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
AnneFraserMacKenzie21588               1
StropTheRazor39234                     1
Nellies16733                           1
CaseyFinnegans6048                     1
NathanielGowsQuickstep9143             1
                                      ..
YLancers21156                          1
HerbReids15793                         1
NielGowsLamentForHisSecondWife35334    1
DoylesFancy24990                       1
RoseCottage27259                       5
Name: pattern presence, Length: 876, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length        

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2154538.02it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe36690:
(2, 7, 0, 2, 11, 7)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 431089.19it/s]



80 Similar patterns detected:
                     ngram  DL distance
23     (2, 7, 0, 2, 11, 7)          0.0
0          (2, 7, 0, 2, 7)          1.0
56  (2, 7, 0, 2, 11, 7, 5)          1.0
55  (2, 7, 0, 2, 11, 9, 7)          1.0
54  (2, 7, 0, 4, 2, 11, 7)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
AnneFraserMacKenzie21588               1
StropTheRazor39234                     1
Nellies16733                           1
CaseyFinnegans6048                     1
NathanielGowsQuickstep9143             1
                                      ..
YLancers21156                          1
HerbReids15793                         1
NielGowsLamentForHisSecondWife35334    1
DoylesFancy24990                       1
RoseCottage27259                       5
Name: pattern presence, Length: 876, dtype: int64
Similarity results for BlackbirdThe36690 (pattern presence):
                    title  pattern presence
0        StrangerThe17142                 8


Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2166762.08it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 443937.19it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 402915.70it/s]



147 Similar patterns detected:
                     ngram  DL distance  (4, 2, 7, 0, 2, 11)
35     (2, 7, 0, 2, 11, 7)          0.0                  2.0
0          (2, 7, 0, 2, 7)          1.0                  2.0
97  (2, 7, 0, 4, 2, 11, 7)          1.0                  3.0
96     (2, 7, 0, 3, 11, 7)          1.0                  3.0
95     (7, 2, 0, 2, 11, 7)          1.0                  3.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
AnneFraserMacKenzie21588               2
StropTheRazor39234                     2
Nellies16733                           2
Oblique23252                           2
CaseyFinnegans6048                     1
                                      ..
NielGowsLamentForHisSecondWife35334    3
DoylesFancy24990                       2
RoseCottage27259                       6
EarlOfSpaceThe36462                    2
WeaponsOfNonExistenceThe2841           1
Name: pattern presence, Length: 1098, dtype: int64
Normalising presence 

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2181666.16it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 447402.10it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 425716.12it/s]



147 Similar patterns detected:
                     ngram  DL distance  (4, 2, 7, 0, 2, 11)
35     (2, 7, 0, 2, 11, 7)          0.0                  2.0
0          (2, 7, 0, 2, 7)          1.0                  2.0
97  (2, 7, 0, 4, 2, 11, 7)          1.0                  3.0
96     (2, 7, 0, 3, 11, 7)          1.0                  3.0
95     (7, 2, 0, 2, 11, 7)          1.0                  3.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
AnneFraserMacKenzie21588               2
StropTheRazor39234                     2
Nellies16733                           2
Oblique23252                           2
CaseyFinnegans6048                     1
                                      ..
NielGowsLamentForHisSecondWife35334    3
DoylesFancy24990                       2
RoseCottage27259                       6
EarlOfSpaceThe36462                    2
WeaponsOfNonExistenceThe2841           1
Name: pattern presence, Length: 1098, dtype: int64
Similarity results fo

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2262589.11it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe39782:
(10, 0, 5, 4, 0, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 413905.38it/s]



33 Similar patterns detected:
                     ngram  DL distance
31     (10, 0, 5, 4, 0, 0)          0.0
0          (0, 5, 4, 0, 0)          1.0
30  (10, 0, 5, 4, 0, 0, 5)          1.0
29  (10, 0, 5, 4, 0, 0, 7)          1.0
28     (10, 0, 5, 4, 0, 7)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
TomBriggs35343            2
BeggarmanThe11475         3
MikeCooneysFancy3481      1
FrancAPhoill31            2
Drobe3774                 2
                         ..
PresidentLincolns18199    2
CherryBlossomThe39709     2
BoysOfKilsarneThe41150    2
DukeOfPerthThe5444        2
MenFromMallowThe40512     1
Name: pattern presence, Length: 286, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe20663  \
length  

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2020540.15it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe39782:
(10, 0, 5, 4, 0, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 452397.36it/s]



33 Similar patterns detected:
                     ngram  DL distance
31     (10, 0, 5, 4, 0, 0)          0.0
0          (0, 5, 4, 0, 0)          1.0
30  (10, 0, 5, 4, 0, 0, 5)          1.0
29  (10, 0, 5, 4, 0, 0, 7)          1.0
28     (10, 0, 5, 4, 0, 7)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
TomBriggs35343            2
BeggarmanThe11475         3
MikeCooneysFancy3481      1
FrancAPhoill31            2
Drobe3774                 2
                         ..
PresidentLincolns18199    2
CherryBlossomThe39709     2
BoysOfKilsarneThe41150    2
DukeOfPerthThe5444        2
MenFromMallowThe40512     1
Name: pattern presence, Length: 286, dtype: int64
Similarity results for BlackbirdThe39782 (pattern presence):
                   title  pattern presence
0      BlackbirdThe39782                 7
1  AustralianWaters27209                 4
2   TripToCapeSpear35059                 3
3   AustralianWaters2607                 3
4  AustralianWat

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2183334.84it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 450788.17it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 454244.67it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 427400.96it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 427231.56it/s]



123 Similar patterns detected:
                      ngram  DL distance  (10, 0, 5, 4, 0, 0)  \
38      (0, 5, 2, 10, 0, 5)          0.0                  4.0   
122  (7, 0, 5, 2, 10, 0, 5)          1.0                  4.0   
95      (0, 5, 2, 10, 8, 5)          1.0                  5.0   
60      (0, 5, 8, 10, 0, 5)          1.0                  4.0   
30      (0, 5, 0, 10, 0, 5)          1.0                  4.0   

     (5, 2, 10, 0, 5, 4)  (2, 10, 0, 5, 4, 0)  
38                   2.0                  4.0  
122                  3.0                  5.0  
95                   3.0                  5.0  
60                   3.0                  5.0  
30                   3.0                  5.0  

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
TomBriggs35343              3
BeggarmanThe11475           4
KashmirCloakThe2874         1
CloudedSkyThe11305          1
MikeCooneysFancy3481        1
                           ..
BulgarianThe24599           1


Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 1901954.63it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 452295.83it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 464602.74it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 432750.01it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 430218.74it/s]



123 Similar patterns detected:
                      ngram  DL distance  (10, 0, 5, 4, 0, 0)  \
38      (0, 5, 2, 10, 0, 5)          0.0                  4.0   
122  (7, 0, 5, 2, 10, 0, 5)          1.0                  4.0   
95      (0, 5, 2, 10, 8, 5)          1.0                  5.0   
60      (0, 5, 8, 10, 0, 5)          1.0                  4.0   
30      (0, 5, 0, 10, 0, 5)          1.0                  4.0   

     (5, 2, 10, 0, 5, 4)  (2, 10, 0, 5, 4, 0)  
38                   2.0                  4.0  
122                  3.0                  5.0  
95                   3.0                  5.0  
60                   3.0                  5.0  
30                   3.0                  5.0  

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
TomBriggs35343              3
BeggarmanThe11475           4
KashmirCloakThe2874         1
CloudedSkyThe11305          1
MikeCooneysFancy3481        1
                           ..
BulgarianThe24599           1


Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2088181.26it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   4%|▍         | 33070/741454 [00:00<00:02, 330683.76it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe4101:
(5, 4, 0, 7, 5, 4)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 415334.11it/s]



84 Similar patterns detected:
                     ngram  DL distance
7       (5, 4, 0, 7, 5, 4)          0.0
0          (4, 0, 7, 5, 4)          1.0
60   (5, 4, 0, 9, 7, 5, 4)          1.0
59  (11, 5, 4, 0, 7, 5, 4)          1.0
58   (5, 4, 0, 0, 7, 5, 4)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
MyTwoFeet40561             1
Lochanside24182            1
DownTheGreenFields28924    3
BlackRogueThe1076          1
Rainmaker8751              1
                          ..
PlanxtyJoeBurke28157       3
JacksonsDream24770         1
CherishTheLadies25984      1
JimmyDoyles19753           1
RectorAtTheFeis17764       1
Name: pattern presence, Length: 1166, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe20663

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2128022.48it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe4101:
(5, 4, 0, 7, 5, 4)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 437885.76it/s]



84 Similar patterns detected:
                     ngram  DL distance
7       (5, 4, 0, 7, 5, 4)          0.0
0          (4, 0, 7, 5, 4)          1.0
60   (5, 4, 0, 9, 7, 5, 4)          1.0
59  (11, 5, 4, 0, 7, 5, 4)          1.0
58   (5, 4, 0, 0, 7, 5, 4)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
MyTwoFeet40561             1
Lochanside24182            1
DownTheGreenFields28924    3
BlackRogueThe1076          1
Rainmaker8751              1
                          ..
PlanxtyJoeBurke28157       3
JacksonsDream24770         1
CherishTheLadies25984      1
JimmyDoyles19753           1
RectorAtTheFeis17764       1
Name: pattern presence, Length: 1166, dtype: int64
Similarity results for BlackbirdThe4101 (pattern presence):
                    title  pattern presence
0   PasucaisDeLaVilla9004                 9
1  PasucaisDeLaVilla31256                 9
2        BlackbirdThe4101                 8
3         TommyGunns29363                 8


Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2117134.92it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 438176.41it/s]



84 Similar patterns detected:
                     ngram  DL distance
7       (5, 4, 0, 7, 5, 4)          0.0
0          (4, 0, 7, 5, 4)          1.0
60   (5, 4, 0, 9, 7, 5, 4)          1.0
59  (11, 5, 4, 0, 7, 5, 4)          1.0
58   (5, 4, 0, 0, 7, 5, 4)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
MyTwoFeet40561             1
Lochanside24182            1
DownTheGreenFields28924    3
BlackRogueThe1076          1
Rainmaker8751              1
                          ..
PlanxtyJoeBurke28157       3
JacksonsDream24770         1
CherishTheLadies25984      1
JimmyDoyles19753           1
RectorAtTheFeis17764       1
Name: pattern presence, Length: 1166, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length                    32                 65                         64   

        BraesOfTulliemetThe23904  CamowenThe11581  QuimperThe20663

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2143705.55it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 450125.00it/s]



84 Similar patterns detected:
                     ngram  DL distance
7       (5, 4, 0, 7, 5, 4)          0.0
0          (4, 0, 7, 5, 4)          1.0
60   (5, 4, 0, 9, 7, 5, 4)          1.0
59  (11, 5, 4, 0, 7, 5, 4)          1.0
58   (5, 4, 0, 0, 7, 5, 4)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
MyTwoFeet40561             1
Lochanside24182            1
DownTheGreenFields28924    3
BlackRogueThe1076          1
Rainmaker8751              1
                          ..
PlanxtyJoeBurke28157       3
JacksonsDream24770         1
CherishTheLadies25984      1
JimmyDoyles19753           1
RectorAtTheFeis17764       1
Name: pattern presence, Length: 1166, dtype: int64
Similarity results for BlackbirdThe4101 (pattern presence):
                    title  pattern presence
0   PasucaisDeLaVilla9004                 9
1  PasucaisDeLaVilla31256                 9
2        BlackbirdThe4101                 8
3         TommyGunns29363                 8


Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2086913.37it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe4508:
(2, 7, 0, 2, 11, 7)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 409055.09it/s]



80 Similar patterns detected:
                     ngram  DL distance
23     (2, 7, 0, 2, 11, 7)          0.0
0          (2, 7, 0, 2, 7)          1.0
56  (2, 7, 0, 2, 11, 7, 5)          1.0
55  (2, 7, 0, 2, 11, 9, 7)          1.0
54  (2, 7, 0, 4, 2, 11, 7)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
AnneFraserMacKenzie21588               1
StropTheRazor39234                     1
Nellies16733                           1
CaseyFinnegans6048                     1
NathanielGowsQuickstep9143             1
                                      ..
YLancers21156                          1
HerbReids15793                         1
NielGowsLamentForHisSecondWife35334    1
DoylesFancy24990                       1
RoseCottage27259                       5
Name: pattern presence, Length: 876, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4772  MouldyPintThe7496  LongfordCollectorThe24745  \
length        

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2084072.70it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from BlackbirdThe4508:
(2, 7, 0, 2, 11, 7)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 452041.60it/s]



80 Similar patterns detected:
                     ngram  DL distance
23     (2, 7, 0, 2, 11, 7)          0.0
0          (2, 7, 0, 2, 7)          1.0
56  (2, 7, 0, 2, 11, 7, 5)          1.0
55  (2, 7, 0, 2, 11, 9, 7)          1.0
54  (2, 7, 0, 4, 2, 11, 7)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
AnneFraserMacKenzie21588               1
StropTheRazor39234                     1
Nellies16733                           1
CaseyFinnegans6048                     1
NathanielGowsQuickstep9143             1
                                      ..
YLancers21156                          1
HerbReids15793                         1
NielGowsLamentForHisSecondWife35334    1
DoylesFancy24990                       1
RoseCottage27259                       5
Name: pattern presence, Length: 876, dtype: int64
Similarity results for BlackbirdThe4508 (pattern presence):
                    title  pattern presence
0        StrangerThe17142                 8
1

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2075545.73it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 446892.97it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 427220.00it/s]



147 Similar patterns detected:
                     ngram  DL distance  (4, 2, 7, 0, 2, 11)
35     (2, 7, 0, 2, 11, 7)          0.0                  2.0
0          (2, 7, 0, 2, 7)          1.0                  2.0
97  (2, 7, 0, 4, 2, 11, 7)          1.0                  3.0
96     (2, 7, 0, 3, 11, 7)          1.0                  3.0
95     (7, 2, 0, 2, 11, 7)          1.0                  3.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
AnneFraserMacKenzie21588               2
StropTheRazor39234                     2
Nellies16733                           2
Oblique23252                           2
CaseyFinnegans6048                     1
                                      ..
NielGowsLamentForHisSecondWife35334    3
DoylesFancy24990                       2
RoseCottage27259                       6
EarlOfSpaceThe36462                    2
WeaponsOfNonExistenceThe2841           1
Name: pattern presence, Length: 1098, dtype: int64
Normalising presence 

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2123568.36it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 441512.20it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 416237.83it/s]



147 Similar patterns detected:
                     ngram  DL distance  (4, 2, 7, 0, 2, 11)
35     (2, 7, 0, 2, 11, 7)          0.0                  2.0
0          (2, 7, 0, 2, 7)          1.0                  2.0
97  (2, 7, 0, 4, 2, 11, 7)          1.0                  3.0
96     (2, 7, 0, 3, 11, 7)          1.0                  3.0
95     (7, 2, 0, 2, 11, 7)          1.0                  3.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
AnneFraserMacKenzie21588               2
StropTheRazor39234                     2
Nellies16733                           2
Oblique23252                           2
CaseyFinnegans6048                     1
                                      ..
NielGowsLamentForHisSecondWife35334    3
DoylesFancy24990                       2
RoseCottage27259                       6
EarlOfSpaceThe36462                    2
WeaponsOfNonExistenceThe2841           1
Name: pattern presence, Length: 1098, dtype: int64
Similarity results fo

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2114450.32it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from QueenOfTheEarthChildOfTheSkies27066:
(7, 5, 7, 4, 0, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 422507.17it/s]



85 Similar patterns detected:
                     ngram  DL distance
22      (7, 5, 7, 4, 0, 0)          0.0
0          (7, 7, 4, 0, 0)          1.0
61   (7, 5, 9, 7, 4, 0, 0)          1.0
60  (7, 5, 7, 4, 0, 0, 11)          1.0
59   (7, 5, 7, 4, 0, 0, 9)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
72ndHighlandersFarewellToAberdeenThe28289    1
AnneFraserMacKenzie21588                     1
PlanxtyMaguire29910                          1
StronsayWeaverThe37646                       2
CailinMoRinSa30339                           3
                                            ..
PlanxtyMonaghan3704                          1
PlanxtyJoeBurke28157                         2
JacksonsDream24770                           1
FrancisOConnors29682                         1
BaddeckGatheringThe22956                     2
Name: pattern presence, Length: 1371, dtype: int64
Normalising presence data...
Loading tune length data...
        BoysOfPatstaiThe4

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2117853.74it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo


Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]


Frequent n-gram pattern(s) extracted from QueenOfTheEarthChildOfTheSkies27066:
(7, 5, 7, 4, 0, 0)


Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 460621.94it/s]



85 Similar patterns detected:
                     ngram  DL distance
22      (7, 5, 7, 4, 0, 0)          0.0
0          (7, 7, 4, 0, 0)          1.0
61   (7, 5, 9, 7, 4, 0, 0)          1.0
60  (7, 5, 7, 4, 0, 0, 11)          1.0
59   (7, 5, 7, 4, 0, 0, 9)          1.0

Searching cre_corpus for similar tunes...

Compiling pattern presence data...
72ndHighlandersFarewellToAberdeenThe28289    1
AnneFraserMacKenzie21588                     1
PlanxtyMaguire29910                          1
StronsayWeaverThe37646                       2
CailinMoRinSa30339                           3
                                            ..
PlanxtyMonaghan3704                          1
PlanxtyJoeBurke28157                         2
JacksonsDream24770                           1
FrancisOConnors29682                         1
BaddeckGatheringThe22956                     2
Name: pattern presence, Length: 1371, dtype: int64
Similarity results for QueenOfTheEarthChildOfTheSkies27066 (pattern presence):
   

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2573665.29it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 459110.67it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 460586.80it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 463444.90it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 498222.43it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 474673.97it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 491141.35it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 460868.50it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 457206.51it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 471873.54it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 470827.01it/s]



802 Similar patterns detected:
                      ngram  DL distance  (0, 7, 5, 7, 4, 0)  \
54       (9, 7, 4, 7, 0, 0)          0.0                 3.0   
639  (11, 9, 7, 4, 7, 0, 0)          1.0                 4.0   
319     (11, 7, 4, 7, 0, 0)          1.0                 3.0   
509     (9, 7, 4, 7, 0, 11)          1.0                 4.0   
89       (2, 7, 4, 7, 0, 0)          1.0                 3.0   

     (7, 5, 7, 4, 0, 0)  (0, 4, 7, 7, 4, 0)  (0, 4, 4, 0, 7, 5)  \
54                  3.0                 3.0                 4.0   
639                 3.0                 4.0                 5.0   
319                 3.0                 3.0                 4.0   
509                 4.0                 4.0                 4.0   
89                  3.0                 3.0                 4.0   

     (4, 7, 7, 4, 0, 0)  (5, 5, 0, 4, 7, 7)  (5, 0, 4, 7, 7, 4)  \
54                  2.0                 5.0                 4.0   
639                 3.0                 5.0   

Locating candidate tune in pattern cre_corpus...: 100%|██████████| 40154/40154 [00:00<00:00, 2154427.78it/s]
Calculating pattern similarity...:   0%|          | 0/741454 [00:00<?, ?it/s]

                   ngram      idf  BoysOfPatstaiThe4772  MouldyPintThe7496  \
1547  (0, 0, 0, 0, 0, 0)  7.63632                     0                  0   
1724  (7, 7, 7, 2, 7, 7)  7.72991                     0                  0   
1746  (0, 7, 0, 7, 0, 7)  7.73915                     0                  0   
1750  (7, 7, 7, 7, 7, 7)  7.74225                     0                  0   
2095  (0, 7, 2, 0, 0, 7)  7.90361                     0                  0   

      LongfordCollectorThe24745  BraesOfTulliemetThe23904  CamowenThe11581  \
1547                          0                         0                0   
1724                          0                         0                0   
1746                          0                         0                0   
1750                          0                         0                0   
2095                          0                         0                0   

      QuimperThe20663  WellAllLieTogether19130  LInconnuDeLimo

Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 432786.62it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 450415.37it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 455705.59it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 460721.29it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 455944.97it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 485663.03it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 443863.50it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 448969.07it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 448693.83it/s]
Calculating pattern similarity...: 100%|██████████| 741454/741454 [00:01<00:00, 448538.32it/s]



802 Similar patterns detected:
                      ngram  DL distance  (0, 7, 5, 7, 4, 0)  \
54       (9, 7, 4, 7, 0, 0)          0.0                 3.0   
639  (11, 9, 7, 4, 7, 0, 0)          1.0                 4.0   
319     (11, 7, 4, 7, 0, 0)          1.0                 3.0   
509     (9, 7, 4, 7, 0, 11)          1.0                 4.0   
89       (2, 7, 4, 7, 0, 0)          1.0                 3.0   

     (7, 5, 7, 4, 0, 0)  (0, 4, 7, 7, 4, 0)  (0, 4, 4, 0, 7, 5)  \
54                  3.0                 3.0                 4.0   
639                 3.0                 4.0                 5.0   
319                 3.0                 3.0                 4.0   
509                 4.0                 4.0                 4.0   
89                  3.0                 3.0                 4.0   

     (4, 7, 7, 4, 0, 0)  (5, 5, 0, 4, 7, 7)  (5, 0, 4, 7, 7, 4)  \
54                  2.0                 5.0                 4.0   
639                 3.0                 5.0   