In [1]:
# Reset the interactive namespace so the notebook starts from a clean slate.
# Every public (non-underscore) global is removed, except the handles that
# IPython injects into the user namespace (`In`, `Out`, `exit`, `quit`,
# `get_ipython`); deleting those would take history access and the shell
# handle away for the rest of the session.
# Underscore-prefixed helper names are used so the cleanup does not itself
# leave a new public variable behind.
_ipython_names = {'In', 'Out', 'exit', 'quit', 'get_ipython'}
for _stale in [n for n in dir() if not n.startswith('_') and n not in _ipython_names]:
    del globals()[_stale]

In [2]:
import os

import matplotlib
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

In [3]:
SEED = 2000
np.random.seed(SEED)
pd.options.display.max_columns = None

# To plot pretty figures
%matplotlib inline
plt.rcParams['axes.labelsize'] = 14
plt.rcParams['xtick.labelsize'] = 12
plt.rcParams['ytick.labelsize'] = 12
plt.rcParams['figure.figsize'] = 10, 10

# Where to save the figures
PROJECT_ROOT_DIR = "."
TITLE_ID = "speech_features"

def save_fig(fig_id, tight_layout=True):
    """Save the current matplotlib figure as a 300-dpi PNG.

    The file is written to ``<PROJECT_ROOT_DIR>/figures/<fig_id>.png``. The
    ``figures`` directory is created when it does not exist yet, because
    ``plt.savefig`` does not create missing parent directories.

    Parameters
    ----------
    fig_id : str
        File name (without extension) for the saved figure.
    tight_layout : bool, default True
        When true, ``plt.tight_layout()`` is called before saving.
    """
    figures_dir = os.path.join(PROJECT_ROOT_DIR, "figures")
    os.makedirs(figures_dir, exist_ok=True)
    path = os.path.join(figures_dir, fig_id + ".png")
    print("Saving figure", fig_id)
    if tight_layout:
        plt.tight_layout()
    plt.savefig(path, format='png', dpi=300)

In [4]:
# Read the comma-separated measurements table into a DataFrame
path = 'data.csv'
df = pd.read_csv(filepath_or_buffer=path, delimiter=",")

In [5]:
# Quick look at the first five rows
df.head(n=5)

Unnamed: 0,soundname,nsyll,npause,dur (s),phonationtime (s),speechrate (nsyll/dur),articulation rate (nsyll / phonationtime),ASD (speakingtime/nsyll),Materials,Participant
0,27KD-WDB8-YP2F-audio2-kakburk,486,35,135.53,113.56,3.59,4.28,0.234,new,patient
1,2MDJ-RVRY-UJPT-audio2-kakburk,262,24,86.29,65.67,3.04,3.99,0.251,new,patient
2,32WJ-FB3B-S64F-audio2-kakburk,235,36,95.71,56.49,2.46,4.16,0.24,new,patient
3,338H-F93S-5Y5P-audio2-kakburk,39,5,14.54,9.15,2.68,4.26,0.235,new,patient
4,3N4A-3G7P-LHWE-audio2-kakburk,361,34,122.7,83.38,2.94,4.33,0.231,new,patient


In [6]:
# The speaker ID is the first 14 characters of the recording name,
# e.g. '27KD-WDB8-YP2F' from '27KD-WDB8-YP2F-audio2-kakburk'
df['speaker'] = df['soundname'].str.slice(0, 14)

In [7]:
# Correct one mistyped speaker ID ('5K4H' -> '5KH4').
# The assignment is restricted to the 'speaker' column with .loc: assigning to
# a boolean-masked frame (df[mask] = value) would write the ID string into
# every column of the matching rows and wipe their measurements.
df.loc[df['speaker'] == 'LABM-75GG-5K4H', 'speaker'] = 'LABM-75GG-5KH4'

In [8]:
# Seed each metadata column with the speaker ID; the IDs are swapped for the
# real per-speaker values in a later step.
for _meta_col in ('age', 'gender', 'condition', 'MMSE', 'education'):
    df[_meta_col] = df['speaker']

In [9]:
# Per-speaker metadata lookup tables.
# Outer keys are DataFrame column names ('age', 'gender', 'condition', 'MMSE',
# 'education'); each inner dict maps a 14-character speaker ID to the value for
# that column. Every value is stored as a string, including the numeric ones.
# The table is applied with df.replace(...) in the following cell.
# NOTE(review): "PWPP-D5EX-EJDN" is listed under age/gender/condition but not
# under MMSE/education, and differs from "PWPP-D5EX-EIDN" by one character --
# possibly a typo variant of the same speaker; confirm.
cleanup_nums = {"age":
# speaker ID -> age (presumably in years -- TODO confirm)
{"WDWD-XU5H-2EXS" : "70",
"ZD3N-YVLS-83FK" : "71",
"UGLP-E76L-2F98" : "76",
"XC2P-PRBL-8REY" : "65",
"VCR4-AKGC-MJBK" : "65",
"53AC-AP7Q-7UKA" : "78",
"4Y2B-KLTS-6UWA" : "75",
"5DJF-CPGZ-BUGQ" : "78",
"3WLV-CYG6-GXAL" : "66",
"5KVZ-SG7W-UQ6E" : "58",
"RGH4-HSN4-GCMR" : "58",
"8LZM-NGHA-PRWM" : "58",
"YZBC-5BN2-ZWCA" : "62",
"T4UG-98R9-RDCS" : "60",
"TXLH-R239-CPQG" : "74",
"ZDTD-KWQQ-JGPB" : "73",
"LABM-75GG-5KH4" : "72",
"U89K-H28U-NKZ9" : "70",
"S8S8-TGDH-LG9H" : "57",
"M4NC-ELN3-WJBA" : "77",
"XTQN-WA4V-39Y7" : "76",
"XPEU-R5UC-JYUJ" : "74",
"R4SL-RNDM-UJCG" : "72",
"RMHT-ZRLX-S59E" : "58",
"SFBG-TTUN-B8Y7" : "72",
"S47G-BTHK-MMHG" : "55",
"STGY-LEC5-AC2H" : "70",
"ZFBE-82GF-SERT" : "55",
"VYGF-G4MF-27S5" : "72",
"WFBN-8TLU-ZKA4" : "67",
"T6NM-JN4H-4PFM" : "57",
"VDS6-5ULJ-X7YZ" : "68",
"W4N3-62QL-KMZN" : "73",
"V56M-J6RZ-MCLU" : "72",
"TAHE-J5KC-XXTL" : "70",
"TK5R-Y7L4-458U" : "71",
"NU94-Z6MG-K85T" : "65",
"M9S8-UYGU-Q865" : "79",
"PWCG-RX8N-W8NB" : "73",
"D59B-5ZYP-SZPQ" : "71",
"79PA-NFUF-3HEQ" : "78",
"FAGL-HXK3-LBSD" : "76",
"84BU-QCK7-2N8M" : "77",
"63Z2-JEMQ-EQ7N" : "74",
"32WJ-FB3B-S64F" : "72",
"GQ28-X6XM-YSXF" : "73",
"FTPL-RAE7-HJM7" : "71",
"CLAZ-JCKM-JFQT" : "58",
"A2A7-6E6H-H5GJ" : "63",
"X53K-6TFA-C2ST" : "70",
"8GBU-GFRE-QUZR" : "66",
"CRG2-7X84-BLWF" : "68",
"2MDJ-RVRY-UJPT" : "63",
"338H-F93S-5Y5P" : "72",
"PMZM-UYEH-ZSZW" : "75",
"79CJ-M7A3-FALX" : "64",
"7AGX-DJD3-UK39" : "72",
"GA8A-2E3B-LX6F" : "64",
"PWPP-D5EX-EIDN" : "75",
"9EL8-FFJJ-TG5R" : "72",
"HA6B-9WJS-XKES" : "63",
"H2D9-Q75Y-3GDT" : "78",
"7AL7-ACFY-T3JC" : "66",
"MXF3-B9HZ-XPTT" : "66",
"JXQ5-T9DF-F75B" : "58",
"BPYV-H5DR-66TJ" : "72",
"P8X7-9J36-36PQ" : "73",
"8ZMZ-SBTA-MQRP" : "71",
"PWPP-D5EX-EJDN" : "75",
"RUR8-7Z9V-LURB" : "54",
"NTGA-T37M-P8YW" : "72",
"MNFG-MFWA-H3KE" : "71",
"3N4A-3G7P-LHWE" : "69",
"3RQD-KCAQ-UGHK" : "64",
"PTRC-MTWD-BPWV" : "64",
"Q9GV-3VGJ-8Y5Z" : "53",
"KQ4P-55A6-5MML" : "58",
"27KD-WDB8-YP2F" : "70",
"KE3V-PF7F-F59Y" : "74",
"3PRQ-6LYG-6ZTY" : "73",
"8DUH-BE7V-YYBG" : "72",
"6W42-V2GN-MXNM" : "53",
"AVF7-4HU9-N99R" : "71",
"BBB3-ZXUV-448Q" : "70",
"N9NL-VGG3-JPUY" : "70",
"8U3R-J54J-EVXC" : "66",
"3TUP-R5PQ-D4WT" : "70",
"7XHB-V5AT-W3CY" : "74",
"H63Z-TGYG-48JQ" : "72",
"8AMP-SKYB-84H5" : "59",
"84QY-JTL9-4H9C" : "59",
"8FM9-X6A2-3TUN" : "67"},
                
# speaker ID -> gender code ("M" or "F")
"gender":
{"WDWD-XU5H-2EXS" : "M", 
"ZD3N-YVLS-83FK" : "M", 
"UGLP-E76L-2F98" : "F", 
"XC2P-PRBL-8REY" : "F", 
"VCR4-AKGC-MJBK" : "F", 
"53AC-AP7Q-7UKA" : "M", 
"4Y2B-KLTS-6UWA" : "F", 
"5DJF-CPGZ-BUGQ" : "F", 
"3WLV-CYG6-GXAL" : "F", 
"5KVZ-SG7W-UQ6E" : "F", 
"RGH4-HSN4-GCMR" : "F", 
"8LZM-NGHA-PRWM" : "F", 
"YZBC-5BN2-ZWCA" : "M", 
"T4UG-98R9-RDCS" : "M", 
"TXLH-R239-CPQG" : "F", 
"ZDTD-KWQQ-JGPB" : "F", 
"LABM-75GG-5KH4" : "M", 
"U89K-H28U-NKZ9" : "F", 
"S8S8-TGDH-LG9H" : "F", 
"M4NC-ELN3-WJBA" : "F", 
"XTQN-WA4V-39Y7" : "F", 
"XPEU-R5UC-JYUJ" : "M", 
"R4SL-RNDM-UJCG" : "F", 
"RMHT-ZRLX-S59E" : "M", 
"SFBG-TTUN-B8Y7" : "F", 
"S47G-BTHK-MMHG" : "F", 
"STGY-LEC5-AC2H" : "M", 
"ZFBE-82GF-SERT" : "F", 
"VYGF-G4MF-27S5" : "M", 
"WFBN-8TLU-ZKA4" : "F", 
"T6NM-JN4H-4PFM" : "F", 
"VDS6-5ULJ-X7YZ" : "F", 
"W4N3-62QL-KMZN" : "M", 
"V56M-J6RZ-MCLU" : "M", 
"TAHE-J5KC-XXTL" : "F", 
"TK5R-Y7L4-458U" : "M", 
"NU94-Z6MG-K85T" : "F", 
"M9S8-UYGU-Q865" : "F", 
"PWCG-RX8N-W8NB" : "F", 
"D59B-5ZYP-SZPQ" : "F", 
"79PA-NFUF-3HEQ" : "F", 
"FAGL-HXK3-LBSD" : "F", 
"84BU-QCK7-2N8M" : "F", 
"63Z2-JEMQ-EQ7N" : "F", 
"32WJ-FB3B-S64F" : "F", 
"GQ28-X6XM-YSXF" : "F", 
"FTPL-RAE7-HJM7" : "F", 
"CLAZ-JCKM-JFQT" : "F", 
"A2A7-6E6H-H5GJ" : "F", 
"X53K-6TFA-C2ST" : "F", 
"8GBU-GFRE-QUZR" : "F", 
"CRG2-7X84-BLWF" : "F", 
"2MDJ-RVRY-UJPT" : "M", 
"338H-F93S-5Y5P" : "M", 
"PMZM-UYEH-ZSZW" : "M", 
"79CJ-M7A3-FALX" : "M", 
"7AGX-DJD3-UK39" : "M", 
"GA8A-2E3B-LX6F" : "M", 
"PWPP-D5EX-EIDN" : "M", 
"9EL8-FFJJ-TG5R" : "M", 
"HA6B-9WJS-XKES" : "M", 
"H2D9-Q75Y-3GDT" : "M", 
"7AL7-ACFY-T3JC" : "M", 
"MXF3-B9HZ-XPTT" : "M", 
"JXQ5-T9DF-F75B" : "M", 
"BPYV-H5DR-66TJ" : "M", 
"P8X7-9J36-36PQ" : "M", 
"8ZMZ-SBTA-MQRP" : "M", 
"PWPP-D5EX-EJDN" : "M",
"RUR8-7Z9V-LURB" : "F", 
"NTGA-T37M-P8YW" : "F", 
"MNFG-MFWA-H3KE" : "F", 
"3N4A-3G7P-LHWE" : "F", 
"3RQD-KCAQ-UGHK" : "F", 
"PTRC-MTWD-BPWV" : "F", 
"Q9GV-3VGJ-8Y5Z" : "F", 
"KQ4P-55A6-5MML" : "F",
"27KD-WDB8-YP2F" : "F", 
"KE3V-PF7F-F59Y" : "F", 
"3PRQ-6LYG-6ZTY" : "F", 
"8DUH-BE7V-YYBG" : "F", 
"6W42-V2GN-MXNM" : "F", 
"AVF7-4HU9-N99R" : "F", 
"BBB3-ZXUV-448Q" : "M", 
"N9NL-VGG3-JPUY" : "M", 
"8U3R-J54J-EVXC" : "M", 
"3TUP-R5PQ-D4WT" : "M", 
"7XHB-V5AT-W3CY" : "M", 
"H63Z-TGYG-48JQ" : "M", 
"8AMP-SKYB-84H5" : "M", 
"84QY-JTL9-4H9C" : "M", 
"8FM9-X6A2-3TUN" : "M"},

# speaker ID -> group label, one of "HC", "MCI", "SCI"
# (presumably healthy control / mild / subjective cognitive impairment -- TODO confirm)
"condition":
{"WDWD-XU5H-2EXS" : "HC",
"ZD3N-YVLS-83FK" : "HC",
"UGLP-E76L-2F98" : "HC",
"XC2P-PRBL-8REY" : "HC",
"VCR4-AKGC-MJBK" : "HC",
"53AC-AP7Q-7UKA" : "HC",
"4Y2B-KLTS-6UWA" : "HC",
"5DJF-CPGZ-BUGQ" : "HC",
"3WLV-CYG6-GXAL" : "HC",
"5KVZ-SG7W-UQ6E" : "HC",
"RGH4-HSN4-GCMR" : "HC",
"8LZM-NGHA-PRWM" : "HC",
"YZBC-5BN2-ZWCA" : "HC",
"T4UG-98R9-RDCS" : "HC",
"TXLH-R239-CPQG" : "HC",
"ZDTD-KWQQ-JGPB" : "HC",
"LABM-75GG-5KH4" : "HC",
"U89K-H28U-NKZ9" : "HC",
"S8S8-TGDH-LG9H" : "HC",
"M4NC-ELN3-WJBA" : "HC",
"XTQN-WA4V-39Y7" : "HC",
"XPEU-R5UC-JYUJ" : "HC",
"R4SL-RNDM-UJCG" : "HC",
"RMHT-ZRLX-S59E" : "HC",
"SFBG-TTUN-B8Y7" : "HC",
"S47G-BTHK-MMHG" : "HC",
"STGY-LEC5-AC2H" : "HC",
"ZFBE-82GF-SERT" : "HC",
"VYGF-G4MF-27S5" : "HC",
"WFBN-8TLU-ZKA4" : "HC",
"T6NM-JN4H-4PFM" : "HC",
"VDS6-5ULJ-X7YZ" : "HC",
"W4N3-62QL-KMZN" : "HC",
"V56M-J6RZ-MCLU" : "HC",
"TAHE-J5KC-XXTL" : "HC",
"TK5R-Y7L4-458U" : "HC",
"NU94-Z6MG-K85T" : "MCI",
"M9S8-UYGU-Q865" : "MCI",
"PWCG-RX8N-W8NB" : "MCI",
"D59B-5ZYP-SZPQ" : "MCI",
"79PA-NFUF-3HEQ" : "MCI",
"FAGL-HXK3-LBSD" : "MCI",
"84BU-QCK7-2N8M" : "MCI",
"63Z2-JEMQ-EQ7N" : "MCI",
"32WJ-FB3B-S64F" : "MCI",
"GQ28-X6XM-YSXF" : "MCI",
"FTPL-RAE7-HJM7" : "MCI",
"CLAZ-JCKM-JFQT" : "MCI",
"A2A7-6E6H-H5GJ" : "MCI",
"X53K-6TFA-C2ST" : "MCI",
"8GBU-GFRE-QUZR" : "MCI",
"CRG2-7X84-BLWF" : "MCI",
"2MDJ-RVRY-UJPT" : "MCI",
"338H-F93S-5Y5P" : "MCI",
"PMZM-UYEH-ZSZW" : "MCI",
"79CJ-M7A3-FALX" : "MCI",
"7AGX-DJD3-UK39" : "MCI",
"GA8A-2E3B-LX6F" : "MCI",
"PWPP-D5EX-EIDN" : "MCI",
"9EL8-FFJJ-TG5R" : "MCI",
"HA6B-9WJS-XKES" : "MCI",
"H2D9-Q75Y-3GDT" : "MCI",
"7AL7-ACFY-T3JC" : "MCI",
"MXF3-B9HZ-XPTT" : "MCI",
"JXQ5-T9DF-F75B" : "MCI",
"BPYV-H5DR-66TJ" : "MCI",
"P8X7-9J36-36PQ" : "MCI",
"8ZMZ-SBTA-MQRP" : "MCI",
"PWPP-D5EX-EJDN" : "MCI",
"RUR8-7Z9V-LURB" : "SCI",
"NTGA-T37M-P8YW" : "SCI",
"MNFG-MFWA-H3KE" : "SCI",
"3N4A-3G7P-LHWE" : "SCI",
"3RQD-KCAQ-UGHK" : "SCI",
"PTRC-MTWD-BPWV" : "SCI",
"Q9GV-3VGJ-8Y5Z" : "SCI",
"KQ4P-55A6-5MML" : "SCI",
"27KD-WDB8-YP2F" : "SCI",
"KE3V-PF7F-F59Y" : "SCI",
"3PRQ-6LYG-6ZTY" : "SCI",
"8DUH-BE7V-YYBG" : "SCI",
"6W42-V2GN-MXNM" : "SCI",
"AVF7-4HU9-N99R" : "SCI",
"BBB3-ZXUV-448Q" : "SCI",
"N9NL-VGG3-JPUY" : "SCI",
"8U3R-J54J-EVXC" : "SCI",
"3TUP-R5PQ-D4WT" : "SCI",
"7XHB-V5AT-W3CY" : "SCI",
"H63Z-TGYG-48JQ" : "SCI",
"8AMP-SKYB-84H5" : "SCI",
"84QY-JTL9-4H9C" : "SCI",
"8FM9-X6A2-3TUN" : "SCI"},
               
# speaker ID -> MMSE score as a string; "VCR4-AKGC-MJBK" carries the literal
# string "NA" rather than a number
"MMSE" :
{"27KD-WDB8-YP2F" : "30",
"2MDJ-RVRY-UJPT" : "30",
"32WJ-FB3B-S64F" : "28",
"338H-F93S-5Y5P" : "28",
"3N4A-3G7P-LHWE" : "30",
"3PRQ-6LYG-6ZTY" : "30",
"3RQD-KCAQ-UGHK" : "30",
"3TUP-R5PQ-D4WT" : "30",
"3WLV-CYG6-GXAL" : "29",
"4Y2B-KLTS-6UWA" : "30",
"53AC-AP7Q-7UKA" : "29",
"5DJF-CPGZ-BUGQ" : "30",
"5KVZ-SG7W-UQ6E" : "29",
"63Z2-JEMQ-EQ7N" : "29",
"6W42-V2GN-MXNM" : "28",
"79CJ-M7A3-FALX" : "28",
"79PA-NFUF-3HEQ" : "28",
"7AGX-DJD3-UK39" : "28",
"7AL7-ACFY-T3JC" : "30",
"7XHB-V5AT-W3CY" : "30",
"84BU-QCK7-2N8M" : "30",
"84QY-JTL9-4H9C" : "30",
"8AMP-SKYB-84H5" : "30",
"8DUH-BE7V-YYBG" : "29",
"8FM9-X6A2-3TUN" : "30",
"8GBU-GFRE-QUZR" : "28",
"8LZM-NGHA-PRWM" : "30",
"8U3R-J54J-EVXC" : "30",
"8ZMZ-SBTA-MQRP" : "29",
"9EL8-FFJJ-TG5R" : "30",
"A2A7-6E6H-H5GJ" : "29",
"AVF7-4HU9-N99R" : "30",
"BBB3-ZXUV-448Q" : "28",
"BPYV-H5DR-66TJ" : "27",
"CLAZ-JCKM-JFQT" : "28",
"CRG2-7X84-BLWF" : "28",
"D59B-5ZYP-SZPQ" : "25",
"FAGL-HXK3-LBSD" : "27",
"FTPL-RAE7-HJM7" : "26",
"GA8A-2E3B-LX6F" : "25",
"GQ28-X6XM-YSXF" : "29",
"H2D9-Q75Y-3GDT" : "29",
"H63Z-TGYG-48JQ" : "30",
"HA6B-9WJS-XKES" : "29",
"JXQ5-T9DF-F75B" : "29",
"KE3V-PF7F-F59Y" : "30",
"KQ4P-55A6-5MML" : "30",
"LABM-75GG-5KH4" : "28",
"M4NC-ELN3-WJBA" : "30",
"M9S8-UYGU-Q865" : "30",
"MNFG-MFWA-H3KE" : "28",
"MXF3-B9HZ-XPTT" : "29",
"N9NL-VGG3-JPUY" : "29",
"NTGA-T37M-P8YW" : "29",
"NU94-Z6MG-K85T" : "27",
"P8X7-9J36-36PQ" : "27",
"PMZM-UYEH-ZSZW" : "29",
"PTRC-MTWD-BPWV" : "30",
"PWCG-RX8N-W8NB" : "28",
"PWPP-D5EX-EIDN" : "26",
"Q9GV-3VGJ-8Y5Z" : "30",
"R4SL-RNDM-UJCG" : "30",
"RGH4-HSN4-GCMR" : "30",
"RMHT-ZRLX-S59E" : "30",
"RUR8-7Z9V-LURB" : "27",
"S47G-BTHK-MMHG" : "28",
"S8S8-TGDH-LG9H" : "29",
"SFBG-TTUN-B8Y7" : "30",
"STGY-LEC5-AC2H" : "30",
"T4UG-98R9-RDCS" : "30",
"T6NM-JN4H-4PFM" : "29",
"TAHE-J5KC-XXTL" : "30",
"TK5R-Y7L4-458U" : "30",
"TXLH-R239-CPQG" : "30",
"U89K-H28U-NKZ9" : "30",
"UGLP-E76L-2F98" : "29",
"W4N3-62QL-KMZN" : "30",
"V56M-J6RZ-MCLU" : "30",
"VCR4-AKGC-MJBK" : "NA",
"VDS6-5ULJ-X7YZ" : "29",
"WDWD-XU5H-2EXS" : "30",
"WFBN-8TLU-ZKA4" : "29",
"VYGF-G4MF-27S5" : "30",
"X53K-6TFA-C2ST" : "30",
"XC2P-PRBL-8REY" : "30",
"XPEU-R5UC-JYUJ" : "29",
"XTQN-WA4V-39Y7" : "30",
"YZBC-5BN2-ZWCA" : "30",
"ZD3N-YVLS-83FK" : "29",
"ZDTD-KWQQ-JGPB" : "30",
"ZFBE-82GF-SERT" : "29"},

# speaker ID -> education (presumably years of schooling -- TODO confirm)
"education":
{"27KD-WDB8-YP2F" : "18",
"2MDJ-RVRY-UJPT" : "9",
"32WJ-FB3B-S64F" : "15",
"338H-F93S-5Y5P" : "10",
"3N4A-3G7P-LHWE" : "17",
"3PRQ-6LYG-6ZTY" : "15",
"3RQD-KCAQ-UGHK" : "17",
"3TUP-R5PQ-D4WT" : "12",
"3WLV-CYG6-GXAL" : "12",
"4Y2B-KLTS-6UWA" : "10",
"53AC-AP7Q-7UKA" : "9",
"5DJF-CPGZ-BUGQ" : "8",
"5KVZ-SG7W-UQ6E" : "15",
"63Z2-JEMQ-EQ7N" : "11",
"6W42-V2GN-MXNM" : "19",
"79CJ-M7A3-FALX" : "12",
"79PA-NFUF-3HEQ" : "17",
"7AGX-DJD3-UK39" : "8",
"7AL7-ACFY-T3JC" : "15",
"7XHB-V5AT-W3CY" : "17",
"84BU-QCK7-2N8M" : "18",
"84QY-JTL9-4H9C" : "14",
"8AMP-SKYB-84H5" : "20",
"8DUH-BE7V-YYBG" : "16",
"8FM9-X6A2-3TUN" : "16",
"8GBU-GFRE-QUZR" : "15",
"8LZM-NGHA-PRWM" : "11",
"8U3R-J54J-EVXC" : "14",
"8ZMZ-SBTA-MQRP" : "12",
"9EL8-FFJJ-TG5R" : "15",
"A2A7-6E6H-H5GJ" : "15",
"AVF7-4HU9-N99R" : "15",
"BBB3-ZXUV-448Q" : "16",
"BPYV-H5DR-66TJ" : "19",
"CLAZ-JCKM-JFQT" : "15",
"CRG2-7X84-BLWF" : "8",
"D59B-5ZYP-SZPQ" : "11",
"FAGL-HXK3-LBSD" : "9",
"FTPL-RAE7-HJM7" : "11",
"GA8A-2E3B-LX6F" : "17",
"GQ28-X6XM-YSXF" : "17",
"H2D9-Q75Y-3GDT" : "15",
"H63Z-TGYG-48JQ" : "18",
"HA6B-9WJS-XKES" : "16",
"JXQ5-T9DF-F75B" : "17",
"KE3V-PF7F-F59Y" : "13",
"KQ4P-55A6-5MML" : "18",
"LABM-75GG-5KH4" : "16",
"M4NC-ELN3-WJBA" : "24",
"M9S8-UYGU-Q865" : "16",
"MNFG-MFWA-H3KE" : "18",
"MXF3-B9HZ-XPTT" : "14",
"N9NL-VGG3-JPUY" : "17",
"NTGA-T37M-P8YW" : "15",
"NU94-Z6MG-K85T" : "9",
"P8X7-9J36-36PQ" : "20",
"PMZM-UYEH-ZSZW" : "20",
"PTRC-MTWD-BPWV" : "12",
"PWCG-RX8N-W8NB" : "15",
"PWPP-D5EX-EIDN" : "18",
"Q9GV-3VGJ-8Y5Z" : "16",
"R4SL-RNDM-UJCG" : "9",
"RGH4-HSN4-GCMR" : "14",
"RMHT-ZRLX-S59E" : "19",
"RUR8-7Z9V-LURB" : "18",
"S47G-BTHK-MMHG" : "15",
"S8S8-TGDH-LG9H" : "13",
"SFBG-TTUN-B8Y7" : "12",
"STGY-LEC5-AC2H" : "14",
"T4UG-98R9-RDCS" : "11",
"T6NM-JN4H-4PFM" : "18",
"TAHE-J5KC-XXTL" : "12",
"TK5R-Y7L4-458U" : "14",
"TXLH-R239-CPQG" : "9",
"U89K-H28U-NKZ9" : "13",
"UGLP-E76L-2F98" : "11",
"W4N3-62QL-KMZN" : "14",
"V56M-J6RZ-MCLU" : "18",
"VCR4-AKGC-MJBK" : "9",
"VDS6-5ULJ-X7YZ" : "19",
"WDWD-XU5H-2EXS" : "14",
"WFBN-8TLU-ZKA4" : "11",
"VYGF-G4MF-27S5" : "15",
"X53K-6TFA-C2ST" : "11",
"XC2P-PRBL-8REY" : "14",
"XPEU-R5UC-JYUJ" : "12",
"XTQN-WA4V-39Y7" : "15",
"YZBC-5BN2-ZWCA" : "12",
"ZD3N-YVLS-83FK" : "9",
"ZDTD-KWQQ-JGPB" : "11",
"ZFBE-82GF-SERT" : "12"}                
               }

In [10]:
# Swap the speaker IDs held in each metadata column for that speaker's value,
# one column at a time; columns missing from the frame are skipped.
for _column, _lookup in cleanup_nums.items():
    if _column in df:
        df[_column] = df[_column].replace(_lookup)

In [11]:
# Write the annotated table to disk (row index included, as before)
df.to_csv(path_or_buf="final.csv")

In [12]:
# List every speaker ID, one per line
for speaker_id in df['speaker']:
    print(speaker_id)

27KD-WDB8-YP2F
2MDJ-RVRY-UJPT
32WJ-FB3B-S64F
338H-F93S-5Y5P
3N4A-3G7P-LHWE
3RQD-KCAQ-UGHK
3TUP-R5PQ-D4WT
3WLV-CYG6-GXAL
4Y2B-KLTS-6UWA
53AC-AP7Q-7UKA
5DJF-CPGZ-BUGQ
5KVZ-SG7W-UQ6E
63Z2-JEMQ-EQ7N
6W42-V2GN-MXNM
79CJ-M7A3-FALX
79PA-NFUF-3HEQ
7AL7-ACFY-T3JC
7XHB-V5AT-W3CY
84BU-QCK7-2N8M
84QY-JTL9-4H9C
8AMP-SKYB-84H5
8FM9-X6A2-3TUN
8LZM-NGHA-PRWM
8U3R-J54J-EVXC
8ZMZ-SBTA-MQRP
9EL8-FFJJ-TG5R
A2A7-6E6H-H5GJ
AVF7-4HU9-N99R
BBB3-ZXUV-448Q
BPYV-H5DR-66TJ
CLAZ-JCKM-JFQT
CRG2-7X84-BLWF
FAGL-HXK3-LBSD
GQ28-X6XM-YSXF
H2D9-Q75Y-3GDT
KE3V-PF7F-F59Y
KQ4P-55A6-5MML
LABM-75GG-5KH4
M4NC-ELN3-WJBA
M9S8-UYGU-Q865
MNFG-MFWA-H3KE
MXF3-B9HZ-XPTT
N9NL-VGG3-JPUY
NTGA-T37M-P8YW
NU94-Z6MG-K85T
PMZM-UYEH-ZSZW
PTRC-MTWD-BPWV
PWPP-D5EX-EIDN
Q9GV-3VGJ-8Y5Z
RGH4-HSN4-GCMR
RMHT-ZRLX-S59E
S8S8-TGDH-LG9H
SFBG-TTUN-B8Y7
STGY-LEC5-AC2H
T4UG-98R9-RDCS
T6NM-JN4H-4PFM
TAHE-J5KC-XXTL
TK5R-Y7L4-458U
TXLH-R239-CPQG
U89K-H28U-NKZ9
UGLP-E76L-2F98
V56M-J6RZ-MCLU
VCR4-AKGC-MJBK
VDS6-5ULJ-X7YZ
VYGF-G4MF-27S5
W4N3-62QL-KMZN
WDWD-XU5H-