In [19]:
import pandas as pd

# header=None tells pandas that no row of the file is a header row, so the two
# column names are supplied explicitly through `names`.
df = pd.read_csv(
    'dataset/Naive_Classifier.csv',
    header=None,
    names=['label', 'value'],
)

# Preview the first five rows
df.head()

Unnamed: 0,label,value
0,address,"s/o saminathan28/3 nagar 3rd , street, korattu..."
1,address,"flat 6 ird main 4h nagar, mookordapalli, 635126"
2,address,1169 kaviyarasu kannadasan nagar kodungaiyur ...
3,address,1568 bhagavath 21. nedumkadu thiruvananthapur...
4,address,22 nehru colony kumarapalnvam coimbatore ici ...


In [20]:
# Size of the loaded frame as a (rows, columns) tuple
df.shape

(180741, 2)

In [21]:
# Count the missing values in each column
df.isna().sum()

label    0
value    1
dtype: int64

In [22]:
# Discard every row that has a missing value in any column (the pandas defaults,
# spelled out), then show the size of what is left
df = df.dropna(axis=0, how='any')
df.shape

(180740, 2)

In [23]:
# Preview the first five rows again now that rows with nulls have been dropped
df.head()

Unnamed: 0,label,value
0,address,"s/o saminathan28/3 nagar 3rd , street, korattu..."
1,address,"flat 6 ird main 4h nagar, mookordapalli, 635126"
2,address,1169 kaviyarasu kannadasan nagar kodungaiyur ...
3,address,1568 bhagavath 21. nedumkadu thiruvananthapur...
4,address,22 nehru colony kumarapalnvam coimbatore ici ...


The `label` field consists of categorical data, so it needs to be converted to numerical data: <br>

0 -----------> Address <br>
1 -----------> Name

In [26]:
# Encode the categorical labels as integers: 'address' -> 0, 'name' -> 1.
# Series.map returns NaN for any value that is not a key of the dict, so running
# this cell a second time (when the column already holds 0/1) would wipe out every
# label. The dtype guard makes the cell safe to re-run: once the column is numeric
# it is left untouched.
if not pd.api.types.is_numeric_dtype(df['label']):
    df['label'] = df['label'].map({'address': 0, 'name': 1})
df.head()  # preview the first five rows with the encoded labels


Unnamed: 0,label,value
0,0,"s/o saminathan28/3 nagar 3rd , street, korattu..."
1,0,"flat 6 ird main 4h nagar, mookordapalli, 635126"
2,0,1169 kaviyarasu kannadasan nagar kodungaiyur ...
3,0,1568 bhagavath 21. nedumkadu thiruvananthapur...
4,0,22 nehru colony kumarapalnvam coimbatore ici ...


In [27]:
# Hold out part of the data for evaluation
from sklearn.model_selection import train_test_split

# Inputs are the raw text in 'value'; targets are the 'label' column.
# No test_size is passed, so scikit-learn's default split proportion applies;
# random_state=1 pins the shuffle so the split is the same on every run.
X_train, X_test, y_train, y_test = train_test_split(
    df['value'], df['label'], random_state=1
)

print('Number of rows in the total set: {}'.format(len(df)))
print('Number of rows in the training set: {}'.format(len(X_train)))
print('Number of rows in the test set: {}'.format(len(X_test)))

Number of rows in the total set: 180740
Number of rows in the training set: 135555
Number of rows in the test set: 45185


In [28]:
# Create a CountVectorizer (a class, configured here with its default settings)
from sklearn.feature_extraction.text import CountVectorizer
count_vector = CountVectorizer()

# Learn the vocabulary from the training text and return its document-term matrix
training_data = count_vector.fit_transform(X_train)

# Encode the test text with the vocabulary learned above. The vectorizer is
# deliberately NOT re-fitted here: only transform() is called on the test set.
testing_data = count_vector.transform(X_test)

In [29]:
from sklearn.naive_bayes import MultinomialNB

# Multinomial Naive Bayes with default hyper-parameters, trained on the
# training document-term matrix and its labels
naive_bayes = MultinomialNB()
naive_bayes.fit(X=training_data, y=y_train)

MultinomialNB(alpha=1.0, class_prior=None, fit_prior=True)

In [30]:
# Predict a label for every row of the held-out test matrix
predictions = naive_bayes.predict(testing_data)

In [31]:

from sklearn.metrics import (accuracy_score, classification_report, confusion_matrix,
                             f1_score, precision_score, recall_score)

# Headline metrics on the held-out test set. precision/recall/F1 are called with
# their defaults, which for binary targets report the positive class (label 1).
# print() already converts each score to text, so no explicit format() is needed.
print('Accuracy score: ', accuracy_score(y_test, predictions))
print('Precision score: ', precision_score(y_test, predictions))
print('Recall score: ', recall_score(y_test, predictions))
print('F1 score: ', f1_score(y_test, predictions))

# Confusion matrix (rows: true labels, columns: predicted labels), then the per-class report
print(confusion_matrix(y_test, predictions))
print(classification_report(y_test, predictions))


Accuracy score:  0.9743277636383756
Precision score:  0.9929864253393665
Recall score:  0.9702204256931725
F1 score:  0.9814714244641088
[[13302   217]
 [  943 30723]]
              precision    recall  f1-score   support

           0       0.93      0.98      0.96     13519
           1       0.99      0.97      0.98     31666

    accuracy                           0.97     45185
   macro avg       0.96      0.98      0.97     45185
weighted avg       0.98      0.97      0.97     45185



In [32]:
# Classify one hand-written example with the fitted vectorizer and model
name = 'Ram Kumar'
names = count_vector.transform([name])
value = naive_bayes.predict(names)

# A prediction of 0 is reported as "address"; anything else as "name"
print("address" if value[0] == 0 else "name")

name


In [139]:
# Hand-written street addresses used to spot-check the trained classifier on new input.
# NOTE(review): these are US-style addresses, while the training rows previewed by
# df.head() look like Indian addresses -- presumably an out-of-distribution check; confirm.
address_list = [
  "Brockton Avenue",
  "30 Memorial Drive, Avon MA 2322",
  "250 Hartford Avenue, Bellingham MA 2019",
  "700 Oak Street, Brockton MA 2301",
  "66-4 Parkhurst Rd, Chelmsford MA 1824",
  "591 Memorial Dr, Chicopee MA 1020",
  "55 Brooksby Village Way, Danvers MA 1923",
  "137 Teaticket Hwy, East Falmouth MA 2536",
  "42 Fairhaven Commons Way, Fairhaven MA 2719",
  "374 William S Canning Blvd, Fall River MA 2721",
  "121 Worcester Rd, Framingham MA 1701",
  "677 Timpany Blvd, Gardner MA 1440",
  "337 Russell St, Hadley MA 1035",
  "295 Plymouth Street, Halifax MA 2338",
  "1775 Washington St, Hanover MA 2339",
  "280 Washington Street, Hudson MA 1749",
  "20 Soojian Dr, Leicester MA 1524",
  "11 Jungle Road, Leominster MA 1453",
  "301 Massachusetts Ave, Lunenburg MA 1462",
  "780 Lynnway, Lynn MA 1905",
  "70 Pleasant Valley Street, Methuen MA 1844",
  "830 Curran Memorial Hwy, North Adams MA 1247",
  "1470 S Washington St, North Attleboro MA 2760",
  "506 State Road, North Dartmouth MA 2747",
  "742 Main Street, North Oxford MA 1537",
  "72 Main St, North Reading MA 1864",
  "200 Otis Street, Northborough MA 1532",
  "180 North King Street, Northhampton MA 1060",
  "555 East Main St, Orange MA 1364",
  "555 Hubbard Ave-Suite 12, Pittsfield MA 1201",
  "300 Colony Place, Plymouth MA 2360",
  "301 Falls Blvd, Quincy MA 2169",
  "36 Paramount Drive, Raynham MA 2767",
  "450 Highland Ave, Salem MA 1970",
  "1180 Fall River Avenue, Seekonk MA 2771",
  "1105 Boston Road, Springfield MA 1119",
  "100 Charlton Road, Sturbridge MA 1566",
  "262 Swansea Mall Dr, Swansea MA 2777",
  "333 Main Street, Tewksbury MA 1876",
  "550 Providence Hwy, Walpole MA 2081",
  "352 Palmer Road, Ware MA 1082",
  "3005 Cranberry Hwy Rt 6 28, Wareham MA 2538",
  "250 Rt 59, Airmont NY 10901",
  "141 Washington Ave Extension, Albany NY 12205",
  "13858 Rt 31 W, Albion NY 14411",
  "2055 Niagara Falls Blvd, Amherst NY 14228",
  "101 Sanford Farm Shpg Center, Amsterdam NY 12010",
  "297 Grant Avenue, Auburn NY 13021",
  "4133 Veterans Memorial Drive, Batavia NY 14020",
  "6265 Brockport Spencerport Rd, Brockport NY 14420",
  "5399 W Genesse St, Camillus NY 13031",
  "3191 County rd 10, Canandaigua NY 14424",
  "30 Catskill, Catskill NY 12414",
  "161 Centereach Mall, Centereach NY 11720",
  "3018 East Ave, Central Square NY 13036",
  "100 Thruway Plaza, Cheektowaga NY 14225",
  "8064 Brewerton Rd, Cicero NY 13039",
  "5033 Transit Road, Clarence NY 14031",
  "3949 Route 31, Clay NY 13041",
  "139 Merchant Place, Cobleskill NY 12043",
  "85 Crooked Hill Road, Commack NY 11725",
  "872 Route 13, Cortlandville NY 13045",
  "279 Troy Road, East Greenbush NY 12061",
  "2465 Hempstead Turnpike, East Meadow NY 11554",
  "6438 Basile Rowe, East Syracuse NY 13057",
  "25737 US Rt 11, Evans Mills NY 13637",
  "901 Route 110, Farmingdale NY 11735",
  "2400 Route 9, Fishkill NY 12524",
  "10401 Bennett Road, Fredonia NY 14063",
  "1818 State Route 3, Fulton NY 13069",
  "4300 Lakeville Road, Geneseo NY 14454",
  "990 Route 5 20, Geneva NY 14456",
  "311 RT 9W, Glenmont NY 12077",
  "200 Dutch Meadows Ln, Glenville NY 12302",
  "100 Elm Ridge Center Dr, Greece NY 14626",
  "1549 Rt 9, Halfmoon NY 12065",
  "5360 Southwestern Blvd, Hamburg NY 14075",
  "103 North Caroline St, Herkimer NY 13350",
  "1000 State Route 36, Hornell NY 14843",
  "1400 County Rd 64, Horseheads NY 14845",
  "135 Fairgrounds Memorial Pkwy, Ithaca NY 14850",
  "2 Gannett Dr, Johnson City NY 13790",
  "233 5th Ave Ext, Johnstown NY 12095",
  "601 Frank Stottile Blvd, Kingston NY 12401",
  "350 E Fairmount Ave, Lakewood NY 14750",
  "4975 Transit Rd, Lancaster NY 14086",
  "579 Troy-Schenectady Road, Latham NY 12110",
  "5783 So Transit Road, Lockport NY 14094",
  "7155 State Rt 12 S, Lowville NY 13367",
  "425 Route 31, Macedon NY 14502",
  "3222 State Rt 11, Malone NY 12953",
  "200 Sunrise Mall, Massapequa NY 11758",
  "43 Stephenville St, Massena NY 13662",
  "750 Middle Country Road, Middle Island NY 11953",
  "470 Route 211 East, Middletown NY 10940",
  "3133 E Main St, Mohegan Lake NY 10547",
  "288 Larkin, Monroe NY 10950",
  "41 Anawana Lake Road, Monticello NY 12701",
  "4765 Commercial Drive, New Hartford NY 13413",
  "1201 Rt 300, Newburgh NY 12550",
  "255 W Main St, Avon CT 6001",
  "120 Commercial Parkway, Branford CT 6405",
  "1400 Farmington Ave, Bristol CT 6010",
  "161 Berlin Road, Cromwell CT 6416",
  "67 Newton Rd, Danbury CT 6810",
  "656 New Haven Ave, Derby CT 6418",
  "69 Prospect Hill Road, East Windsor CT 6088",
  "150 Gold Star Hwy, Groton CT 6340",
  "900 Boston Post Road, Guilford CT 6437",
  "2300 Dixwell Ave, Hamden CT 6514",
  "495 Flatbush Ave, Hartford CT 6106",
  "180 River Rd, Lisbon CT 6351",
  "420 Buckland Hills Dr, Manchester CT 6040",
  "1365 Boston Post Road, Milford CT 6460",
  "1100 New Haven Road, Naugatuck CT 6770",
  "315 Foxon Blvd, New Haven CT 6513",
  "164 Danbury Rd, New Milford CT 6776",
  "3164 Berlin Turnpike, Newington CT 6111",
  "474 Boston Post Road, North Windham CT 6256",
  "650 Main Ave, Norwalk CT 6851",
  "680 Connecticut Avenue, Norwalk CT 6854",
  "220 Salem Turnpike, Norwich CT 6360",
  "655 Boston Post Rd, Old Saybrook CT 6475",
  "625 School Street, Putnam CT 6260",
  "80 Town Line Rd, Rocky Hill CT 6067",
  "465 Bridgeport Avenue, Shelton CT 6484",
  "235 Queen St, Southington CT 6489",
  "150 Barnum Avenue Cutoff, Stratford CT 6614",
  "970 Torringford Street, Torrington CT 6790",
  "844 No Colony Road, Wallingford CT 6492",
  "910 Wolcott St, Waterbury CT 6705",
  "155 Waterford Parkway No, Waterford CT 6385",
  "515 Sawmill Road, West Haven CT 6516",
  "2473 Hackworth Road, Adamsville AL 35005",
  "630 Coonial Promenade Pkwy, Alabaster AL 35007",
  "2643 Hwy 280 West, Alexander City AL 35010",
  "540 West Bypass, Andalusia AL 36420",
  "5560 Mcclellan Blvd, Anniston AL 36206",
  "1450 No Brindlee Mtn Pkwy, Arab AL 35016",
  "1011 US Hwy 72 East, Athens AL 35611",
  "973 Gilbert Ferry Road Se, Attalla AL 35954",
  "1717 South College Street, Auburn AL 36830",
  "701 Mcmeans Ave, Bay Minette AL 36507",
  "750 Academy Drive, Bessemer AL 35022",
  "312 Palisades Blvd, Birmingham AL 35209",
  "1600 Montclair Rd, Birmingham AL 35210",
  "5919 Trussville Crossings Pkwy, Birmingham AL 35235",
  "9248 Parkway East, Birmingham AL 35206",
  "1972 Hwy 431, Boaz AL 35957",
  "10675 Hwy 5, Brent AL 35034",
  "2041 Douglas Avenue, Brewton AL 36426",
  "5100 Hwy 31, Calera AL 35040",
  "1916 Center Point Rd, Center Point AL 35215",
  "1950 W Main St, Centre AL 35960",
  "16077 Highway 280, Chelsea AL 35043",
  "1415 7Th Street South, Clanton AL 35045",
  "626 Olive Street Sw, Cullman AL 35055",
  "27520 Hwy 98, Daphne AL 36526",
  "2800 Spring Avn SW, Decatur AL 35603",
  "969 Us Hwy 80 West, Demopolis AL 36732",
  "3300 South Oates Street, Dothan AL 36301",
  "4310 Montgomery Hwy, Dothan AL 36303",
  "600 Boll Weevil Circle, Enterprise AL 36330",
  "3176 South Eufaula Avenue, Eufaula AL 36027",
  "7100 Aaron Aronov Drive, Fairfield AL 35064",
  "10040 County Road 48, Fairhope AL 36533",
  "3186 Hwy 171 North, Fayette AL 35555",
  "3100 Hough Rd, Florence AL 35630",
  "2200 South Mckenzie St, Foley AL 36535",
  "2001 Glenn Bldv Sw, Fort Payne AL 35968",
  "340 East Meighan Blvd, Gadsden AL 35903",
  "890 Odum Road, Gardendale AL 35071",
  "1608 W Magnolia Ave, Geneva AL 36340",
  "501 Willow Lane, Greenville AL 36037",
  "170 Fort Morgan Road, Gulf Shores AL 36542",
  "11697 US Hwy 431, Guntersville AL 35976",
  "42417 Hwy 195, Haleyville AL 35565",
  "1706 Military Street South, Hamilton AL 35570",
  "1201 Hwy 31 NW, Hartselle AL 35640",
  "209 Lakeshore Parkway, Homewood AL 35209",
  "2780 John Hawkins Pkwy, Hoover AL 35244",
  "5335 Hwy 280 South, Hoover AL 35242",
  "1007 Red Farmer Drive, Hueytown AL 35023",
  "2900 S Mem PkwyDrake Ave, Huntsville AL 35801",
  "11610 Memorial Pkwy South, Huntsville AL 35803",
  "2200 Sparkman Drive, Huntsville AL 35810",
  "330 Sutton Rd, Huntsville AL 35763",
  "6140A Univ Drive, Huntsville AL 35806",
  "4206 N College Ave, Jackson AL 36545",
  "1625 Pelham South, Jacksonville AL 36265",
  "1801 Hwy 78 East, Jasper AL 35501",
  "8551 Whitfield Ave, Leeds AL 35094",
  "8650 Madison Blvd, Madison AL 35758",
  "145 Kelley Blvd, Millbrook AL 36054",
  "1970 S University Blvd, Mobile AL 36609",
  "6350 Cottage Hill Road, Mobile AL 36609",
  "101 South Beltline Highway, Mobile AL 36606",
  "2500 Dawes Road, Mobile AL 36695",
  "5245 Rangeline Service Rd, Mobile AL 36619",
  "685 Schillinger Rd, Mobile AL 36695",
  "3371 S Alabama Ave, Monroeville AL 36460",
  "10710 Chantilly Pkwy, Montgomery AL 36117",
  "3801 Eastern Blvd, Montgomery AL 36116",
  "6495 Atlanta Hwy, Montgomery AL 36117",
  "851 Ann St, Montgomery AL 36107",
  "15445 Highway 24, Moulton AL 35650",
  "517 West Avalon Ave, Muscle Shoals AL 35661",
  "5710 Mcfarland Blvd, Northport AL 35476",
  "2453 2Nd Avenue East, Oneonta AL 35121  205-625-647",
  "2900 Pepperrell Pkwy, Opelika AL 36801",
  "92 Plaza Lane, Oxford AL 36203",
  "1537 Hwy 231 South, Ozark AL 36360",
  "2181 Pelham Pkwy, Pelham AL 35124",
  "165 Vaughan Ln, Pell City AL 35125",
  "3700 Hwy 280-431 N, Phenix City AL 36867",
  "1903 Cobbs Ford Rd, Prattville AL 36066",
  "4180 Us Hwy 431, Roanoke AL 36274",
  "13675 Hwy 43, Russellville AL 35653",
  "1095 Industrial Pkwy, Saraland AL 36571",
  "24833 Johnt Reidprkw, Scottsboro AL 35768",
  "1501 Hwy 14 East, Selma AL 36703",
  "7855 Moffett Rd, Semmes AL 36575",
  "150 Springville Station Blvd, Springville AL 35146",
  "690 Hwy 78, Sumiton AL 35148",
  "41301 US Hwy 280, Sylacauga AL 35150",
  "214 Haynes Street, Talladega AL 35160",
  "1300 Gilmer Ave, Tallassee AL 36078",
  "34301 Hwy 43, Thomasville AL 36784",
  "1420 Us 231 South, Troy AL 36081",
  "1501 Skyland Blvd E, Tuscaloosa AL 35405",
  "3501 20th Av, Valley AL 36854",
  "1300 Montgomery Highway, Vestavia Hills AL 35216",
  "4538 Us Hwy 231, Wetumpka AL 36092",
  "2575 Us Hwy 43, Winfield AL 35594"
]

In [140]:
# Report how many sample addresses there are, encode them with the already-fitted
# vectorizer (transform only, no re-fitting), then get labels and class probabilities
print(len(address_list))
address = count_vector.transform(address_list)
prediction_value = naive_bayes.predict(address)
# One row of class probabilities per address
# NOTE(review): columns presumably follow naive_bayes.classes_ (0 = address, 1 = name) -- confirm
prob = naive_bayes.predict_proba(address)


234


In [141]:
from prettytable import PrettyTable

# Tabulate every sample address with its predicted class and class probabilities,
# counting how many were classified as an address (label 0).
table = PrettyTable(["Input", "Prediction", "Probability"])
count_name = 0  # not updated in this cell; kept so the name stays defined as before
count_address = 0
# The loop variable is deliberately not called `prob`: reusing that name would
# replace the full probability matrix with its last row, so re-running this cell
# would zip over the floats of a single row instead of one row per address.
for addr, pred, row_prob in zip(address_list, prediction_value, prob):
    if pred == 0:
        count_address = count_address + 1
    table.add_row([addr, "address" if pred == 0 else "name", row_prob])

print("Output of the Classifier")
print("Count of address classified", count_address)
print(table)

Output of the Classifier
Count of address classified 200
+-----------------------------------------------------+------------+---------------------------------+
|                        Input                        | Prediction |           Probability           |
+-----------------------------------------------------+------------+---------------------------------+
|             Brockton Avenue Abington MA             |  address   |     [0.92936933 0.07063067]     |
|           30 Memorial Drive, Avon MA 2322           |  address   | [9.99260216e-01 7.39784309e-04] |
|       250 Hartford Avenue, Bellingham MA 2019       |  address   | [9.99899853e-01 1.00146942e-04] |
|           700 Oak Street, Brockton MA 2301          |  address   |     [0.95835025 0.04164975]     |
|        66-4 Parkhurst Rd, Chelmsford MA 1824        |  address   |     [0.99293222 0.00706778]     |
|          591 Memorial Dr, Chicopee MA 1020          |  address   |     [0.91446134 0.08553866]     |
|       55 Brook

In [158]:
# Surnames used to spot-check the classifier's "name" predictions.
# NOTE(review): despite the variable name, the entries look like common English and
# Spanish surnames rather than Indian names -- confirm the intent before renaming.
indian_names = ['Abbott',
  'Acevedo',
  'Acosta',
  'Adams',
  'Adkins',
  'Aguilar',
  'Aguirre',
  'Albert',
  'Alexander',
  'Alford',
  'Allen',
  'Allison',
  'Alston',
  'Alvarado',
  'Alvarez',
  'Anderson',
  'Andrews',
  'Anthony',
  'Armstrong',
  'Arnold',
  'Ashley',
  'Atkins',
  'Atkinson',
  'Austin',
  'Avery',
  'Avila',
  'Ayala',
  'Ayers',
  'Bailey',
  'Baird',
  'Baker',
  'Baldwin',
  'Ball',
  'Ballard',
  'Banks',
  'Barber',
  'Barker',
  'Barlow',
  'Barnes',
  'Barnett',
  'Barr',
  'Barrera',
  'Barrett',
  'Barron',
  'Barry',
  'Bartlett',
  'Barton',
  'Bass',
  'Bates',
  'Battle',
  'Bauer',
  'Baxter',
  'Beach',
  'Bean',
  'Beard',
  'Beasley',
  'Beck',
  'Becker',
  'Bell',
  'Bender',
  'Benjamin',
  'Bennett',
  'Benson',
  'Bentley',
  'Benton',
  'Berg',
  'Berger',
  'Bernard',
  'Berry',
  'Best',
  'Bird',
  'Bishop',
  'Black',
  'Blackburn',
  'Blackwell',
  'Blair',
  'Blake',
  'Blanchard',
  'Blankenship',
  'Blevins',
  'Bolton',
  'Bond',
  'Bonner',
  'Booker',
  'Boone',
  'Booth',
  'Bowen',
  'Bowers',
  'Bowman',
  'Boyd',
  'Boyer',
  'Boyle',
  'Bradford',
  'Bradley',
  'Bradshaw',
  'Brady',
  'Branch',
  'Bray',
  'Brennan',
  'Brewer',
  'Bridges',
  'Briggs',
  'Bright',
  'Britt',
  'Brock',
  'Brooks',
  'Brown',
  'Browning',
  'Bruce',
  'Bryan',
  'Bryant',
  'Buchanan',
  'Buck',
  'Buckley',
  'Buckner',
  'Bullock',
  'Burch',
  'Burgess',
  'Burke',
  'Burks',
  'Burnett',
  'Burns',
  'Burris',
  'Burt',
  'Burton',
  'Bush',
  'Butler',
  'Byers',
  'Byrd',
  'Cabrera',
  'Cain',
  'Calderon',
  'Caldwell',
  'Calhoun',
  'Callahan',
  'Camacho',
  'Cameron',
  'Campbell',
  'Campos',
  'Cannon',
  'Cantrell',
  'Cantu',
  'Cardenas',
  'Carey',
  'Carlson',
  'Carney',
  'Carpenter',
  'Carr',
  'Carrillo',
  'Carroll',
  'Carson',
  'Carter',
  'Carver',
  'Case',
  'Casey',
  'Cash',
  'Castaneda',
  'Castillo',
  'Castro',
  'Cervantes',
  'Chambers',
  'Chan',
  'Chandler',
  'Chaney',
  'Chang',
  'Chapman',
  'Charles',
  'Chase',
  'Chavez',
  'Chen',
  'Cherry',
  'Christensen',
  'Christian',
  'Church',
  'Clark',
  'Clarke',
  'Clay',
  'Clayton',
  'Clements',
  'Clemons',
  'Cleveland',
  'Cline',
  'Cobb',
  'Cochran',
  'Coffey',
  'Cohen',
  'Cole',
  'Coleman',
  'Collier',
  'Collins',
  'Colon',
  'Combs',
  'Compton',
  'Conley',
  'Conner',
  'Conrad',
  'Contreras',
  'Conway',
  'Cook',
  'Cooke',
  'Cooley',
  'Cooper',
  'Copeland',
  'Cortez',
  'Cote',
  'Cotton',
  'Cox',
  'Craft',
  'Craig',
  'Crane',
  'Crawford',
  'Crosby',
  'Cross',
  'Cruz',
  'Cummings',
  'Cunningham',
  'Curry',
  'Curtis',
  'Dale',
  'Dalton',
  'Daniel',
  'Daniels',
  'Daugherty',
  'Davenport',
  'David',
  'Davidson',
  'Davis',
  'Dawson',
  'Day',
  'Dean',
  'Decker',
  'Dejesus',
  'Delacruz',
  'Delaney',
  'Deleon',
  'Delgado',
  'Dennis',
  'Diaz',
  'Dickerson',
  'Dickson',
  'Dillard',
  'Dillon',
  'Dixon',
  'Dodson',
  'Dominguez',
  'Donaldson',
  'Donovan',
  'Dorsey',
  'Dotson',
  'Douglas',
  'Downs',
  'Doyle',
  'Drake',
  'Dudley',
  'Duffy',
  'Duke',
  'Duncan',
  'Dunlap',
  'Dunn',
  'Duran',
  'Durham',
  'Dyer',
  'Eaton',
  'Edwards',
  'Elliott',
  'Ellis',
  'Ellison',
  'Emerson',
  'England',
  'English',
  'Erickson',
  'Espinoza',
  'Estes',
  'Estrada',
  'Evans',
  'Everett',
  'Ewing',
  'Farley',
  'Farmer',
  'Farrell',
  'Faulkner',
  'Ferguson',
  'Fernandez',
  'Ferrell',
  'Fields',
  'Figueroa',
  'Finch',
  'Finley',
  'Fischer',
  'Fisher',
  'Fitzgerald',
  'Fitzpatrick',
  'Fleming',
  'Fletcher',
  'Flores',
  'Flowers',
  'Floyd',
  'Flynn',
  'Foley',
  'Forbes',
  'Ford',
  'Foreman',
  'Foster',
  'Fowler',
  'Fox',
  'Francis',
  'Franco',
  'Frank',
  'Franklin',
  'Franks',
  'Frazier',
  'Frederick',
  'Freeman',
  'French',
  'Frost',
  'Fry',
  'Frye',
  'Fuentes',
  'Fuller',
  'Fulton',
  'Gaines',
  'Gallagher',
  'Gallegos',
  'Galloway',
  'Gamble',
  'Garcia',
  'Gardner',
  'Garner',
  'Garrett',
  'Garrison',
  'Garza',
  'Gates',
  'Gay',
  'Gentry',
  'George',
  'Gibbs',
  'Gibson',
  'Gilbert',
  'Giles',
  'Gill',
  'Gillespie',
  'Gilliam',
  'Gilmore',
  'Glass',
  'Glenn',
  'Glover',
  'Goff',
  'Golden',
  'Gomez',
  'Gonzales',
  'Gonzalez',
  'Good',
  'Goodman',
  'Goodwin',
  'Gordon',
  'Gould',
  'Graham',
  'Grant',
  'Graves',
  'Gray',
  'Green',
  'Greene',
  'Greer',
  'Gregory',
  'Griffin',
  'Griffith',
  'Grimes',
  'Gross',
  'Guerra',
  'Guerrero',
  'Guthrie',
  'Gutierrez',
  'Guy',
  'Guzman',
  'Hahn',
  'Hale',
  'Haley',
  'Hall',
  'Hamilton',
  'Hammond',
  'Hampton',
  'Hancock',
  'Haney',
  'Hansen',
  'Hanson',
  'Hardin',
  'Harding',
  'Hardy',
  'Harmon',
  'Harper',
  'Harrell',
  'Harrington',
  'Harris',
  'Harrison',
  'Hart',
  'Hartman',
  'Harvey',
  'Hatfield',
  'Hawkins',
  'Hayden',
  'Hayes',
  'Haynes',
  'Hays',
  'Head',
  'Heath',
  'Hebert',
  'Henderson',
  'Hendricks',
  'Hendrix',
  'Henry',
  'Hensley',
  'Henson',
  'Herman',
  'Hernandez',
  'Herrera',
  'Herring',
  'Hess',
  'Hester',
  'Hewitt',
  'Hickman',
  'Hicks',
  'Higgins',
  'Hill',
  'Hines',
  'Hinton',
  'Hobbs',
  'Hodge',
  'Hodges',
  'Hoffman',
  'Hogan',
  'Holcomb',
  'Holden',
  'Holder',
  'Holland',
  'Holloway',
  'Holman',
  'Holmes',
  'Holt',
  'Hood',
  'Hooper',
  'Hoover',
  'Hopkins',
  'Hopper',
  'Horn',
  'Horne',
  'Horton',
  'House',
  'Houston',
  'Howard',
  'Howe',
  'Howell',
  'Hubbard',
  'Huber',
  'Hudson',
  'Huff',
  'Huffman',
  'Hughes',
  'Hull',
  'Humphrey',
  'Hunt',
  'Hunter',
  'Hurley',
  'Hurst',
  'Hutchinson',
  'Hyde',
  'Ingram',
  'Irwin',
  'Jackson',
  'Jacobs',
  'Jacobson',
  'James',
  'Jarvis',
  'Jefferson',
  'Jenkins',
  'Jennings',
  'Jensen',
  'Jimenez',
  'Johns',
  'Johnson',
  'Johnston',
  'Jones',
  'Jordan',
  'Joseph',
  'Joyce',
  'Joyner',
  'Juarez',
  'Justice',
  'Kane',
  'Kaufman',
  'Keith',
  'Keller',
  'Kelley',
  'Kelly',
  'Kemp',
  'Kennedy',
  'Kent',
  'Kerr',
  'Key',
  'Kidd',
  'Kim',
  'King',
  'Kinney',
  'Kirby',
  'Kirk',
  'Kirkland',
  'Klein',
  'Kline',
  'Knapp',
  'Knight',
  'Knowles',
  'Knox',
  'Koch',
  'Kramer',
  'Lamb',
  'Lambert',
  'Lancaster',
  'Landry',
  'Lane',
  'Lang',
  'Langley',
  'Lara',
  'Larsen',
  'Larson',
  'Lawrence',
  'Lawson',
  'Le',
  'Leach',
  'Leblanc',
  'Lee',
  'Leon',
  'Leonard',
  'Lester',
  'Levine',
  'Levy',
  'Lewis',
  'Lindsay',
  'Lindsey',
  'Little',
  'Livingston',
  'Lloyd',
  'Logan',
  'Long',
  'Lopez',
  'Lott',
  'Love',
  'Lowe',
  'Lowery',
  'Lucas',
  'Luna',
  'Lynch',
  'Lynn',
  'Lyons',
  'Macdonald',
  'Macias',
  'Mack',
  'Madden',
  'Maddox',
  'Maldonado',
  'Malone',
  'Mann',
  'Manning',
  'Marks',
  'Marquez',
  'Marsh',
  'Marshall',
  'Martin',
  'Martinez',
  'Mason',
  'Massey',
  'Mathews',
  'Mathis',
  'Matthews',
  'Maxwell',
  'May',
  'Mayer',
  'Maynard',
  'Mayo',
  'Mays',
  'Mcbride',
  'Mccall',
  'Mccarthy',
  'Mccarty',
  'Mcclain',
  'Mcclure',
  'Mcconnell',
  'Mccormick',
  'Mccoy',
  'Mccray',
  'Mccullough',
  'Mcdaniel',
  'Mcdonald',
  'Mcdowell',
  'Mcfadden',
  'Mcfarland',
  'Mcgee',
  'Mcgowan',
  'Mcguire',
  'Mcintosh',
  'Mcintyre',
  'Mckay',
  'Mckee',
  'Mckenzie',
  'Mckinney',
  'Mcknight',
  'Mclaughlin',
  'Mclean',
  'Mcleod',
  'Mcmahon',
  'Mcmillan',
  'Mcneil',
  'Mcpherson',
  'Meadows',
  'Medina',
  'Mejia',
  'Melendez',
  'Melton',
  'Mendez',
  'Mendoza',
  'Mercado',
  'Mercer',
  'Merrill',
  'Merritt',
  'Meyer',
  'Meyers',
  'Michael',
  'Middleton',
  'Miles',
  'Miller',
  'Mills',
  'Miranda',
  'Mitchell',
  'Molina',
  'Monroe',
  'Montgomery',
  'Montoya',
  'Moody',
  'Moon',
  'Mooney',
  'Moore',
  'Morales',
  'Moran',
  'Moreno',
  'Morgan',
  'Morin',
  'Morris',
  'Morrison',
  'Morrow',
  'Morse',
  'Morton',
  'Moses',
  'Mosley',
  'Moss',
  'Mueller',
  'Mullen',
  'Mullins',
  'Munoz',
  'Murphy',
  'Murray',
  'Myers',
  'Nash',
  'Navarro',
  'Neal',
  'Nelson',
  'Newman',
  'Newton',
  'Nguyen',
  'Nichols',
  'Nicholson',
  'Nielsen',
  'Nieves',
  'Nixon',
  'Noble',
  'Noel',
  'Nolan',
  'Norman',
  'Norris',
  'Norton',
  'Nunez',
  'Obrien',
  'Ochoa',
  'Oconnor',
  'Odom',
  'Odonnell',
  'Oliver',
  'Olsen',
  'Olson',
  'Oneal',
  'Oneil',
  'Oneill',
  'Orr',
  'Ortega',
  'Ortiz',
  'Osborn',
  'Osborne',
  'Owen',
  'Owens',
  'Pace',
  'Pacheco',
  'Padilla',
  'Page',
  'Palmer',
  'Park',
  'Parker',
  'Parks',
  'Parrish',
  'Parsons',
  'Pate',
  'Patel',
  'Patrick',
  'Patterson',
  'Patton',
  'Paul',
  'Payne',
  'Pearson',
  'Peck',
  'Pena',
  'Pennington',
  'Perez',
  'Perkins',
  'Perry',
  'Peters',
  'Petersen',
  'Peterson',
  'Petty',
  'Phelps',
  'Phillips',
  'Pickett',
  'Pierce',
  'Pittman',
  'Pitts',
  'Pollard',
  'Poole',
  'Pope',
  'Porter',
  'Potter',
  'Potts',
  'Powell',
  'Powers',
  'Pratt',
  'Preston',
  'Price',
  'Prince',
  'Pruitt',
  'Puckett',
  'Pugh',
  'Quinn',
  'Ramirez',
  'Ramos',
  'Ramsey',
  'Randall',
  'Randolph',
  'Rasmussen',
  'Ratliff',
  'Ray',
  'Raymond',
  'Reed',
  'Reese',
  'Reeves',
  'Reid',
  'Reilly',
  'Reyes',
  'Reynolds',
  'Rhodes',
  'Rice',
  'Rich',
  'Richard',
  'Richards',
  'Richardson',
  'Richmond',
  'Riddle',
  'Riggs',
  'Riley',
  'Rios',
  'Rivas',
  'Rivera',
  'Rivers',
  'Roach',
  'Robbins',
  'Roberson',
  'Roberts',
  'Robertson',
  'Robinson',
  'Robles',
  'Rocha',
  'Rodgers',
  'Rodriguez',
  'Rodriquez',
  'Rogers',
  'Rojas',
  'Rollins',
  'Roman',
  'Romero',
  'Rosa',
  'Rosales',
  'Rosario',
  'Rose',
  'Ross',
  'Roth',
  'Rowe',
  'Rowland',
  'Roy',
  'Ruiz',
  'Rush',
  'Russell',
  'Russo',
  'Rutledge',
  'Ryan',
  'Salas',
  'Salazar',
  'Salinas',
  'Sampson',
  'Sanchez',
  'Sanders',
  'Sandoval',
  'Sanford',
  'Santana',
  'Santiago',
  'Santos',
  'Sargent',
  'Saunders',
  'Savage',
  'Sawyer',
  'Schmidt',
  'Schneider',
  'Schroeder',
  'Schultz',
  'Schwartz',
  'Scott',
  'Sears',
  'Sellers',
  'Serrano',
  'Sexton',
  'Shaffer',
  'Shannon',
  'Sharp',
  'Sharpe',
  'Shaw',
  'Shelton',
  'Shepard',
  'Shepherd',
  'Sheppard',
  'Sherman',
  'Shields',
  'Short',
  'Silva',
  'Simmons',
  'Simon',
  'Simpson',
  'Sims',
  'Singleton',
  'Skinner',
  'Slater',
  'Sloan',
  'Small',
  'Smith',
  'Snider',
  'Snow',
  'Snyder',
  'Solis',
  'Solomon',
  'Sosa',
  'Soto',
  'Sparks',
  'Spears',
  'Spence',
  'Spencer',
  'Stafford',
  'Stanley',
  'Stanton',
  'Stark',
  'Steele',
  'Stein',
  'Stephens',
  'Stephenson',
  'Stevens',
  'Stevenson',
  'Stewart',
  'Stokes',
  'Stone',
  'Stout',
  'Strickland',
  'Strong',
  'Stuart',
  'Suarez',
  'Sullivan',
  'Summers',
  'Sutton',
  'Swanson',
  'Sweeney',
  'Sweet',
  'Sykes',
  'Talley',
  'Tanner',
  'Tate',
  'Taylor',
  'Terrell',
  'Terry',
  'Thomas',
  'Thompson',
  'Thornton',
  'Tillman',
  'Todd',
  'Torres',
  'Townsend',
  'Tran',
  'Travis',
  'Trevino',
  'Trujillo',
  'Tucker',
  'Turner',
  'Tyler',
  'Tyson',
  'Underwood',
  'Valdez',
  'Valencia',
  'Valentine',
  'Valenzuela',
  'Vance',
  'Vang',
  'Vargas',
  'Vasquez',
  'Vaughan',
  'Vaughn',
  'Vazquez',
  'Vega',
  'Velasquez',
  'Velazquez',
  'Velez',
  'Villarreal',
  'Vincent',
  'Vinson',
  'Wade',
  'Wagner',
  'Walker',
  'Wall',
  'Wallace',
  'Waller',
  'Walls',
  'Walsh',
  'Walter',
  'Walters',
  'Walton',
  'Ward',
  'Ware',
  'Warner',
  'Warren',
  'Washington',
  'Waters',
  'Watkins',
  'Watson',
  'Watts',
  'Weaver',
  'Webb',
  'Weber',
  'Webster',
  'Weeks',
  'Weiss',
  'Welch',
  'Wells',
  'West',
  'Wheeler',
  'Whitaker',
  'White',
  'Whitehead',
  'Whitfield',
  'Whitley',
  'Whitney',
  'Wiggins',
  'Wilcox',
  'Wilder',
  'Wiley',
  'Wilkerson',
  'Wilkins',
  'Wilkinson',
  'William',
  'Williams',
  'Williamson',
  'Willis',
  'Wilson',
  'Winters',
  'Wise',
  'Witt',
  'Wolf',
  'Wolfe',
  'Wong',
  'Wood',
  'Woodard',
  'Woods',
  'Woodward',
  'Wooten',
  'Workman',
  'Wright',
  'Wyatt',
  'Wynn',
  'Yang',
  'Yates',
  'York',
  'Young',
  'Zamora',
  'Zimmerman']

In [159]:
# Report how many sample names there are, encode them with the already-fitted
# vectorizer (transform only, no re-fitting), then get labels and class probabilities
print(len(indian_names))
indian_names_list = count_vector.transform(indian_names)
# NOTE: `prediction_value` and `prob` are the same names the address cell assigns,
# so the address results are overwritten here.
prediction_value = naive_bayes.predict(indian_names_list)
prob = naive_bayes.predict_proba(indian_names_list)


1000


In [160]:
from prettytable import PrettyTable

# Tabulate every sample surname with its predicted class and class probabilities,
# counting how many were classified as a name (label 1).
table = PrettyTable(["Input", "Prediction", "Probability"])
count_name = 0
# The loop variables are deliberately not called `name` or `prob`: reusing those
# names would overwrite the notebook-level `name` string and replace the full
# probability matrix with its last row, which breaks a re-run of this cell.
for surname, pred, row_prob in zip(indian_names, prediction_value, prob):
    if pred == 1:
        count_name = count_name + 1
    table.add_row([surname, "address" if pred == 0 else "name", row_prob])

print("Output of the Classifier")
# This cell counts inputs predicted as names, so the label says "names" (it previously said "address")
print("Count of names classified", count_name)
print(table)

Output of the Classifier
Count of address classified 954
+-------------+------------+-------------------------+
|    Input    | Prediction |       Probability       |
+-------------+------------+-------------------------+
|    Abbott   |    name    | [0.29756188 0.70243812] |
|   Acevedo   |    name    | [0.29756188 0.70243812] |
|    Acosta   |    name    | [0.29756188 0.70243812] |
|    Adams    |    name    | [0.32207857 0.67792143] |
|    Adkins   |    name    | [0.29756188 0.70243812] |
|   Aguilar   |    name    | [0.29756188 0.70243812] |
|   Aguirre   |    name    | [0.29756188 0.70243812] |
|    Albert   |    name    | [0.11951838 0.88048162] |
|  Alexander  |    name    | [0.02320366 0.97679634] |
|    Alford   |    name    | [0.29756188 0.70243812] |
|    Allen    |    name    | [0.10616466 0.89383534] |
|   Allison   |    name    | [0.29756188 0.70243812] |
|    Alston   |    name    | [0.29756188 0.70243812] |
|   Alvarado  |    name    | [0.29756188 0.70243812] |
|   Alva