# Header Manipulation

## Import pandas

In [1]:
import pandas as pd
import numpy as np

## Load Data

In [2]:
df = pd.read_csv("company.csv")
df.head()

Unnamed: 0,Index,Organization Id,Name,Website,Country,Description,Founded,Industry,Number of employees
0,1,8cC6B5992C0309c,Acevedo LLC,https://www.donovan.com/,Holy See (Vatican City State),Multi-channeled bottom-line core,2019,Graphic Design / Web Design,7070
1,2,ec094061FeaF7Bc,Walls-Mcdonald,http://arias-willis.net/,Lithuania,Compatible encompassing groupware,2005,Utilities,8156
2,3,DAcC5dbc58946A7,Gregory PLC,http://www.lynch-hoover.net/,Tokelau,Multi-channeled intangible help-desk,2019,Leisure / Travel,6121
3,4,8Dd7beDa37FbeD0,"Byrd, Patterson and Knox",https://www.james-velez.net/,Netherlands,Pre-emptive national function,1982,Furniture,3494
4,5,a3b5c54AEC163e4,Mcdowell-Hopkins,http://fuentes.com/,Mayotte,Cloned bifurcated solution,2016,Online Publishing,36


In [3]:
df.isna().any()

Index                  False
Organization Id        False
Name                   False
Website                False
Country                False
Description            False
Founded                False
Industry               False
Number of employees    False
dtype: bool

In [4]:
df_copy = df.copy()
df_copy.loc[2, "Name"] = np.nan
df_copy.isna().any()

Index                  False
Organization Id        False
Name                    True
Website                False
Country                False
Description            False
Founded                False
Industry               False
Number of employees    False
dtype: bool

## Get NA values

In [5]:
df_copy[df_copy.isna().any(axis=1)]

Unnamed: 0,Index,Organization Id,Name,Website,Country,Description,Founded,Industry,Number of employees
2,3,DAcC5dbc58946A7,,http://www.lynch-hoover.net/,Tokelau,Multi-channeled intangible help-desk,2019,Leisure / Travel,6121


In [6]:
df_copy.isnull().any()

Index                  False
Organization Id        False
Name                    True
Website                False
Country                False
Description            False
Founded                False
Industry               False
Number of employees    False
dtype: bool

In [7]:
df_copy.dropna(axis=1).shape

(100000, 8)

In [8]:
df_copy.dropna(axis=0).shape

(99999, 9)

In [9]:
df_copy.shape

(100000, 9)

In [10]:
df_groupby = df.rename(columns={"Number of employees":"EmployeeCount", "Organization Id":"id"})

In [11]:
df_groupby.groupby("Country").count()

Unnamed: 0_level_0,Index,id,Name,Website,Description,Founded,Industry,EmployeeCount
Country,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
Afghanistan,401,401,401,401,401,401,401,401
Albania,417,417,417,417,417,417,417,417
Algeria,418,418,418,418,418,418,418,418
American Samoa,389,389,389,389,389,389,389,389
Andorra,417,417,417,417,417,417,417,417
...,...,...,...,...,...,...,...,...
Wallis and Futuna,388,388,388,388,388,388,388,388
Western Sahara,428,428,428,428,428,428,428,428
Yemen,409,409,409,409,409,409,409,409
Zambia,396,396,396,396,396,396,396,396


In [12]:
df_groupby.groupby("Country").min()

Unnamed: 0_level_0,Index,id,Name,Website,Description,Founded,Industry,EmployeeCount
Country,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
Afghanistan,353,00aA041edCdb59A,"Acosta, Dominguez and Soto",http://archer.com/,Adaptive 4thgeneration pricing structure,1970,Accounting,34
Albania,171,02995eB8aA7A196,Acosta PLC,http://arias.com/,Adaptive asymmetric utilization,1970,Accounting,1
Algeria,13,0134EBde9d8bED7,Adams PLC,http://alvarado.biz/,Adaptive 24/7 complexity,1970,Accounting,39
American Samoa,462,01b492ce397Df1C,Adams-Bean,http://andersen.com/,Adaptive context-sensitive superstructure,1970,Accounting,8
Andorra,49,01dAE2d0673E381,Acevedo LLC,http://andrade-moses.org/,Adaptive executive array,1970,Alternative Dispute Resolution,6
...,...,...,...,...,...,...,...,...
Wallis and Futuna,480,002BEFF8Cb9A84D,"Acosta, Hurst and Horton",http://acevedo.com/,Adaptive eco-centric forecast,1970,Accounting,70
Western Sahara,9,00b122A8f9241D0,"Acevedo, Brooks and Pineda",http://archer.com/,Adaptive bi-directional infrastructure,1970,Accounting,1
Yemen,321,012077Ffbf40BF5,"Acosta, Williamson and Boone",http://austin-henry.biz/,Adaptive 6thgeneration application,1970,Airlines / Aviation,17
Zambia,649,01390f5Cfb0f7F0,Abbott PLC,http://aguilar-jordan.com/,Adaptive eco-centric middleware,1970,Accounting,25


In [13]:
df_groupby.groupby("Country").max()

Unnamed: 0_level_0,Index,id,Name,Website,Description,Founded,Industry,EmployeeCount
Country,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
Afghanistan,99694,fdCFf3eE3Bf4115,Zuniga PLC,https://www.zamora-walker.biz/,Visionary web-enabled extranet,2022,Writing / Editing,9997
Albania,99763,ffA490CFD572c83,Zuniga-Fleming,https://zamora.com/,Visionary web-enabled help-desk,2022,Writing / Editing,9910
Algeria,99806,ffCEed3dd95Dda4,"Zamora, Wilkins and Rocha",https://www.zavala.net/,Visionary zero administration attitude,2022,Writing / Editing,9972
American Samoa,99900,fe13e3C6CC735CE,Zhang and Sons,https://www.zuniga.com/,Vision-oriented scalable policy,2022,Writing / Editing,9994
Andorra,99863,ff840CA95b71CbA,"Zuniga, Glover and Gonzales",https://yoder.com/,Visionary optimal utilization,2022,Writing / Editing,9997
...,...,...,...,...,...,...,...,...
Wallis and Futuna,99624,fff1d3BA1eCcf9A,Wu-Gaines,https://yu.com/,Visionary value-added functionalities,2022,Writing / Editing,9963
Western Sahara,99545,ff955fB8FCC06Ac,"Zimmerman, Bradshaw and Carpenter",https://www.wright.com/,Visionary tertiary open architecture,2021,Writing / Editing,9951
Yemen,99935,ff0405E19ad1a9C,Zimmerman Inc,https://zavala.org/,Visionary value-added customer loyalty,2022,Writing / Editing,9983
Zambia,99303,ffF48eAaFE55844,Zhang Group,https://zavala.com/,Visionary radical info-mediaries,2022,Writing / Editing,9914


In [14]:
df_groupby.groupby("Country").sum()

Unnamed: 0_level_0,Index,id,Name,Website,Description,Founded,Industry,EmployeeCount
Country,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
Afghanistan,20304948,Fcb6e0ba8aE250C19C8Cff8B0FCc0F2aBdAfc139fAF651...,"Ramos, Dorsey and LynchGray-YoderLee, Kemp and...",http://fernandez.net/http://lamb.org/https://p...,Realigned 24/7 pricing structureUser-centric n...,800399,Military IndustryLaw EnforcementManagement Con...,2083677
Albania,20584065,4351f4c9755DbA6a5B5EDaBE0BAfD9f6588cCE67DAB35f...,"Dominguez and SonsChen, Buck and TerryButler G...",https://mcpherson.com/http://mccoy.net/http://...,Digitized multimedia intranetGrass-roots analy...,831765,Biotechnology / GreentechBusiness Supplies / E...,2197512
Algeria,21244996,1F861fAbeDdCFea28959dbe3BB2FEF78cf9bE1Bb3938F9...,"Arias, Jackson and HesterWebb, Browning and Co...",https://hardin-thompson.com/https://www.strick...,Switchable maximized synergyOptimized bifurcat...,834289,UtilitiesConsumer ElectronicsInternational Tra...,2035454
American Samoa,19650292,Ad4DBe0FdFE82fb5a37136A4EdAbD8cae3A7DFDEDfbF2D...,"Decker, Meyers and FieldsKennedy GroupMartin, ...",https://small.biz/http://www.gill.com/http://w...,Decentralized eco-centric contingencyTotal sol...,775779,PhotographyGambling / CasinosGovernment Admini...,1872544
Andorra,20589295,a5D7abBe4994b43CCaA31E5DeFC4dB1eb076BBFca058E8...,"Ray IncCook IncValentine-ValdezGibson, Key and...",https://www.lowe.com/https://www.cline.com/htt...,Polarized cohesive solutionProactive non-volat...,832163,Program DevelopmentHuman Resources / HRPerform...,2127618
...,...,...,...,...,...,...,...,...
Wallis and Futuna,18824417,730f2ADA27c0Eff8e1c0BFFebEf7Af5EfFEda2138c0CdC...,"Campos, Wong and GordonGuerrero LLCDunlap LLCL...",http://powers-anderson.com/http://www.zamora.c...,Front-line composite moderatorStreamlined 24/7...,774388,Computer HardwareInformation Technology / ITPa...,1978857
Western Sahara,21742075,Cfa1a44106faD4BC6F5Fe2fa151f1Bcb0B580B0BFFaE4A...,"Lucas, Galloway and BenjaminYang-RileyOwen, Fi...",http://silva.info/https://arellano-beasley.com...,Persevering leadingedge abilityCloned bottom-l...,853926,Retail IndustryBusiness Supplies / EquipmentNa...,2068407
Yemen,20987894,A3E4802e2Baf1A69F78589F9d1b98312E57E3c9b4DA61a...,"Bryan, Moses and AlvaradoYu, Gallagher and Jac...",https://www.gibbs.com/http://www.peterson.com/...,Re-contextualized solution-oriented frameRe-en...,816109,VeterinaryMental Health CarePhilanthropyLaw Pr...,1983819
Zambia,20212121,8BCD4297F0eEF378C0359bc571d31253B263c6BBB1c30B...,"Morris, Foster and SchwartzMejia PLCSteele, Di...",http://colon.com/https://mcgee.com/https://lut...,Business-focused responsive orchestrationFace-...,790286,UtilitiesMotion Pictures / FilmComputer Softwa...,1954218


In [15]:
df_groupby.groupby("Country").agg({"EmployeeCount": ["sum", "count"]})

Unnamed: 0_level_0,EmployeeCount,EmployeeCount
Unnamed: 0_level_1,sum,count
Country,Unnamed: 1_level_2,Unnamed: 2_level_2
Afghanistan,2083677,401
Albania,2197512,417
Algeria,2035454,418
American Samoa,1872544,389
Andorra,2127618,417
...,...,...
Wallis and Futuna,1978857,388
Western Sahara,2068407,428
Yemen,1983819,409
Zambia,1954218,396


In [16]:
df_groupby.groupby("Country").describe()

Unnamed: 0_level_0,Index,Index,Index,Index,Index,Index,Index,Index,Founded,Founded,Founded,Founded,Founded,EmployeeCount,EmployeeCount,EmployeeCount,EmployeeCount,EmployeeCount,EmployeeCount,EmployeeCount,EmployeeCount
Unnamed: 0_level_1,count,mean,std,min,25%,50%,75%,max,count,mean,...,75%,max,count,mean,std,min,25%,50%,75%,max
Country,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2,Unnamed: 11_level_2,Unnamed: 12_level_2,Unnamed: 13_level_2,Unnamed: 14_level_2,Unnamed: 15_level_2,Unnamed: 16_level_2,Unnamed: 17_level_2,Unnamed: 18_level_2,Unnamed: 19_level_2,Unnamed: 20_level_2,Unnamed: 21_level_2
Afghanistan,401.0,50635.780549,28638.569991,353.0,25213.00,48009.0,77539.00,99694.0,401.0,1996.007481,...,2010.00,2022.0,401.0,5196.201995,2901.168523,34.0,2788.0,5073.0,7719.00,9997.0
Albania,417.0,49362.266187,28946.988771,171.0,25419.00,49767.0,73520.00,99763.0,417.0,1994.640288,...,2007.00,2022.0,417.0,5269.812950,2863.537936,1.0,3027.0,5288.0,7716.00,9910.0
Algeria,418.0,50825.349282,29226.730116,13.0,24941.25,51762.5,74490.50,99806.0,418.0,1995.906699,...,2009.75,2022.0,418.0,4869.507177,2854.660193,39.0,2432.0,4627.0,7166.25,9972.0
American Samoa,389.0,50514.889460,28382.093492,462.0,26979.00,48440.0,74786.00,99900.0,389.0,1994.290488,...,2007.00,2022.0,389.0,4813.737789,2944.660284,8.0,2231.0,4606.0,7212.00,9994.0
Andorra,417.0,49374.808153,27911.555339,49.0,25481.00,46554.0,74216.00,99863.0,417.0,1995.594724,...,2009.00,2022.0,417.0,5102.201439,2943.472803,6.0,2631.0,5212.0,7743.00,9997.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
Wallis and Futuna,388.0,48516.538660,28717.928734,480.0,24407.25,46832.5,72892.50,99624.0,388.0,1995.845361,...,2010.00,2022.0,388.0,5100.146907,2907.600852,70.0,2573.0,5022.0,7532.00,9963.0
Western Sahara,428.0,50799.240654,29353.495051,9.0,23501.75,53202.0,75408.00,99545.0,428.0,1995.154206,...,2008.00,2021.0,428.0,4832.726636,2875.388593,1.0,2391.0,4727.0,7269.00,9951.0
Yemen,409.0,51315.144254,29785.394468,321.0,25228.00,50974.0,77612.00,99935.0,409.0,1995.376528,...,2009.00,2022.0,409.0,4850.413203,3019.456932,17.0,2105.0,4670.0,7595.00,9983.0
Zambia,396.0,51040.709596,28456.932636,649.0,26752.00,51695.5,75850.25,99303.0,396.0,1995.671717,...,2008.00,2022.0,396.0,4934.893939,2813.835878,25.0,2548.5,5061.0,7416.00,9914.0


In [17]:
df.groupby("Country").groups

{'Afghanistan': [352, 439, 453, 991, 1002, 1185, 1568, 1962, 2314, 3002, 3240, 3299, 3364, 3764, 4229, 4387, 4411, 5616, 5651, 5814, 5850, 5914, 6575, 7355, 7838, 7986, 9335, 9390, 9760, 9781, 10043, 10260, 11088, 11544, 11600, 11724, 11896, 12186, 12416, 12502, 12891, 13152, 13737, 13796, 14035, 14234, 14583, 14959, 14964, 14983, 15127, 15764, 15781, 16248, 16374, 16501, 16637, 16840, 16922, 16927, 17106, 17194, 17262, 17621, 17859, 17900, 18063, 18282, 18312, 18532, 18730, 18752, 18866, 19690, 19733, 20140, 20218, 20228, 20664, 21395, 21497, 21800, 22183, 22204, 22242, 22444, 22464, 22586, 22612, 22651, 22791, 22957, 22993, 23019, 24009, 24231, 24501, 24661, 24987, 25019, ...], 'Albania': [170, 665, 927, 1052, 1260, 1482, 1562, 2372, 2488, 2499, 2527, 2643, 2694, 3217, 3326, 3434, 3457, 3655, 3694, 3857, 4241, 4481, 4612, 5409, 5766, 5900, 6169, 6264, 6313, 6633, 6906, 7279, 8013, 8380, 8495, 8866, 8942, 9144, 9211, 9459, 9649, 9661, 9790, 10140, 10256, 10522, 10858, 10891, 10918, 11

In [18]:
df_group = df.groupby("Country")

In [19]:
df_group.get_group('Afghanistan')

Unnamed: 0,Index,Organization Id,Name,Website,Country,Description,Founded,Industry,Number of employees
352,353,Fcb6e0ba8aE250C,"Ramos, Dorsey and Lynch",http://fernandez.net/,Afghanistan,Realigned 24/7 pricing structure,1989,Military Industry,9857
439,440,19C8Cff8B0FCc0F,Gray-Yoder,http://lamb.org/,Afghanistan,User-centric next generation capacity,2009,Law Enforcement,8116
453,454,2aBdAfc139fAF65,"Lee, Kemp and Levy",https://peters.info/,Afghanistan,Triple-buffered directional access,2005,Management Consulting,4201
991,992,1BcDf04EFC39c1d,Moyer and Sons,https://mccall-hayden.com/,Afghanistan,Re-engineered value-added hierarchy,2020,Printing,8236
1002,1003,3Af7d84cdE9c9E7,"Castro, Franco and Harding",https://www.hendrix.com/,Afghanistan,Visionary eco-centric data-warehouse,2002,Professional Training,4469
...,...,...,...,...,...,...,...,...,...
98736,98737,03c5Ff4c3ACf9c5,Briggs and Sons,http://rivers-blankenship.biz/,Afghanistan,Proactive didactic challenge,1991,Airlines / Aviation,5486
99081,99082,eeee23C566Be37A,Vaughan-Nguyen,http://www.vincent-hendrix.com/,Afghanistan,Customizable maximized groupware,2003,Glass / Ceramics / Concrete,1923
99152,99153,DB70cc5d22b1De8,Bullock-Sellers,https://www.harvey.com/,Afghanistan,Face-to-face motivating Graphical User Interface,1994,Banking / Mortgage,3059
99520,99521,E841a5cC95C76CA,Schneider Group,https://www.park.info/,Afghanistan,Universal logistical customer loyalty,2015,Market Research,8761
