# Análisis estadístico básico de los grupos
En este notebook, se verá un análisis general para los grupos creados, esto con la intención de entender a grandes rasgos la composición de cada grupo

In [1]:
import sys
sys.path.insert(0, './scripts/')

In [2]:
from collections import defaultdict
import gc
import IDTMex
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import seaborn as sns
import scipy.stats as st


In [3]:
# Run a full garbage-collection pass; the echoed value is what gc.collect() returns.
gc.collect()

0

In [4]:
# Remove the cap on displayed columns so wide tables are rendered in full.
pd.set_option('display.max_columns', None)

### Lectura de Datos

In [5]:
# Root folder of the data sets and the ENDUTIH 2020 sub-folder.
# Both keep their trailing slash because file names are appended directly.
base_path = "./ConjuntosDatos/"
endutih_path = f"{base_path}ENDUTIH2020/conjuntos_de_datos/"

In [6]:
# Read the four grouped ENDUTIH tables (household, resident, user, user2).
endutih_vivhogar = pd.read_csv(f"{endutih_path}viv_hog_agrupados.csv")
endutih_res = pd.read_csv(f"{endutih_path}residente_agrupados.csv")
endutih_usr = pd.read_csv(f"{endutih_path}usuario_agrupados.csv", low_memory=False)
endutih_usr2 = pd.read_csv(f"{endutih_path}usuario2_agrupados.csv", low_memory=False)

# Household + resident table joined on the household key.
# These resident columns are dropped before the join
# (presumably because the household table already carries them; verify against the CSVs).
columnas_repetidas = ["UPM_DIS", "ESTRATO", "ENT", "DOMINIO", "EST_DIS", "TLOC", "Grupo"]
endutih_completa = endutih_vivhogar.merge(
    endutih_res.drop(columns=columnas_repetidas),
    on=["UPM", "VIV_SEL", "HOGAR"],
)

In [7]:
# State catalogue: numeric code (Codigo), full name (Nombre) and abbreviation (ENT).
estados = pd.read_csv(f"{base_path}CodigoEdos.csv")
estados

Unnamed: 0,Codigo,Nombre,ENT
0,1,Aguascalientes,Ags.
1,2,Baja California,B.C.
2,3,Baja California Sur,B.C.S
3,4,Campeche,Camp.
4,5,Coahuila de Zaragoza,Coah.
5,6,Colima,Col.
6,7,Chiapas,Chis.
7,8,Chihuahua,Chih.
8,9,Ciudad de México,C.D.Mx
9,10,Durango,Dgo.


# Todos los grupos

## Combinaciones

In [8]:
# FAC_HOG totals for every state / domain / group combination.
dist_all = (
    endutih_vivhogar
    .groupby(["ENT", "DOMINIO", "Grupo"], as_index=False)["FAC_HOG"]
    .sum()
    .rename(columns={"FAC_HOG": "Total"})
)

# Relabel codes by exact match. regex=True is intentionally not used: it would
# treat each key as a pattern and rewrite any value that merely contains it
# (for example code "1" inside "10" if ENT were ever read as text).
dist_all["ENT"] = dist_all["ENT"].replace(dict(zip(estados["Codigo"], estados["ENT"])))
dist_all["DOMINIO"] = dist_all["DOMINIO"].replace({"R": "Rural", "U": "Urbano"})

# Share of each combination over the grand total, in percent.
dist_all["perc"] = dist_all["Total"] / dist_all["Total"].sum() * 100
dist_all

Unnamed: 0,ENT,DOMINIO,Grupo,Total,perc
0,Ags.,Rural,20,86605,0.242699
1,Ags.,Rural,21,507,0.001421
2,Ags.,Rural,22,473,0.001326
3,Ags.,Rural,23,272,0.000762
4,Ags.,Urbano,20,113614,0.318389
...,...,...,...,...,...
515,Zac.,Urbano,32,149,0.000418
516,Zac.,Urbano,33,80273,0.224955
517,Zac.,Urbano,34,384,0.001076
518,Zac.,Urbano,42,31107,0.087173


## Distribución

In [10]:
# FAC_HOG total per (ESTRATO, Grupo); the keys stay as ordinary columns.
dist_grupos = (
    endutih_vivhogar
    .groupby(["ESTRATO", "Grupo"], as_index=False)["FAC_HOG"]
    .sum()
)
dist_grupos

Unnamed: 0,ESTRATO,Grupo,FAC_HOG
0,1,11,6984839
1,2,20,17295201
2,2,21,108498
3,2,22,110877
4,2,23,92468
5,3,30,138234
6,3,31,81353
7,3,32,104798
8,3,33,7106718
9,3,34,43151


In [11]:
# Number of distinct groups.
dist_grupos["Grupo"].nunique()

15

Relativos al total de hogares

In [9]:
# dist_grupos keeps ESTRATO and Grupo as ordinary columns, so dividing the
# whole frame would rescale the keys as well. Move the keys to the index first
# so that only FAC_HOG is turned into a percentage of the national total.
dist_grupos.set_index(["ESTRATO", "Grupo"]) / dist_grupos["FAC_HOG"].sum() * 100

Unnamed: 0_level_0,Unnamed: 1_level_0,FAC_HOG
ESTRATO,Grupo,Unnamed: 2_level_1
1,11,19.57412
2,20,48.467593
2,21,0.304052
2,22,0.310719
2,23,0.25913
3,30,0.387383
3,31,0.227981
3,32,0.293683
3,33,19.91567
3,34,0.120925


## Concentración en estados

In [10]:
# FAC_HOG totals per (ESTRATO, Grupo) row and per state column.
# Columns are renamed by state code instead of overwriting them positionally:
# a positional overwrite fails if any state is absent from the data and
# mislabels silently if `estados` is not sorted by code.
grupo_estados = (
    endutih_vivhogar
    .pivot_table(
        index=["ESTRATO", "Grupo"],
        columns="ENT",
        values="FAC_HOG",
        aggfunc="sum",
        fill_value=0,
    )
    .rename(columns=dict(zip(estados["Codigo"], estados["ENT"])))
)
grupo_estados

Unnamed: 0_level_0,ENT,Ags.,B.C.,B.C.S,Camp.,Coah.,Col.,Chis.,Chih.,C.D.Mx,Dgo.,Gto.,Gro.,Hgo.,Jal.,Edo. Méx.,Mich.,Mor.,Nay.,N.L.,Oax.,Pue.,Qro.,Q. Roo.,S.L.P,Sin.,Son.,Tab.,Tamps.,Tlax.,Ver.,Yuc.,Zac.
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1
1,11,0,52722,40490,94288,36088,6864,829585,85504,4040,67991,244784,571453,221026,90597,589821,294591,68508,37842,137973,679375,575579,260256,100184,248857,101965,75450,219350,112459,23378,845979,203493,64347
2,20,200219,507326,111115,116090,400247,137829,464702,478467,1089994,284133,918089,323185,537452,1146740,2608220,811481,371788,249027,625256,414561,816830,225819,329122,284375,434953,371567,393644,596687,283910,1214597,278163,269613
2,21,1519,4220,846,1099,1979,572,2155,0,11364,265,7161,1917,2819,7753,28016,6156,2935,834,926,1151,843,2803,2116,379,978,899,1518,1721,463,11153,1277,661
2,22,2593,2880,1160,1355,1994,1319,3528,626,3704,670,12024,2474,2361,5509,13199,5496,3714,767,3429,2029,5337,2703,3168,1292,2551,1875,2095,4646,738,12936,1104,1601
2,23,1420,1709,684,1789,3652,1373,2577,0,908,238,9479,1125,2225,5185,2385,18619,2069,1075,0,2006,0,1593,1500,1256,4930,412,4792,4945,535,10675,2115,1197
3,30,2227,7336,2127,513,6509,393,785,1650,32531,0,9714,454,0,16543,14126,2586,2686,809,9802,1842,0,1273,1183,1183,4546,3061,898,7086,180,2554,2808,829
3,31,2643,3634,674,515,1848,673,2034,1705,12437,802,3978,1180,409,7568,9700,3511,1685,730,5068,0,1083,1458,1713,1306,3426,1411,0,1839,200,7114,796,213
3,32,769,5485,105,245,537,212,0,1053,41001,0,4820,0,853,13531,4978,1401,2179,302,5453,461,3306,2321,564,388,2934,2077,508,2953,0,4321,1892,149
3,33,122136,334985,54272,21061,347796,35622,55827,398314,1193378,101901,274208,53578,41641,733640,719961,181981,73897,64788,516119,40322,225656,84143,50571,186746,197707,279650,41421,249446,22267,232900,90511,80273
3,34,909,1279,680,399,1891,335,0,525,6117,203,5216,0,0,9146,0,2187,825,326,752,518,0,680,546,836,3417,843,365,1004,400,1520,1848,384


### Relativo al grupo

In [11]:
# Percentage of each group's total that falls in each state (rows sum to 100).
grupo_estados_rel_grupo = grupo_estados.div(grupo_estados.sum(axis=1), axis=0).mul(100)
grupo_estados_rel_grupo.style.format(precision=4)

Unnamed: 0_level_0,ENT,Ags.,B.C.,B.C.S,Camp.,Coah.,Col.,Chis.,Chih.,C.D.Mx,Dgo.,Gto.,Gro.,Hgo.,Jal.,Edo. Méx.,Mich.,Mor.,Nay.,N.L.,Oax.,Pue.,Qro.,Q. Roo.,S.L.P,Sin.,Son.,Tab.,Tamps.,Tlax.,Ver.,Yuc.,Zac.
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1
1,11,0.0,0.7548,0.5797,1.3499,0.5167,0.0983,11.8769,1.2241,0.0578,0.9734,3.5045,8.1813,3.1644,1.2971,8.4443,4.2176,0.9808,0.5418,1.9753,9.7264,8.2404,3.726,1.4343,3.5628,1.4598,1.0802,3.1404,1.61,0.3347,12.1116,2.9134,0.9212
2,20,1.1577,2.9333,0.6425,0.6712,2.3142,0.7969,2.6869,2.7665,6.3023,1.6428,5.3083,1.8686,3.1075,6.6304,15.0806,4.6919,2.1497,1.4399,3.6152,2.397,4.7229,1.3057,1.903,1.6442,2.5149,2.1484,2.276,3.45,1.6416,7.0227,1.6083,1.5589
2,21,1.4,3.8895,0.7797,1.0129,1.824,0.5272,1.9862,0.0,10.4739,0.2442,6.6001,1.7669,2.5982,7.1458,25.8217,5.6738,2.7051,0.7687,0.8535,1.0608,0.777,2.5835,1.9503,0.3493,0.9014,0.8286,1.3991,1.5862,0.4267,10.2795,1.177,0.6092
2,22,2.3386,2.5975,1.0462,1.2221,1.7984,1.1896,3.1819,0.5646,3.3406,0.6043,10.8444,2.2313,2.1294,4.9686,11.9042,4.9568,3.3497,0.6918,3.0926,1.83,4.8134,2.4378,2.8572,1.1653,2.3007,1.6911,1.8895,4.1902,0.6656,11.667,0.9957,1.4439
2,23,1.5357,1.8482,0.7397,1.9347,3.9495,1.4848,2.7869,0.0,0.982,0.2574,10.2511,1.2166,2.4062,5.6073,2.5793,20.1356,2.2375,1.1626,0.0,2.1694,0.0,1.7228,1.6222,1.3583,5.3316,0.4456,5.1823,5.3478,0.5786,11.5445,2.2873,1.2945
3,30,1.611,5.3069,1.5387,0.3711,4.7087,0.2843,0.5679,1.1936,23.5333,0.0,7.0272,0.3284,0.0,11.9674,10.2189,1.8707,1.9431,0.5852,7.0909,1.3325,0.0,0.9209,0.8558,0.8558,3.2886,2.2144,0.6496,5.1261,0.1302,1.8476,2.0313,0.5997
3,31,3.2488,4.467,0.8285,0.633,2.2716,0.8273,2.5002,2.0958,15.2877,0.9858,4.8898,1.4505,0.5027,9.3027,11.9233,4.3158,2.0712,0.8973,6.2296,0.0,1.3312,1.7922,2.1056,1.6053,4.2113,1.7344,0.0,2.2605,0.2458,8.7446,0.9785,0.2618
3,32,0.7338,5.2339,0.1002,0.2338,0.5124,0.2023,0.0,1.0048,39.1238,0.0,4.5993,0.0,0.8139,12.9115,4.7501,1.3369,2.0792,0.2882,5.2033,0.4399,3.1546,2.2147,0.5382,0.3702,2.7997,1.9819,0.4847,2.8178,0.0,4.1232,1.8054,0.1422
3,33,1.7186,4.7136,0.7637,0.2964,4.8939,0.5012,0.7856,5.6048,16.7923,1.4339,3.8584,0.7539,0.5859,10.3232,10.1307,2.5607,1.0398,0.9116,7.2624,0.5674,3.1752,1.184,0.7116,2.6277,2.782,3.935,0.5828,3.51,0.3133,3.2772,1.2736,1.1295
3,34,2.1066,2.964,1.5759,0.9247,4.3823,0.7763,0.0,1.2167,14.1758,0.4704,12.0878,0.0,0.0,21.1953,0.0,5.0682,1.9119,0.7555,1.7427,1.2004,0.0,1.5759,1.2653,1.9374,7.9187,1.9536,0.8459,2.3267,0.927,3.5225,4.2826,0.8899


De forma general, parece que hay una buena distribución de los grupos en los estados

### Relativo a la Entidad

In [12]:
# Percentage of each state's total that falls in each group (columns sum to 100).
grupo_estados_rel_ent = grupo_estados.div(grupo_estados.sum(axis=0), axis=1).mul(100)
grupo_estados_rel_ent.style.format(precision=4)

Unnamed: 0_level_0,ENT,Ags.,B.C.,B.C.S,Camp.,Coah.,Col.,Chis.,Chih.,C.D.Mx,Dgo.,Gto.,Gro.,Hgo.,Jal.,Edo. Méx.,Mich.,Mor.,Nay.,N.L.,Oax.,Pue.,Qro.,Q. Roo.,S.L.P,Sin.,Son.,Tab.,Tamps.,Tlax.,Ver.,Yuc.,Zac.
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1
1,11,0.0,4.7443,16.2675,36.9132,3.9855,2.9969,59.9927,7.5614,0.1389,13.4485,15.2251,59.6996,26.0753,3.8634,12.7904,21.5521,12.3287,10.0952,8.3565,59.1376,33.0746,39.2867,17.467,30.9252,11.778,8.8626,32.0845,10.2383,6.7223,35.0068,30.8538,14.2705
2,20,52.0355,45.6533,44.6422,45.4485,44.2029,60.1771,33.6056,42.3122,37.4733,56.2009,57.1035,33.7631,63.4053,48.9018,56.5598,59.3676,66.9071,66.4336,37.8694,36.0863,46.9376,34.0883,57.3822,35.339,50.2414,43.6453,57.5787,54.3225,81.6375,50.2603,42.1753,59.7932
2,21,0.3948,0.3797,0.3399,0.4303,0.2186,0.2497,0.1558,0.0,0.3907,0.0524,0.4454,0.2003,0.3326,0.3306,0.6075,0.4504,0.5282,0.2225,0.0561,0.1002,0.0484,0.4231,0.3689,0.0471,0.113,0.1056,0.222,0.1567,0.1331,0.4615,0.1936,0.1466
2,22,0.6739,0.2592,0.466,0.5305,0.2202,0.5759,0.2551,0.0554,0.1273,0.1325,0.7479,0.2585,0.2785,0.2349,0.2862,0.4021,0.6684,0.2046,0.2077,0.1766,0.3067,0.408,0.5523,0.1606,0.2947,0.2202,0.3064,0.423,0.2122,0.5353,0.1674,0.3551
2,23,0.369,0.1538,0.2748,0.7004,0.4033,0.5995,0.1864,0.0,0.0312,0.0471,0.5896,0.1175,0.2625,0.2211,0.0517,1.3622,0.3723,0.2868,0.0,0.1746,0.0,0.2405,0.2615,0.1561,0.5695,0.0484,0.7009,0.4502,0.1538,0.4417,0.3207,0.2655
3,30,0.5788,0.6602,0.8546,0.2008,0.7188,0.1716,0.0568,0.1459,1.1184,0.0,0.6042,0.0474,0.0,0.7055,0.3063,0.1892,0.4834,0.2158,0.5937,0.1603,0.0,0.1922,0.2063,0.147,0.5251,0.3596,0.1314,0.6451,0.0518,0.1057,0.4258,0.1839
3,31,0.6869,0.327,0.2708,0.2016,0.2041,0.2938,0.1471,0.1508,0.4276,0.1586,0.2474,0.1233,0.0483,0.3227,0.2103,0.2569,0.3032,0.1947,0.3069,0.0,0.0622,0.2201,0.2987,0.1623,0.3957,0.1657,0.0,0.1674,0.0575,0.2944,0.1207,0.0472
3,32,0.1999,0.4936,0.0422,0.0959,0.0593,0.0926,0.0,0.0931,1.4096,0.0,0.2998,0.0,0.1006,0.577,0.1079,0.1025,0.3921,0.0806,0.3303,0.0401,0.19,0.3504,0.0983,0.0482,0.3389,0.244,0.0743,0.2688,0.0,0.1788,0.2869,0.033
3,33,31.7423,30.1446,21.8047,8.2452,38.4103,15.5528,4.0372,35.2241,41.0276,20.1558,17.0553,5.5973,4.9126,31.2855,15.6125,13.3136,13.2985,17.2837,31.2594,3.5099,12.9669,12.7017,8.817,23.2068,22.8371,32.8485,6.0587,22.7096,6.4028,9.6375,13.7234,17.8025
3,34,0.2362,0.1151,0.2732,0.1562,0.2088,0.1463,0.0,0.0464,0.2103,0.0402,0.3244,0.0,0.0,0.39,0.0,0.16,0.1485,0.087,0.0455,0.0451,0.0,0.1026,0.0952,0.1039,0.3947,0.099,0.0534,0.0914,0.115,0.0629,0.2802,0.0852


In [13]:
# Largest group share within each state (one value per column).
# DataFrame.max() is used instead of np.amax(): the NumPy call on a DataFrame
# triggers a warning and, depending on the pandas version, reduces over both
# axes and returns a single scalar instead of this per-state Series.
grupo_estados_rel_ent.max()

  return reduction(axis=axis, out=out, **passkwargs)


ENT
Ags.         52.035481
B.C.         45.653264
B.C.S        44.642247
Camp.        45.448495
Coah.        44.202890
Col.         60.177088
Chis.        59.992653
Chih.        42.312219
C.D.Mx       41.027628
Dgo.         56.200860
Gto.         57.103503
Gro.         59.699607
Hgo.         63.405317
Jal.         48.901847
Edo. Méx.    56.559761
Mich.        59.367565
Mor.         66.907094
Nay.         66.433596
N.L.         37.869424
Oax.         59.137642
Pue.         46.937617
Qro.         39.286652
Q. Roo.      57.382214
S.L.P        35.339037
Sin.         50.241358
Son.         43.645319
Tab.         57.578661
Tamps.       54.322547
Tlax.        81.637524
Ver.         50.260302
Yuc.         42.175304
Zac.         59.793218
dtype: float64

La mayoría se encuentra en el grupo 20, que es donde está casi la mitad de los hogares mexicanos

## Internet

In [14]:
# FAC_HOG totals per group, split by the answer to P4_4.
grupo_internet = endutih_vivhogar.pivot_table(
    index=["ESTRATO", "Grupo"],
    columns="P4_4",
    values="FAC_HOG",
    aggfunc="sum",
    fill_value=0,
)
# Labels are assigned positionally, in the sorted order of the P4_4 codes.
grupo_internet.columns = pd.Index(["Sí", "No"], name="Internet en el hogar")
grupo_internet

Unnamed: 0_level_0,Internet en el hogar,Sí,No
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1
1,11,1767283,5217556
2,20,10168088,7127113
2,21,108134,364
2,22,110877,0
2,23,47795,44673
3,30,125409,12825
3,31,59912,21441
3,32,104798,0
3,33,5561698,1545020
3,34,43151,0


### Relativo al grupo

In [15]:
# Row-wise percentages: split of each group between the two answers.
grupo_internet_rel_grupo = grupo_internet.div(grupo_internet.sum(axis=1), axis=0).mul(100)
grupo_internet_rel_grupo.style.format(precision=4)

Unnamed: 0_level_0,Internet en el hogar,Sí,No
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1
1,11,25.3017,74.6983
2,20,58.7914,41.2086
2,21,99.6645,0.3355
2,22,100.0,0.0
2,23,51.6882,48.3118
3,30,90.7223,9.2777
3,31,73.6445,26.3555
3,32,100.0,0.0
3,33,78.2597,21.7403
3,34,100.0,0.0


Hay variaciones dentro de los grupos, sin embargo, destaca el hecho de que hay grupos donde todos los hogares tienen Internet

### Relativo a la Disponibilidad de internet

In [16]:
# Column-wise percentages: how each answer is distributed across the groups.
grupo_internet_rel_int = grupo_internet.div(grupo_internet.sum(axis=0), axis=1).mul(100)
grupo_internet_rel_int.style.format(precision=4)

Unnamed: 0_level_0,Internet en el hogar,Sí,No
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1
1,11,8.2626,36.4986
2,20,47.5392,49.8566
2,21,0.5056,0.0025
2,22,0.5184,0.0
2,23,0.2235,0.3125
3,30,0.5863,0.0897
3,31,0.2801,0.15
3,32,0.49,0.0
3,33,26.0028,10.808
3,34,0.2017,0.0


### Internet Detalles

In [17]:
# Only households with P4_4 == 1 are kept, then split by the answer to P4_5.
hogares_con_internet = endutih_vivhogar.loc[endutih_vivhogar["P4_4"].eq(1)]
grupo_internet_tipo = hogares_con_internet.pivot_table(
    index=["ESTRATO", "Grupo"],
    columns="P4_5",
    values="FAC_HOG",
    aggfunc="sum",
    fill_value=0,
)
# Labels are assigned positionally, in the sorted order of the P4_5 codes.
grupo_internet_tipo.columns = pd.Index(
    ["Fija", "Móvil", "Ambas", "No sabe"], name="Tipo de Internet en el hogar"
)
grupo_internet_tipo

Unnamed: 0_level_0,Tipo de Internet en el hogar,Fija,Móvil,Ambas,No sabe
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
1,11,1129636,415595,214295,7757
2,20,6785857,768901,2576932,36398
2,21,76096,750,27372,3916
2,22,84507,0,23244,3126
2,23,36662,3387,5906,1840
3,30,78400,4079,42930,0
3,31,42975,452,14191,2294
3,32,56224,0,48574,0
3,33,3290073,187424,2076314,7887
3,34,26185,0,15539,1427


#### Relativo al grupo

In [18]:
# Row-wise percentages: connection-type mix inside each group.
grupo_internet_tipo_rel_grupo = grupo_internet_tipo.div(
    grupo_internet_tipo.sum(axis=1), axis=0
).mul(100)
grupo_internet_tipo_rel_grupo.style.format(precision=4)

Unnamed: 0_level_0,Tipo de Internet en el hogar,Fija,Móvil,Ambas,No sabe
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
1,11,63.9194,23.516,12.1257,0.4389
2,20,66.7368,7.5619,25.3433,0.358
2,21,70.3719,0.6936,25.313,3.6214
2,22,76.2169,0.0,20.9638,2.8193
2,23,76.7068,7.0865,12.3569,3.8498
3,30,62.5154,3.2526,34.232,0.0
3,31,71.7302,0.7544,23.6864,3.8289
3,32,53.6499,0.0,46.3501,0.0
3,33,59.1559,3.3699,37.3324,0.1418
3,34,60.6823,0.0,36.0108,3.307


De los hogares que tienen internet, en su mayoría lo tienen de forma fija

#### Relativo al tipo de Internet

In [19]:
# Column-wise percentages: how each connection type is spread over the groups.
grupo_internet_tipo_rel_tipo = grupo_internet_tipo.div(
    grupo_internet_tipo.sum(axis=0), axis=1
).mul(100)
grupo_internet_tipo_rel_tipo.style.format(precision=4)

Unnamed: 0_level_0,Tipo de Internet en el hogar,Fija,Móvil,Ambas,No sabe
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
1,11,8.3346,28.9254,3.3884,10.4693
2,20,50.0669,53.5155,40.7459,49.1247
2,21,0.5614,0.0522,0.4328,5.2852
2,22,0.6235,0.0,0.3675,4.219
2,23,0.2705,0.2357,0.0934,2.4834
3,30,0.5784,0.2839,0.6788,0.0
3,31,0.3171,0.0315,0.2244,3.0961
3,32,0.4148,0.0,0.768,0.0
3,33,24.2746,13.0447,32.8302,10.6447
3,34,0.1932,0.0,0.2457,1.926


## Electricidad

In [20]:
# FAC_HOG totals per group, split by the answer to P1_4.
grupo_electricidad = endutih_vivhogar.pivot_table(
    index=["ESTRATO", "Grupo"],
    columns="P1_4",
    values="FAC_HOG",
    aggfunc="sum",
    fill_value=0,
)
# Labels are assigned positionally, in the sorted order of the P1_4 codes.
grupo_electricidad.columns = pd.Index(["Sí", "No"], name="Electricidad")
grupo_electricidad

Unnamed: 0_level_0,Electricidad,Sí,No
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1
1,11,6870009,114830
2,20,17249295,45906
2,21,108498,0
2,22,110877,0
2,23,92468,0
3,30,138234,0
3,31,81353,0
3,32,104798,0
3,33,7092239,14479
3,34,43151,0


### Relativo al grupo

In [21]:
# Row-wise percentages: split of each group between the two answers.
grupo_electricidad_rel_grupo = grupo_electricidad.div(
    grupo_electricidad.sum(axis=1), axis=0
).mul(100)
grupo_electricidad_rel_grupo.style.format(precision=4)

Unnamed: 0_level_0,Electricidad,Sí,No
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1
1,11,98.356,1.644
2,20,99.7346,0.2654
2,21,100.0,0.0
2,22,100.0,0.0
2,23,100.0,0.0
3,30,100.0,0.0
3,31,100.0,0.0
3,32,100.0,0.0
3,33,99.7963,0.2037
3,34,100.0,0.0


Como la mayoría de los hogares tienen electricidad, no consideraremos este factor como una limitante

## Computadora

In [22]:
# Boolean flag: True when at least one of P4_2_1, P4_2_2, P4_2_3 equals 1.
endutih_vivhogar["COMPU"] = (
    endutih_vivhogar[["P4_2_1", "P4_2_2", "P4_2_3"]].eq(1).any(axis="columns")
)

In [23]:
# FAC_HOG totals per group, split by the boolean COMPU flag.
grupo_compu = endutih_vivhogar.pivot_table(
    index=["ESTRATO", "Grupo"],
    columns="COMPU",
    values="FAC_HOG",
    aggfunc="sum",
    fill_value=0,
)
# Positional labels: False sorts before True, hence "No" comes first.
grupo_compu.columns = pd.Index(["No", "Sí"], name="Computadora en el hogar")
grupo_compu

Unnamed: 0_level_0,Computadora en el hogar,No,Sí
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1
1,11,5874989,1109850
2,20,10410499,6884702
2,21,28615,79883
2,22,48555,62322
2,23,54205,38263
3,30,41005,97229
3,31,36945,44408
3,32,22979,81819
3,33,2825919,4280799
3,34,16688,26463


### Relativo al grupo

In [24]:
# Row-wise percentages: households without / with a computer inside each group.
grupo_compu_rel_grupo = grupo_compu.div(grupo_compu.sum(axis=1), axis=0).mul(100)
grupo_compu_rel_grupo.style.format(precision=4)

Unnamed: 0_level_0,Computadora en el hogar,No,Sí
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1
1,11,84.1106,15.8894
2,20,60.193,39.807
2,21,26.3738,73.6262
2,22,43.7918,56.2082
2,23,58.6203,41.3797
3,30,29.6635,70.3365
3,31,45.4132,54.5868
3,32,21.9269,78.0731
3,33,39.7641,60.2359
3,34,38.6735,61.3265


Vemos que en su mayoría no cuentan con un equipo de cómputo

### Detalles

In [25]:
# FAC_HOG total per group for households flagged COMPU whose P4_2_1 equals 1.
filtro_ordenador = endutih_vivhogar["COMPU"] & endutih_vivhogar["P4_2_1"].eq(1)
grupo_compu_tipo = (
    endutih_vivhogar.loc[filtro_ordenador]
    .groupby(["ESTRATO", "Grupo"])["FAC_HOG"]
    .sum()
    .to_frame("Ordenador")
)
grupo_compu_tipo

Unnamed: 0_level_0,Unnamed: 1_level_0,Ordenador
ESTRATO,Grupo,Unnamed: 2_level_1
1,11,198187
2,20,2082084
2,21,36247
2,22,17407
2,23,8069
3,30,47775
3,31,13896
3,32,34766
3,33,1480728
3,34,8115


In [26]:
# Add one column per remaining device question, built like "Ordenador":
# FAC_HOG summed over households flagged COMPU that answered 1.
for etiqueta, pregunta in (("Laptop", "P4_2_2"), ("Tablet", "P4_2_3")):
    filtro_equipo = endutih_vivhogar["COMPU"] & endutih_vivhogar[pregunta].eq(1)
    grupo_compu_tipo[etiqueta] = (
        endutih_vivhogar.loc[filtro_equipo]
        .groupby(["ESTRATO", "Grupo"])["FAC_HOG"]
        .sum()
    )
grupo_compu_tipo

Unnamed: 0_level_0,Unnamed: 1_level_0,Ordenador,Laptop,Tablet
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
1,11,198187,785620,353407
2,20,2082084,4828180,2437367
2,21,36247,45183,26237
2,22,17407,36152,21112
2,23,8069,24177,13594
3,30,47775,65313,39595
3,31,13896,31700,19362
3,32,34766,65720,32345
3,33,1480728,3282566,1621163
3,34,8115,19804,12515


In [27]:
# Fraction (not percentage) of computer-owning households in each group that
# report each device type. A household can report several, so rows may exceed 1.
# The division is aligned on the (ESTRATO, Grupo) index rather than on a
# hand-built 15x3 array, so it keeps working if the number of groups or device
# columns changes and can never pair a group with another group's denominator.
grupo_compu_tipo_rel_grupo = grupo_compu_tipo.div(grupo_compu["Sí"], axis=0)
grupo_compu_tipo_rel_grupo

Unnamed: 0_level_0,Unnamed: 1_level_0,Ordenador,Laptop,Tablet
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
1,11,0.178571,0.707861,0.318428
2,20,0.302422,0.701291,0.354027
2,21,0.453751,0.565615,0.328443
2,22,0.279307,0.580084,0.338757
2,23,0.210883,0.631864,0.355278
3,30,0.491366,0.671744,0.407234
3,31,0.312917,0.713835,0.436003
3,32,0.424914,0.803236,0.395324
3,33,0.3459,0.766812,0.378706
3,34,0.306655,0.748366,0.472924


Las laptops son claramente dominantes en comparación con las otras opciones

## Número de integrantes Promedio*
*Mayores de 15 años

In [28]:
# Count of non-null FAC_HOGAR rows (one row per listed resident) per household,
# indexed by (ESTRATO, Grupo, UPM, VIV_SEL, HOGAR).
integrantes = (
    endutih_res
    .groupby(["ESTRATO", "Grupo", "UPM", "VIV_SEL", "HOGAR"])["FAC_HOGAR"]
    .count()
    .to_frame("Total")
)

In [29]:
# Weighted resident count per household (residents x FAC_HOG).
# The counts are matched to households by key, not by row position:
# `integrantes` is sorted by its groupby keys (ESTRATO, Grupo, UPM, VIV_SEL,
# HOGAR), which is not guaranteed to be the row order of endutih_vivhogar, so a
# positional product can pair a household with another household's count.
claves_hogar = ["UPM", "VIV_SEL", "HOGAR"]
residentes_por_hogar = integrantes["Total"].groupby(level=claves_hogar).sum()
indice_hogares = pd.MultiIndex.from_frame(endutih_vivhogar[claves_hogar])
endutih_vivhogar["Integrantes_total"] = (
    # Households with no resident rows get a count of 0.
    residentes_por_hogar.reindex(indice_hogares, fill_value=0).to_numpy()
    * endutih_vivhogar["FAC_HOG"].to_numpy()
)

In [30]:
# Weighted average number of residents per household in each group:
# sum(residents x FAC_HOG) / sum(FAC_HOG).
# The denominator is computed with the same (ESTRATO, Grupo) index as the
# numerator. dist_grupos.FAC_HOG cannot be used here because dist_grupos keeps
# the keys as columns, so its index does not align with the grouped frame.
hogares_por_grupo = endutih_vivhogar.groupby(["ESTRATO", "Grupo"])["FAC_HOG"].sum()
grupo_integrantes = (
    endutih_vivhogar
    .groupby(["ESTRATO", "Grupo"])[["Integrantes_total"]]
    .sum()
    .div(hogares_por_grupo, axis=0)
)
grupo_integrantes

Unnamed: 0_level_0,Unnamed: 1_level_0,Integrantes_total
ESTRATO,Grupo,Unnamed: 2_level_1
1,11,3.834178
2,20,3.620158
2,21,3.956064
2,22,3.444718
2,23,3.413505
3,30,3.27324
3,31,3.294421
3,32,3.222666
3,33,3.293917
3,34,3.578411


De forma general, parece que se tomaron 3 residentes por hogar

## Línea telefónica

In [31]:
# FAC_HOG totals per group, split by the answer to P5_5.
grupo_tel = endutih_vivhogar.pivot_table(
    index=["ESTRATO", "Grupo"],
    columns="P5_5",
    values="FAC_HOG",
    aggfunc="sum",
    fill_value=0,
)
# Labels are assigned positionally, in the sorted order of the P5_5 codes.
grupo_tel.columns = pd.Index(["Sí", "No"], name="Línea telefónica en el hogar")
grupo_tel

Unnamed: 0_level_0,Línea telefónica en el hogar,Sí,No
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1
1,11,705474,6279365
2,20,5940495,11354706
2,21,105090,3408
2,22,3415,107462
2,23,18818,73650
3,30,114319,23915
3,31,43488,37865
3,32,101976,2822
3,33,4158208,2948510
3,34,795,42356


### Relativo al grupo

In [32]:
# Row-wise percentages: split of each group between the two answers.
grupo_tel_rel_grupo = grupo_tel.div(grupo_tel.sum(axis=1), axis=0).mul(100)
grupo_tel_rel_grupo.style.format(precision=4)

Unnamed: 0_level_0,Línea telefónica en el hogar,Sí,No
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1
1,11,10.1001,89.8999
2,20,34.3476,65.6524
2,21,96.8589,3.1411
2,22,3.08,96.92
2,23,20.3508,79.6492
3,30,82.6996,17.3004
3,31,53.4559,46.5441
3,32,97.3072,2.6928
3,33,58.5109,41.4891
3,34,1.8424,98.1576


Llama la atención cómo la línea telefónica no es tan usada como el Internet

## Actividad Laboral

In [33]:
# FAC_HOGAR totals from the resident table per group, split by the answer to P3_10.
grupo_trabajo = endutih_res.pivot_table(
    index=["ESTRATO", "Grupo"],
    columns="P3_10",
    values="FAC_HOGAR",
    aggfunc="sum",
    fill_value=0,
)
# Labels are assigned positionally, in the sorted order of the P3_10 codes.
grupo_trabajo.columns = pd.Index(
    [
        "Trabajó",
        "No fue al trabajo",
        "Buscó trabajo",
        "Está jubilado",
        "Se dedicó a estudiar",
        "Quehaceres del hogar",
        "Limitación para trabajar",
        "No trabajó",
    ],
    name="Actividad laboral",
)
grupo_trabajo

Unnamed: 0_level_0,Actividad laboral,Trabajó,No fue al trabajo,Buscó trabajo,Está jubilado,Se dedicó a estudiar,Quehaceres del hogar,Limitación para trabajar,No trabajó
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
1,11,9525436,215513,295312,133837,2471815,6314638,385096,1265210
2,20,25754175,700073,1034490,1511948,7281888,10710202,813520,2743109
2,21,185196,2063,11385,24360,56621,75116,3484,14111
2,22,182042,4515,2772,3774,56983,69991,3299,22769
2,23,118521,3454,6027,8836,42554,62293,8023,12073
3,30,219058,7646,1556,33219,60321,65070,5656,20641
3,31,102179,3954,3452,17669,27470,39400,1229,14633
3,32,161331,2683,1247,30508,46862,60851,4862,16870
3,33,10457646,287738,431892,1412323,2899165,3242856,219067,965542
3,34,66138,2324,2826,9713,16935,24025,326,9265


### Relativo al grupo

In [34]:
# Row-wise percentages: activity mix inside each group.
grupo_trabajo_rel_grupo = grupo_trabajo.div(grupo_trabajo.sum(axis=1), axis=0).mul(100)
grupo_trabajo_rel_grupo.style.format(precision=4)

Unnamed: 0_level_0,Actividad laboral,Trabajó,No fue al trabajo,Buscó trabajo,Está jubilado,Se dedicó a estudiar,Quehaceres del hogar,Limitación para trabajar,No trabajó
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
1,11,46.2246,1.0458,1.4331,0.6495,11.9951,30.6434,1.8688,6.1398
2,20,50.9485,1.3849,2.0465,2.991,14.4055,21.1876,1.6094,5.4266
2,21,49.7389,0.5541,3.0577,6.5425,15.207,20.1743,0.9357,3.7899
2,22,52.5913,1.3044,0.8008,1.0903,16.4622,20.2201,0.9531,6.5779
2,23,45.2749,1.3194,2.3023,3.3753,16.2556,23.7958,3.0648,4.6119
3,30,53.0192,1.8506,0.3766,8.0401,14.5997,15.7491,1.3689,4.9958
3,31,48.6599,1.883,1.6439,8.4144,13.0818,18.7632,0.5853,6.9686
3,32,49.6076,0.825,0.3834,9.3809,14.4096,18.7111,1.495,5.1874
3,33,52.5082,1.4447,2.1685,7.0913,14.5568,16.2825,1.0999,4.848
3,34,50.2752,1.7666,2.1482,7.3834,12.8732,18.2627,0.2478,7.0428


De manera general, podemos ver que la mayoría de los integrantes de los grupos son población económicamente activa; sin embargo, llama la atención que en el grupo 11 haya un alto porcentaje de residentes que se dedican a los quehaceres del hogar

## EDUCACIÓN

In [35]:
# FAC_HOGAR totals from the resident table per group, split by NIVEL.
grupo_edu = endutih_res.pivot_table(
    index=["ESTRATO", "Grupo"],
    columns=["NIVEL"],
    values="FAC_HOGAR",
    aggfunc="sum",
    fill_value=0,
)
# Labels are assigned positionally, in the sorted order of the NIVEL codes.
grupo_edu.columns = pd.Index(
    [
        "Ninguno",
        "Preescolar",
        "Primaria",
        "Secundaria",
        "Normal básica",
        "Estudio técnico",
        "Preparatoria",
        "Estudio técnico superior",
        "Licenciatura o ingeniería",
        "Especialidad",
        "Maestría",
        "Doctorado",
        "No sabe",
    ],
    name="Nivel Educativo",
)
grupo_edu

Unnamed: 0_level_0,Nivel Educativo,Ninguno,Preescolar,Primaria,Secundaria,Normal básica,Estudio técnico,Preparatoria,Estudio técnico superior,Licenciatura o ingeniería,Especialidad,Maestría,Doctorado,No sabe
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1
1,11,2328351,555378,10344537,6600272,8154,51324,3072305,73902,987122,5582,22756,2323,67653
2,20,2316109,928185,17869900,16862237,59624,569721,10637604,732938,6680481,49808,297437,41919,277423
2,21,10221,1590,85454,101620,300,4681,100593,2737,76376,0,7217,0,8547
2,22,6149,9369,101749,120734,0,3876,79380,2466,48998,0,2464,283,11172
2,23,15785,5526,82985,74972,0,3401,52727,618,42766,0,3304,1064,7355
3,30,5767,6838,75262,83698,1116,19658,83810,7724,129959,800,10859,3733,15422
3,31,6579,0,44995,48468,426,1999,31191,4737,67996,397,6503,0,6926
3,32,8222,4279,46359,57706,1863,3624,77996,12764,108482,1477,8028,904,8074
3,33,354243,270736,4586229,5072811,51231,473072,4727311,534272,5205682,51670,376964,69993,123639
3,34,3123,1290,31860,41553,0,287,23861,1063,33240,158,2066,478,1250


### Relativo al grupo

In [36]:
# Row-wise percentages: education-level mix inside each group.
grupo_edu_rel_grupo = grupo_edu.div(grupo_edu.sum(axis=1), axis=0).mul(100)
grupo_edu_rel_grupo.style.format(precision=4)

Unnamed: 0_level_0,Nivel Educativo,Ninguno,Preescolar,Primaria,Secundaria,Normal básica,Estudio técnico,Preparatoria,Estudio técnico superior,Licenciatura o ingeniería,Especialidad,Maestría,Doctorado,No sabe
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1
1,11,9.6533,2.3026,42.8884,27.3647,0.0338,0.2128,12.7378,0.3064,4.0926,0.0231,0.0943,0.0096,0.2805
2,20,4.0404,1.6192,31.1738,29.416,0.104,0.9939,18.5572,1.2786,11.654,0.0869,0.5189,0.0731,0.484
2,21,2.5595,0.3982,21.399,25.4472,0.0751,1.1722,25.1901,0.6854,19.1257,0.0,1.8073,0.0,2.1403
2,22,1.5904,2.4232,26.3162,31.2265,0.0,1.0025,20.5307,0.6378,12.6728,0.0,0.6373,0.0732,2.8895
2,23,5.4337,1.9022,28.566,25.8077,0.0,1.1707,18.1502,0.2127,14.7214,0.0,1.1373,0.3663,2.5318
3,30,1.297,1.5379,16.9263,18.8235,0.251,4.421,18.8487,1.7371,29.2275,0.1799,2.4422,0.8395,3.4684
3,31,2.9875,0.0,20.4321,22.0092,0.1934,0.9077,14.1638,2.1511,30.8768,0.1803,2.953,0.0,3.1451
3,32,2.4198,1.2594,13.6439,16.9834,0.5483,1.0666,22.955,3.7566,31.9273,0.4347,2.3627,0.2661,2.3763
3,33,1.6177,1.2364,20.9437,23.1658,0.234,2.1604,21.588,2.4398,23.7726,0.236,1.7215,0.3196,0.5646
3,34,2.2271,0.9199,22.72,29.6322,0.0,0.2047,17.0157,0.758,23.7041,0.1127,1.4733,0.3409,0.8914


## Celular

In [37]:
# FAC_HOG totals per group, split by the answer to P4_1_6.
grupo_cel = endutih_vivhogar.pivot_table(
    index=["ESTRATO", "Grupo"],
    columns="P4_1_6",
    values="FAC_HOG",
    aggfunc="sum",
    fill_value=0,
)
# Labels are assigned positionally, in the sorted order of the P4_1_6 codes.
grupo_cel.columns = pd.Index(["Sí", "No"], name="Celular en el hogar")
grupo_cel

Unnamed: 0_level_0,Celular en el hogar,Sí,No
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1
1,11,5672484,1312355
2,20,16103426,1191775
2,21,103537,4961
2,22,108007,2870
2,23,83789,8679
3,30,133743,4491
3,31,67281,14072
3,32,103209,1589
3,33,6798418,308300
3,34,42420,731


### Relativo al grupo

In [38]:
# Row-wise percentages: split of each group between the two answers.
grupo_cel_rel_grupo = grupo_cel.div(grupo_cel.sum(axis=1), axis=0).mul(100)
grupo_cel_rel_grupo.style.format(precision=4)

Unnamed: 0_level_0,Celular en el hogar,Sí,No
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1
1,11,81.2114,18.7886
2,20,93.1092,6.8908
2,21,95.4276,4.5724
2,22,97.4115,2.5885
2,23,90.6141,9.3859
3,30,96.7512,3.2488
3,31,82.7025,17.2975
3,32,98.4837,1.5163
3,33,95.6619,4.3381
3,34,98.3059,1.6941


### Detalles

In [39]:
# Weight the per-household values of P4_1_6_1 and P4_1_6_2 by FAC_HOG.
# NOTE(review): presumably these are device counts per household; confirm in the codebook.
endutih_vivhogar["Movil"] = endutih_vivhogar["FAC_HOG"].mul(endutih_vivhogar["P4_1_6_1"])
endutih_vivhogar["Smartphone"] = endutih_vivhogar["FAC_HOG"].mul(endutih_vivhogar["P4_1_6_2"])

In [40]:
# Restrict to households with P4_1_6 == 1 and build, per group:
#   Total      - sum of FAC_HOG
#   Móvil      - sum of the weighted "Movil" column where P4_1_6_1 > 0
#   Smartphone - sum of the weighted "Smartphone" column where P4_1_6_2 > 0
hogares_con_cel = endutih_vivhogar[endutih_vivhogar["P4_1_6"].eq(1)]
grupo_cel_tipo = (
    hogares_con_cel
    .groupby(["ESTRATO", "Grupo"])["FAC_HOG"]
    .sum()
    .to_frame("Total")
)
grupo_cel_tipo["Móvil"] = (
    hogares_con_cel[hogares_con_cel["P4_1_6_1"].gt(0)]
    .groupby(["ESTRATO", "Grupo"])["Movil"]
    .sum()
)
grupo_cel_tipo["Smartphone"] = (
    hogares_con_cel[hogares_con_cel["P4_1_6_2"].gt(0)]
    .groupby(["ESTRATO", "Grupo"])["Smartphone"]
    .sum()
)
grupo_cel_tipo

Unnamed: 0_level_0,Unnamed: 1_level_0,Total,Móvil,Smartphone
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
1,11,5672484,11641015.0,9943009.0
2,20,16103426,40562730.0,36991337.0
2,21,103537,314914.0,307501.0
2,22,108007,295927.0,311581.0
2,23,83789,208323.0,199622.0
3,30,133743,414680.0,387996.0
3,31,67281,166236.0,169948.0
3,32,103209,298661.0,277190.0
3,33,6798418,18108388.0,17183848.0
3,34,42420,123270.0,117358.0


In [41]:
# Weighted device totals divided by the weighted number of households with a
# cell phone, i.e. an average per such household in each group.
grupo_cel_tipo_promedio = (
    grupo_cel_tipo.loc[:, ["Móvil", "Smartphone"]]
    .div(grupo_cel_tipo["Total"], axis="index")
)
grupo_cel_tipo_promedio

Unnamed: 0_level_0,Unnamed: 1_level_0,Móvil,Smartphone
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1
1,11,2.05219,1.752849
2,20,2.518888,2.29711
2,21,3.04156,2.969962
2,22,2.739887,2.884822
2,23,2.486281,2.382437
3,30,3.100573,2.901057
3,31,2.470772,2.525943
3,32,2.89375,2.685715
3,33,2.663618,2.527625
3,34,2.905941,2.766572


## Sexo

In [42]:
# FAC_HOGAR totals from the resident table per group, split by SEXO.
# No fill_value is given, so an empty cell would stay NaN.
grupo_sexo = endutih_res.pivot_table(
    index=["ESTRATO", "Grupo"],
    columns="SEXO",
    values="FAC_HOGAR",
    aggfunc="sum",
)
# Labels are assigned positionally, in the sorted order of the SEXO codes.
grupo_sexo.columns = pd.Index(["Hombre", "Mujer"], name="SEXO")
grupo_sexo

Unnamed: 0_level_0,SEXO,Hombre,Mujer
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1
1,11,13202300,13864855
2,20,30487305,32364627
2,21,198773,222898
2,22,193702,231715
2,23,149508,163263
3,30,206177,254475
3,31,96885,131775
3,32,159500,200386
3,33,11362394,12025241
3,34,76740,79702


### Relativo al grupo

In [43]:
# Percentage of each sex within every (ESTRATO, Grupo) row: each row is
# divided by its own total, so every row adds up to 100.
totales_por_grupo = grupo_sexo.sum(axis="columns")
grupo_sexo_rel_grupo = grupo_sexo.div(totales_por_grupo, axis="index") * 100
grupo_sexo_rel_grupo

Unnamed: 0_level_0,SEXO,Hombre,Mujer
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1
1,11,48.77609,51.22391
2,20,48.506552,51.493448
2,21,47.139357,52.860643
2,22,45.532266,54.467734
2,23,47.801107,52.198893
3,30,44.757648,55.242352
3,31,42.370769,57.629231
3,32,44.31959,55.68041
3,33,48.582911,51.417089
3,34,49.053323,50.946677


## IDTMex

In [9]:
# Aggregate the merged household/resident table with the project's
# IDTMex.IDTMex function: one row per (ESTRATO, Grupo), one column per ENT.
# NOTE(review): fill_value=0 replaces missing values in the result, so a 0.0
# in the table may mean "no data for this cell" rather than an index of zero —
# confirm.
IDTMex_grupos_edo = pd.pivot_table(
    data=endutih_completa,
    index=["ESTRATO", "Grupo"],
    columns="ENT",
    aggfunc=IDTMex.IDTMex,
    fill_value=0,
)
# Positional relabel of the columns with the state abbreviations; this relies
# on the pivot columns coming out in the same order as the rows of `estados`.
IDTMex_grupos_edo.columns = estados["ENT"]
IDTMex_grupos_edo

  IDTMex_grupos_edo = pd.pivot_table(data=endutih_completa, columns="ENT", index=["ESTRATO", "Grupo"], aggfunc=IDTMex.IDTMex, fill_value=0)


Unnamed: 0_level_0,ENT,Ags.,B.C.,B.C.S,Camp.,Coah.,Col.,Chis.,Chih.,C.D.Mx,Dgo.,Gto.,Gro.,Hgo.,Jal.,Edo. Méx.,Mich.,Mor.,Nay.,N.L.,Oax.,Pue.,Qro.,Q. Roo.,S.L.P,Sin.,Son.,Tab.,Tamps.,Tlax.,Ver.,Yuc.,Zac.
ESTRATO,Grupo,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1
1,11,0.0,3.509422,4.32251,3.152224,2.249533,3.963927,2.136097,2.704921,4.913072,3.019904,3.679311,3.401621,2.955906,2.92644,3.197817,2.357045,4.041712,2.402178,3.824849,3.023366,2.975564,3.399068,3.741518,2.51633,3.22153,4.208157,3.203083,3.959875,2.672378,2.655897,3.283595,3.084682
2,20,4.715311,5.865413,5.45355,5.451482,4.782666,5.155523,4.516427,5.19666,6.676073,4.547788,4.341657,5.353832,4.667045,4.989033,5.654172,4.491235,5.307903,4.775072,6.036698,4.886265,4.705495,5.50679,5.390431,5.114548,4.619368,5.894004,4.694628,5.356183,4.501066,4.687334,4.800562,4.485534
2,21,7.212964,8.055016,8.17397,8.091542,6.232668,7.447854,6.791951,0.0,7.723988,7.666667,7.163437,6.664675,6.520644,7.873503,7.621675,7.308558,7.332781,8.003444,7.333333,8.564876,8.555556,7.788282,7.676731,8.333333,8.925734,8.341163,7.169012,7.391567,6.884443,7.37413,7.824705,8.318033
2,22,6.318044,6.640156,6.356524,5.950369,5.74393,6.0359,6.536865,7.833333,6.546627,5.7375,6.787817,6.4364,4.786023,6.831785,6.162905,5.713394,5.69665,6.529955,6.791345,6.618869,5.500858,6.4057,5.90399,6.348436,5.950587,7.761097,6.414862,6.685359,5.29103,5.831469,5.91706,5.564964
2,23,4.545903,4.770804,5.15437,4.265302,4.278083,5.150232,3.061872,0.0,4.666667,2.888889,3.965488,4.573409,5.007581,5.635662,4.666667,4.397901,3.773863,3.631431,0.0,5.264356,0.0,5.085087,4.807236,5.245774,5.365899,8.333333,4.675206,5.697418,1.789002,5.517515,4.543416,3.455004
3,30,7.340089,7.944129,7.368104,7.188754,6.801749,7.772515,6.333333,6.371514,8.303545,0.0,7.598358,1.666667,0.0,7.181075,7.299473,7.746778,6.993305,8.87101,7.38046,7.676996,0.0,6.717189,6.678219,5.179583,7.00301,8.230919,7.061192,6.892241,8.666667,7.514096,7.259495,6.778885
3,31,5.516981,7.971836,6.597414,6.250826,4.375062,6.547206,6.963058,5.290554,7.253774,6.461579,6.536398,5.698692,1.666667,3.916692,4.486712,6.556072,6.016331,5.599994,5.42827,0.0,6.666667,6.63554,6.379702,7.862977,5.893047,5.78654,0.0,6.958246,8.533333,6.660744,5.877466,4.0
3,32,7.064853,8.008826,5.0,7.897286,8.444444,8.324895,0.0,8.198852,8.796732,0.0,8.150335,0.0,7.127682,7.438901,7.932486,6.969107,8.165602,8.222222,8.359036,7.777778,8.455407,7.707584,7.547274,7.119048,7.052934,8.808401,8.666667,7.076945,0.0,8.234914,7.702095,6.0
3,33,6.177313,7.108091,6.580328,6.732477,6.197529,6.695836,6.618886,6.295855,7.448001,6.276785,6.313263,7.533533,6.425261,6.164887,6.861031,5.999945,6.379561,6.985303,6.904691,6.958877,6.622479,6.955064,6.683844,6.709901,6.222475,7.204768,6.50715,6.340984,6.414961,6.554611,6.617724,6.651896
3,34,6.090581,8.034558,6.377292,7.475884,7.510594,5.652965,0.0,9.0,8.591047,5.833333,6.578192,0.0,0.0,5.983468,0.0,5.749542,6.52202,6.406769,5.166667,7.333333,0.0,6.926497,7.138289,4.940632,6.392205,7.855865,7.222222,5.713063,7.589849,6.111111,5.971142,7.067073


In [10]:
# Write the per-state table to a CSV file under base_path.
ruta_idtmex_grupos_edo = f"{base_path}IDTMex_grupos_edo.csv"
IDTMex_grupos_edo.to_csv(ruta_idtmex_grupos_edo)

In [13]:
# Same aggregation with IDTMex.IDTMex, but with DOMINIO added to the row
# index: one row per (ESTRATO, DOMINIO, Grupo), one column per ENT.
# NOTE(review): fill_value=0 replaces missing values in the result, so a 0.0
# in the table may mean "no data for this cell" rather than an index of zero —
# confirm.
IDTMex_dominio_grupos_edo = pd.pivot_table(
    data=endutih_completa,
    index=["ESTRATO", "DOMINIO", "Grupo"],
    columns="ENT",
    aggfunc=IDTMex.IDTMex,
    fill_value=0,
)
# Positional relabel of the columns with the state abbreviations; this relies
# on the pivot columns coming out in the same order as the rows of `estados`.
IDTMex_dominio_grupos_edo.columns = estados["ENT"]
IDTMex_dominio_grupos_edo

  IDTMex_dominio_grupos_edo = pd.pivot_table(data=endutih_completa, columns="ENT", index=["ESTRATO","DOMINIO","Grupo"], aggfunc=IDTMex.IDTMex, fill_value=0)


Unnamed: 0_level_0,Unnamed: 1_level_0,ENT,Ags.,B.C.,B.C.S,Camp.,Coah.,Col.,Chis.,Chih.,C.D.Mx,Dgo.,Gto.,Gro.,Hgo.,Jal.,Edo. Méx.,Mich.,Mor.,Nay.,N.L.,Oax.,Pue.,Qro.,Q. Roo.,S.L.P,Sin.,Son.,Tab.,Tamps.,Tlax.,Ver.,Yuc.,Zac.
ESTRATO,DOMINIO,Grupo,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1
1,R,11,0.0,3.411529,3.066407,3.058415,2.214322,3.963927,1.927872,2.5961,0.0,2.493391,3.622589,3.012724,2.940582,2.942555,2.878523,2.294252,4.014961,2.402178,3.902891,3.048186,3.074114,3.373671,2.829675,2.527151,3.159647,3.953149,3.208921,3.789917,2.416861,2.657592,3.122539,3.084682
1,U,11,0.0,5.046326,5.00664,3.352829,2.779101,0.0,2.85451,6.896296,4.913072,7.30379,4.612415,4.227316,4.626263,2.822222,3.989717,2.558556,4.120816,0.0,3.097799,2.908738,2.782734,3.930312,4.541718,2.422759,4.487582,5.013222,3.171525,4.799163,3.247217,2.645744,3.374351,0.0
2,R,20,4.70361,4.703621,5.115594,0.0,3.13687,4.474019,3.168165,4.208359,6.175713,3.847917,3.528747,0.0,4.145539,4.509161,4.843588,3.986112,5.03662,3.696058,6.996182,4.358288,3.992689,4.826562,3.403262,4.027668,3.648104,4.830451,3.718298,4.717778,4.152751,3.71481,4.026589,3.78265
2,R,21,6.985203,0.0,8.111111,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6.867514,0.0,8.111111,0.0,9.0,7.666667,0.0,0.0,0.0,5.966667,0.0,8.333333,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2,R,22,6.028424,7.555556,4.996379,0.0,0.0,0.0,0.0,7.833333,0.0,6.888889,7.444444,0.0,5.025865,0.0,0.0,3.777778,6.133333,6.540362,0.0,0.0,4.533333,6.333333,0.0,0.0,0.0,7.222222,7.0,0.0,0.0,4.666667,0.0,5.53093
2,R,23,5.333333,0.0,6.423571,0.0,1.666667,7.333333,0.0,0.0,0.0,2.888889,4.768689,0.0,0.0,5.666667,0.0,6.078945,2.333333,3.881818,0.0,4.111111,0.0,5.311147,0.0,0.0,4.400066,0.0,1.511805,0.0,1.789002,6.844444,2.666667,3.668753
2,U,20,4.724455,6.039523,5.549181,5.451482,5.069195,5.267386,4.673123,5.418688,6.683631,4.84532,4.660503,5.353832,4.906963,5.146406,5.746621,4.652499,5.364835,5.24053,5.795651,5.003387,4.782921,5.893011,5.49034,5.312781,4.999762,6.127174,5.067515,5.398708,4.58111,4.88268,4.87036,4.969656
2,U,21,7.310672,8.055016,8.180849,8.091542,6.232668,7.447854,6.791951,0.0,7.723988,7.666667,7.163437,6.664675,6.309344,7.873503,7.592591,7.308558,7.069271,8.024554,7.333333,8.564876,8.555556,8.143419,7.676731,0.0,8.925734,8.341163,7.169012,7.391567,6.884443,7.37413,7.824705,8.318033
2,U,22,6.390171,6.379414,7.138617,5.950369,5.74393,6.0359,6.536865,0.0,6.546627,2.666667,6.669142,6.4364,4.591853,6.831785,6.162905,6.041708,5.674674,6.45282,6.791345,6.618869,5.634551,6.439208,5.90399,6.348436,5.950587,7.961839,6.379578,6.685359,5.29103,5.947808,5.91706,5.670049
2,U,23,4.395722,4.770804,3.206079,4.265302,5.030954,4.915124,3.061872,0.0,4.666667,0.0,3.659231,4.573409,5.007581,5.602432,4.666667,3.759629,4.02952,2.666667,0.0,5.799471,0.0,4.837021,4.807236,5.245774,5.727419,8.333333,5.308114,5.697418,0.0,5.270904,5.458304,3.142558


In [14]:
# Write the per-state, per-domain table to a CSV file under base_path.
ruta_idtmex_dominio_grupos_edo = f"{base_path}IDTMex_dominio_grupos_edo.csv"
IDTMex_dominio_grupos_edo.to_csv(ruta_idtmex_dominio_grupos_edo)

# Estrato Bajo

## Grupo 11

In [61]:
# Keep only the rows with Grupo == 11 from each of the four source tables
# (households, residents, and the two user tables), in that order.
grupo11_vivhogar, grupo11_res, grupo11_usr, grupo11_usr2 = (
    tabla[tabla["Grupo"] == 11]
    for tabla in (endutih_vivhogar, endutih_res, endutih_usr, endutih_usr2)
)

### Actividad laboral por sexo

In [62]:
# Display labels for the work-situation categories, in the order in which they
# are later assigned positionally to the pivot-table index.
sit_trabajo = [
    "Trabajó",
    "No fue al trabajo",
    "Buscó trabajo",
    "Está jubilado",
    "Se dedicó a estudiar",
    "Quehaceres del hogar",
    "Limitación para trabajar",
    "No trabajó",
]

# Display labels for the two SEXO columns.
sexos = [
    "Hombre",
    "Mujer",
]

# Every (work situation, sex) pair; the situation varies slowest.
combinaciones = [
    (situacion, sexo)
    for situacion in sit_trabajo
    for sexo in sexos
]

In [63]:
# Sum of FAC_HOGAR for group 11 residents, by P3_10 answer (rows) and SEXO
# (columns). Both axes are then relabelled positionally, which assumes the
# pivot yields exactly len(sit_trabajo) rows and len(sexos) columns in the
# same order as those lists (NOTE(review): confirm the P3_10 / SEXO coding).
trabajo_sexo_grupo11 = (
    pd.pivot_table(
        data=grupo11_res,
        values="FAC_HOGAR",
        index="P3_10",
        columns="SEXO",
        aggfunc="sum",
    )
    .set_axis(pd.Index(sit_trabajo, name="Actividad laboral"), axis="index")
    .set_axis(pd.Index(sexos, name="SEXO"), axis="columns")
)
trabajo_sexo_grupo11

SEXO,Hombre,Mujer
Actividad laboral,Unnamed: 1_level_1,Unnamed: 2_level_1
Trabajó,7038453,2486983
No fue al trabajo,156245,59268
Buscó trabajo,252706,42606
Está jubilado,100942,32895
Se dedicó a estudiar,1118822,1352993
Quehaceres del hogar,123600,6191038
Limitación para trabajar,231152,153944
No trabajó,875157,390053


In [64]:
# Share of each sex within every work situation: each row is divided by its
# own total, so every row adds up to 100.
totales_por_actividad = trabajo_sexo_grupo11.sum(axis="columns")
trabajo_sexo_grupo11_rel_grupo = (
    trabajo_sexo_grupo11.div(totales_por_actividad, axis="index") * 100
)
trabajo_sexo_grupo11_rel_grupo

SEXO,Hombre,Mujer
Actividad laboral,Unnamed: 1_level_1,Unnamed: 2_level_1
Trabajó,73.891137,26.108863
No fue al trabajo,72.499107,27.500893
Buscó trabajo,85.572547,14.427453
Está jubilado,75.421595,24.578405
Se dedicó a estudiar,45.263177,54.736823
Quehaceres del hogar,1.957357,98.042643
Limitación para trabajar,60.024513,39.975487
No trabajó,69.170889,30.829111


In [65]:
# Share of each work situation within every sex: each column is divided by
# its own total, so every column adds up to 100.
totales_por_sexo = trabajo_sexo_grupo11.sum(axis="index")
trabajo_sexo_grupo11_rel_sexo = (
    trabajo_sexo_grupo11.div(totales_por_sexo, axis="columns") * 100
)
trabajo_sexo_grupo11_rel_sexo

SEXO,Hombre,Mujer
Actividad laboral,Unnamed: 1_level_1,Unnamed: 2_level_1
Trabajó,71.116482,23.221607
No fue al trabajo,1.578698,0.553401
Buscó trabajo,2.55334,0.397823
Está jubilado,1.019917,0.307149
Se dedicó a estudiar,11.30457,12.633247
Quehaceres del hogar,1.248854,57.807331
Limitación para trabajar,2.335558,1.437415
No trabajó,8.84258,3.642026
