Path: blob/main/Trabajo_grupal/WG5/Tarea grupal 5-COMPLETA grupo 8.py
2714 views
import inspect
import os
import statistics

import numpy as np
import pandas as pd
from pandas import DataFrame, Series
from scipy.stats import t  # Student's t distribution

# Variable names of the CPS 2012 data set (dependent variable first).
lista = ['lnw','female','widowed', 'divorced', 'separated', 'nevermarried', 'hsd08', 'hsd911', 'hsg', 'cg', 'ad', 'mw', 'so', 'we', 'exp1', 'exp2', 'exp3', 'exp4', 'weight', 'ne', 'sc']


class OLSRegClass(object):
    """Ordinary least squares regression with an intercept.

    Parameters
    ----------
    X : pd.DataFrame
        Regressors, one column per variable (the intercept is added
        internally).
    Y : pd.Series or one-column pd.DataFrame
        Dependent variable; must have as many rows as ``X``.
    lista
        List of variable names. It is only stored on the instance.
    RobustStandardError : bool, default False
        When True the variance-covariance matrix is the White (HC0)
        heteroskedasticity-robust sandwich estimator; otherwise the
        classical homoskedastic estimator is used.

    Results are stored as attributes by the methods below
    (``beta``, ``Var``, ``sd``, ``R2``, ...).
    """

    # Every attribute assigned by any method must be declared here, because a
    # class with __slots__ has no per-instance __dict__ to fall back on.
    __slots__ = [
        '__X', 'Y', 'lista', 'RobustStandardError',
        'columns', 'n', 'X1', 'Y1', 'beta', 'nk',
        'y_est', 'error', 'Var', 'sd',
        'límite_inferior', 'límite_superior',
        'SCR', 'SCT', 'rmse', 'R2',
    ]

    def __init__(self, X: pd.DataFrame, Y: pd.Series, lista, RobustStandardError=False):
        self.__X = X
        self.Y = Y
        self.RobustStandardError = RobustStandardError
        self.lista = lista

    @property
    def X(self):
        """Regressor DataFrame passed to the constructor (read-only)."""
        return self.__X

    # Method 1
    def Coeficientes(self):
        """Estimate the OLS coefficients.

        Sets ``columns`` (regressor names), ``n`` (observations), ``X1``
        (design matrix with a leading column of ones), ``Y1`` (``(n, 1)``
        response), ``beta`` (``(k, 1)`` coefficients, intercept first) and
        ``nk`` (degrees of freedom ``n - k``).
        """
        self.columns = self.X.columns.tolist()
        self.n = self.X.shape[0]
        k = self.X.shape[1] + 1  # regressors plus the intercept
        self.X1 = np.column_stack((np.ones(self.n), self.X.to_numpy()))
        self.Y1 = np.asarray(self.Y.to_numpy(), dtype=float).reshape(self.n, 1)
        # Solve the normal equations (X'X) beta = X'Y without forming the inverse.
        self.beta = np.linalg.solve(self.X1.T @ self.X1, self.X1.T @ self.Y1)
        self.nk = self.n - k

    def _ajustar(self):
        """Fit the model and store fitted values and residuals."""
        self.Coeficientes()
        self.y_est = self.X1 @ self.beta
        self.error = self.Y1 - self.y_est

    # Methods 2 and 3
    def Error_var_cov_intcof(self):
        """Compute the variance-covariance matrix, standard errors and CIs.

        Sets ``Var`` (``(k, k)``), ``sd`` (``(k,)``) and the confidence
        bounds ``límite_inferior`` / ``límite_superior`` (``(k,)``), built
        with the normal critical value 1.96.
        """
        self._ajustar()
        xtx_inv = np.linalg.inv(self.X1.T @ self.X1)

        if self.RobustStandardError:
            # White sandwich: (X'X)^-1 X' diag(e^2) X (X'X)^-1. Scaling the
            # rows of X1 by e^2 avoids materialising the n x n diagonal matrix.
            centro = (self.X1 * self.error ** 2).T @ self.X1
            self.Var = xtx_inv @ centro @ xtx_inv
        else:
            # Classical case: sigma^2 (X'X)^-1 with sigma^2 = SSR / (n - k).
            sigma = float((self.error ** 2).sum()) / self.nk
            self.Var = sigma * xtx_inv

        self.sd = np.sqrt(np.diag(self.Var))
        # beta is a (k, 1) column while sd is (k,); flatten first so the
        # arithmetic is element-wise instead of broadcasting to (k, k).
        coef = self.beta.flatten()
        self.límite_inferior = coef - 1.96 * self.sd
        self.límite_superior = coef + 1.96 * self.sd

    # Method 4
    def R2yMSE(self):
        """Compute goodness-of-fit statistics.

        Sets ``SCR`` (residual sum of squares), ``SCT`` (total sum of squares
        around the mean of Y), ``rmse`` (``sqrt(SCR / n)``) and ``R2``.
        """
        self._ajustar()
        self.SCR = float((self.error ** 2).sum())
        self.SCT = float(((self.Y1 - self.Y1.mean()) ** 2).sum())
        self.rmse = (self.SCR / self.n) ** 0.5
        self.R2 = 1 - self.SCR / self.SCT

    # Method 5
    def _Table(self, *Kargs, **Kwargs):
        """Return the regression results as a table.

        The output format is chosen with ``Output="DataFrame"`` (default) or
        ``Output="Diccionario"``; it may also be given as the first
        positional argument.

        Returns
        -------
        pd.DataFrame or dict
            Columns/keys ``OLS``, ``standar_error``, ``Pvalue``,
            ``Lower_bound``, ``Upper_bound`` (one value per coefficient,
            intercept first) plus the scalars ``Root_MSE`` and ``R2``
            (repeated on every row of the DataFrame).

        Raises
        ------
        ValueError
            If the requested output format is not recognised.
        """
        salida = Kwargs.get("Output", Kargs[0] if Kargs else "DataFrame")
        if salida not in ("DataFrame", "Diccionario"):
            raise ValueError(
                f"Output must be 'DataFrame' or 'Diccionario', got {salida!r}"
            )

        self.R2yMSE()
        # Standard errors honour the RobustStandardError flag.
        self.Error_var_cov_intcof()

        coef = self.beta.flatten()
        t_est = np.absolute(coef / self.sd)
        # Two-sided p-value; sf is the survival function 1 - cdf.
        pvalue = 2 * t.sf(t_est, df=self.nk)

        resultados = {
            "OLS": coef,
            "standar_error": self.sd,
            "Pvalue": pvalue,
            "Lower_bound": self.límite_inferior,
            "Upper_bound": self.límite_superior,
            "Root_MSE": self.rmse,
            "R2": self.R2,
        }
        if salida == "DataFrame":
            return pd.DataFrame(resultados)
        return resultados


if __name__ == "__main__":
    # Imported here so that importing this module does not require the
    # third-party R-data reader.
    import pyreadr

    user = os.getlogin()  # username
    os.chdir(f"C:/Users/{user}/Documents/GitHub/1ECO35_2022_2")  # working directory

    # read_r returns a dictionary; the data set is stored under the key "data".
    cps2012_env = pyreadr.read_r("data/cps2012.Rdata")
    cps2012 = cps2012_env['data']
    dt = cps2012.describe()

    # Keep only the columns whose variance is not zero.
    variance_cols = cps2012.var().to_numpy()
    Dataset = cps2012.iloc[:, np.where(variance_cols != 0)[0]]
    X = Dataset.iloc[:, 1:10]
    Y = Dataset[['lnw']]
    OLSRegClass(X, Y, lista, RobustStandardError=True)

# Question 2
# NOTE(review): the line below is not Python; it looks like the start of a Jupyter-notebook JSON dump appended to this script. Kept verbatim.
# 128{129"cells": [130{131"cell_type": "code",132"execution_count": 5,133"id": "90e53f84",134"metadata": {},135"outputs": [136{137"data": {138"text/html": [139"\n",140"<style>\n",141" div#notebook-container { width: 75%; }\n",142" div#menubar-container { width: 95%; }\n",143" div#maintoolbar-container { width: 65%; }a\n",144"</style>\n"145],146"text/plain": [147"<IPython.core.display.HTML object>"148]149},150"metadata": {},151"output_type": "display_data"152}153],154"source": [155"from IPython.display import display, HTML\n",156"\n",157"display(HTML(data=\"\"\"\n",158"<style>\n",159" div#notebook-container { width: 75%; }\n",160" div#menubar-container { width: 95%; }\n",161" div#maintoolbar-container { width: 65%; }a\n",162"</style>\n",163"\"\"\"))"164]165},166{167"cell_type": "code",168"execution_count": 6,169"id": "d596a6bf",170"metadata": {},171"outputs": [],172"source": [173"import numpy as np\n",174"import pandas as pd\n",175"from pandas import DataFrame,Series"176]177},178{179"cell_type": "code",180"execution_count": 7,181"id": "d5d95a3c",182"metadata": {183"scrolled": true184},185"outputs": [186{187"name": "stdout",188"output_type": "stream",189"text": [190"Requirement already satisfied: pyreadstat in c:\\users\\sabina\\anaconda3\\lib\\site-packages (1.1.9)\n",191"Requirement already satisfied: pandas>=1.2.0 in c:\\users\\sabina\\anaconda3\\lib\\site-packages (from pyreadstat) (1.4.2)\n",192"Requirement already satisfied: 
numpy>=1.18.5 in c:\\users\\sabina\\anaconda3\\lib\\site-packages (from pandas>=1.2.0->pyreadstat) (1.21.5)\n",193"Requirement already satisfied: pytz>=2020.1 in c:\\users\\sabina\\anaconda3\\lib\\site-packages (from pandas>=1.2.0->pyreadstat) (2021.3)\n",194"Requirement already satisfied: python-dateutil>=2.8.1 in c:\\users\\sabina\\anaconda3\\lib\\site-packages (from pandas>=1.2.0->pyreadstat) (2.8.2)\n",195"Requirement already satisfied: six>=1.5 in c:\\users\\sabina\\anaconda3\\lib\\site-packages (from python-dateutil>=2.8.1->pandas>=1.2.0->pyreadstat) (1.16.0)\n"196]197}198],199"source": [200"!pip install pyreadstat "201]202},203{204"cell_type": "code",205"execution_count": 8,206"id": "1778f7a7",207"metadata": {},208"outputs": [209{210"name": "stdout",211"output_type": "stream",212"text": [213"Requirement already satisfied: savReaderWriter in c:\\users\\sabina\\anaconda3\\lib\\site-packages (3.4.2)\n"214]215}216],217"source": [218"# para guardar y abrir en formato spss\n",219"!pip install savReaderWriter \n"220]221},222{223"cell_type": "code",224"execution_count": 9,225"id": "6b95cf54",226"metadata": {},227"outputs": [],228"source": [229"# cargamos sav usando pandas\n",230"data_administrativa = pd.read_spss( r\"../../data/data_administrativa.sav\" )"231]232},233{234"cell_type": "code",235"execution_count": 10,236"id": "14432a93",237"metadata": {},238"outputs": [239{240"data": {241"text/html": [242"<div>\n",243"<style scoped>\n",244" .dataframe tbody tr th:only-of-type {\n",245" vertical-align: middle;\n",246" }\n",247"\n",248" .dataframe tbody tr th {\n",249" vertical-align: top;\n",250" }\n",251"\n",252" .dataframe thead th {\n",253" text-align: right;\n",254" }\n",255"</style>\n",256"<table border=\"1\" class=\"dataframe\">\n",257" <thead>\n",258" <tr style=\"text-align: right;\">\n",259" <th></th>\n",260" <th>year</th>\n",261" <th>MES</th>\n",262" <th>CONGLOME</th>\n",263" <th>VIVIENDA</th>\n",264" <th>HOGAR</th>\n",265" <th>CODPERSO</th>\n",266" 
<th>UBIGEO</th>\n",267" <th>DOMINIO</th>\n",268" <th>ESTRATO</th>\n",269" <th>P201P</th>\n",270" <th>P203</th>\n",271" <th>P203A</th>\n",272" <th>P203B</th>\n",273" <th>P204</th>\n",274" <th>P205</th>\n",275" <th>P206</th>\n",276" <th>P207</th>\n",277" <th>P208A</th>\n",278" <th>P208B</th>\n",279" <th>P209</th>\n",280" </tr>\n",281" </thead>\n",282" <tbody>\n",283" <tr>\n",284" <th>0</th>\n",285" <td>2020</td>\n",286" <td>06</td>\n",287" <td>010108</td>\n",288" <td>136</td>\n",289" <td>11</td>\n",290" <td>02</td>\n",291" <td>100111</td>\n",292" <td>Sierra Centro</td>\n",293" <td>De 100 000 a 499 999 habitantes</td>\n",294" <td>20200101081361102</td>\n",295" <td>Esposo(a)/compañero(a)</td>\n",296" <td>NaN</td>\n",297" <td>NaN</td>\n",298" <td>Si</td>\n",299" <td>No</td>\n",300" <td>NaN</td>\n",301" <td>Mujer</td>\n",302" <td>43.0</td>\n",303" <td>NaN</td>\n",304" <td>Casado(a)</td>\n",305" </tr>\n",306" <tr>\n",307" <th>1</th>\n",308" <td>2020</td>\n",309" <td>06</td>\n",310" <td>020257</td>\n",311" <td>093</td>\n",312" <td>11</td>\n",313" <td>04</td>\n",314" <td>250107</td>\n",315" <td>Selva</td>\n",316" <td>De 100 000 a 499 999 habitantes</td>\n",317" <td>20200202570931104</td>\n",318" <td>Hijo(a)/Hijastro(a)</td>\n",319" <td>NaN</td>\n",320" <td>NaN</td>\n",321" <td>Si</td>\n",322" <td>No</td>\n",323" <td>NaN</td>\n",324" <td>Hombre</td>\n",325" <td>17.0</td>\n",326" <td>NaN</td>\n",327" <td>Soltero(a)</td>\n",328" </tr>\n",329" <tr>\n",330" <th>2</th>\n",331" <td>2020</td>\n",332" <td>06</td>\n",333" <td>015537</td>\n",334" <td>065</td>\n",335" <td>11</td>\n",336" <td>04</td>\n",337" <td>040126</td>\n",338" <td>Sierra Sur</td>\n",339" <td>De 500 000 a más habitantes</td>\n",340" <td>20200155370651104</td>\n",341" <td>Hijo(a)/Hijastro(a)</td>\n",342" <td>NaN</td>\n",343" <td>NaN</td>\n",344" <td>Si</td>\n",345" <td>No</td>\n",346" <td>NaN</td>\n",347" <td>Mujer</td>\n",348" <td>9.0</td>\n",349" <td>NaN</td>\n",350" <td>NaN</td>\n",351" </tr>\n",352" <tr>\n",353" 
<th>3</th>\n",354" <td>2019</td>\n",355" <td>10</td>\n",356" <td>010614</td>\n",357" <td>043</td>\n",358" <td>11</td>\n",359" <td>07</td>\n",360" <td>130901</td>\n",361" <td>Sierra Norte</td>\n",362" <td>De 20 000 a 49 999 habitantes</td>\n",363" <td>20190106140431107</td>\n",364" <td>Otros parientes</td>\n",365" <td>2.0</td>\n",366" <td>Hijo(a)</td>\n",367" <td>No</td>\n",368" <td>NaN</td>\n",369" <td>No</td>\n",370" <td>Mujer</td>\n",371" <td>4.0</td>\n",372" <td>NaN</td>\n",373" <td>NaN</td>\n",374" </tr>\n",375" <tr>\n",376" <th>4</th>\n",377" <td>2020</td>\n",378" <td>06</td>\n",379" <td>009390</td>\n",380" <td>096</td>\n",381" <td>11</td>\n",382" <td>04</td>\n",383" <td>230110</td>\n",384" <td>Costa Sur</td>\n",385" <td>De 100 000 a 499 999 habitantes</td>\n",386" <td>20180093900961104</td>\n",387" <td>Panel</td>\n",388" <td>NaN</td>\n",389" <td>NaN</td>\n",390" <td>NaN</td>\n",391" <td>NaN</td>\n",392" <td>NaN</td>\n",393" <td>NaN</td>\n",394" <td>NaN</td>\n",395" <td>NaN</td>\n",396" <td>NaN</td>\n",397" </tr>\n",398" <tr>\n",399" <th>...</th>\n",400" <td>...</td>\n",401" <td>...</td>\n",402" <td>...</td>\n",403" <td>...</td>\n",404" <td>...</td>\n",405" <td>...</td>\n",406" <td>...</td>\n",407" <td>...</td>\n",408" <td>...</td>\n",409" <td>...</td>\n",410" <td>...</td>\n",411" <td>...</td>\n",412" <td>...</td>\n",413" <td>...</td>\n",414" <td>...</td>\n",415" <td>...</td>\n",416" <td>...</td>\n",417" <td>...</td>\n",418" <td>...</td>\n",419" <td>...</td>\n",420" </tr>\n",421" <tr>\n",422" <th>85030</th>\n",423" <td>2020</td>\n",424" <td>12</td>\n",425" <td>007337</td>\n",426" <td>004</td>\n",427" <td>11</td>\n",428" <td>01</td>\n",429" <td>140105</td>\n",430" <td>Costa Norte</td>\n",431" <td>De 100 000 a 499 999 habitantes</td>\n",432" <td>20200073370041101</td>\n",433" <td>Jefe/Jefa</td>\n",434" <td>1.0</td>\n",435" <td>Jefe/jefa de hogar</td>\n",436" <td>Si</td>\n",437" <td>No</td>\n",438" <td>NaN</td>\n",439" <td>Hombre</td>\n",440" 
<td>65.0</td>\n",441" <td>NaN</td>\n",442" <td>Casado(a)</td>\n",443" </tr>\n",444" <tr>\n",445" <th>85031</th>\n",446" <td>2019</td>\n",447" <td>04</td>\n",448" <td>008226</td>\n",449" <td>084</td>\n",450" <td>13</td>\n",451" <td>02</td>\n",452" <td>160112</td>\n",453" <td>Selva</td>\n",454" <td>De 100 000 a 499 999 habitantes</td>\n",455" <td>20190082260841302</td>\n",456" <td>Otros no parientes</td>\n",457" <td>0.0</td>\n",458" <td>Jefe/jefa de hogar</td>\n",459" <td>Si</td>\n",460" <td>No</td>\n",461" <td>NaN</td>\n",462" <td>Mujer</td>\n",463" <td>89.0</td>\n",464" <td>NaN</td>\n",465" <td>Viudo(a)</td>\n",466" </tr>\n",467" <tr>\n",468" <th>85032</th>\n",469" <td>2019</td>\n",470" <td>05</td>\n",471" <td>008965</td>\n",472" <td>060</td>\n",473" <td>11</td>\n",474" <td>03</td>\n",475" <td>210101</td>\n",476" <td>Sierra Sur</td>\n",477" <td>De 100 000 a 499 999 habitantes</td>\n",478" <td>20190089650601103</td>\n",479" <td>Hijo(a)/Hijastro(a)</td>\n",480" <td>1.0</td>\n",481" <td>Hijo(a)</td>\n",482" <td>Si</td>\n",483" <td>No</td>\n",484" <td>NaN</td>\n",485" <td>Hombre</td>\n",486" <td>20.0</td>\n",487" <td>NaN</td>\n",488" <td>Soltero(a)</td>\n",489" </tr>\n",490" <tr>\n",491" <th>85033</th>\n",492" <td>2020</td>\n",493" <td>05</td>\n",494" <td>010311</td>\n",495" <td>022</td>\n",496" <td>11</td>\n",497" <td>02</td>\n",498" <td>200501</td>\n",499" <td>Costa Norte</td>\n",500" <td>De 50 000 a 99 999 habitantes</td>\n",501" <td>20200103110221102</td>\n",502" <td>Esposo(a)/compañero(a)</td>\n",503" <td>NaN</td>\n",504" <td>NaN</td>\n",505" <td>Si</td>\n",506" <td>No</td>\n",507" <td>NaN</td>\n",508" <td>Mujer</td>\n",509" <td>48.0</td>\n",510" <td>NaN</td>\n",511" <td>Casado(a)</td>\n",512" </tr>\n",513" <tr>\n",514" <th>85034</th>\n",515" <td>2020</td>\n",516" <td>11</td>\n",517" <td>018778</td>\n",518" <td>155</td>\n",519" <td>11</td>\n",520" <td>06</td>\n",521" <td>160404</td>\n",522" <td>Selva</td>\n",523" <td>Área de Empadronamiento Rural (AER) 
Compuesto</td>\n",524" <td>20200187781551106</td>\n",525" <td>Hijo(a)/Hijastro(a)</td>\n",526" <td>2.0</td>\n",527" <td>Jefe/jefa de hogar</td>\n",528" <td>Si</td>\n",529" <td>No</td>\n",530" <td>NaN</td>\n",531" <td>Hombre</td>\n",532" <td>22.0</td>\n",533" <td>NaN</td>\n",534" <td>Conviviente</td>\n",535" </tr>\n",536" </tbody>\n",537"</table>\n",538"<p>85035 rows × 20 columns</p>\n",539"</div>"540],541"text/plain": [542" year MES CONGLOME VIVIENDA HOGAR CODPERSO UBIGEO DOMINIO \\\n",543"0 2020 06 010108 136 11 02 100111 Sierra Centro \n",544"1 2020 06 020257 093 11 04 250107 Selva \n",545"2 2020 06 015537 065 11 04 040126 Sierra Sur \n",546"3 2019 10 010614 043 11 07 130901 Sierra Norte \n",547"4 2020 06 009390 096 11 04 230110 Costa Sur \n",548"... ... .. ... ... ... ... ... ... \n",549"85030 2020 12 007337 004 11 01 140105 Costa Norte \n",550"85031 2019 04 008226 084 13 02 160112 Selva \n",551"85032 2019 05 008965 060 11 03 210101 Sierra Sur \n",552"85033 2020 05 010311 022 11 02 200501 Costa Norte \n",553"85034 2020 11 018778 155 11 06 160404 Selva \n",554"\n",555" ESTRATO P201P \\\n",556"0 De 100 000 a 499 999 habitantes 20200101081361102 \n",557"1 De 100 000 a 499 999 habitantes 20200202570931104 \n",558"2 De 500 000 a más habitantes 20200155370651104 \n",559"3 De 20 000 a 49 999 habitantes 20190106140431107 \n",560"4 De 100 000 a 499 999 habitantes 20180093900961104 \n",561"... ... ... 
\n",562"85030 De 100 000 a 499 999 habitantes 20200073370041101 \n",563"85031 De 100 000 a 499 999 habitantes 20190082260841302 \n",564"85032 De 100 000 a 499 999 habitantes 20190089650601103 \n",565"85033 De 50 000 a 99 999 habitantes 20200103110221102 \n",566"85034 Área de Empadronamiento Rural (AER) Compuesto 20200187781551106 \n",567"\n",568" P203 P203A P203B P204 P205 P206 \\\n",569"0 Esposo(a)/compañero(a) NaN NaN Si No NaN \n",570"1 Hijo(a)/Hijastro(a) NaN NaN Si No NaN \n",571"2 Hijo(a)/Hijastro(a) NaN NaN Si No NaN \n",572"3 Otros parientes 2.0 Hijo(a) No NaN No \n",573"4 Panel NaN NaN NaN NaN NaN \n",574"... ... ... ... ... ... ... \n",575"85030 Jefe/Jefa 1.0 Jefe/jefa de hogar Si No NaN \n",576"85031 Otros no parientes 0.0 Jefe/jefa de hogar Si No NaN \n",577"85032 Hijo(a)/Hijastro(a) 1.0 Hijo(a) Si No NaN \n",578"85033 Esposo(a)/compañero(a) NaN NaN Si No NaN \n",579"85034 Hijo(a)/Hijastro(a) 2.0 Jefe/jefa de hogar Si No NaN \n",580"\n",581" P207 P208A P208B P209 \n",582"0 Mujer 43.0 NaN Casado(a) \n",583"1 Hombre 17.0 NaN Soltero(a) \n",584"2 Mujer 9.0 NaN NaN \n",585"3 Mujer 4.0 NaN NaN \n",586"4 NaN NaN NaN NaN \n",587"... ... ... ... ... 
\n",588"85030 Hombre 65.0 NaN Casado(a) \n",589"85031 Mujer 89.0 NaN Viudo(a) \n",590"85032 Hombre 20.0 NaN Soltero(a) \n",591"85033 Mujer 48.0 NaN Casado(a) \n",592"85034 Hombre 22.0 NaN Conviviente \n",593"\n",594"[85035 rows x 20 columns]"595]596},597"execution_count": 10,598"metadata": {},599"output_type": "execute_result"600}601],602"source": [603"data_administrativa"604]605},606{607"cell_type": "code",608"execution_count": 11,609"id": "376cb6a9",610"metadata": {},611"outputs": [612{613"data": {614"text/html": [615"<div>\n",616"<style scoped>\n",617" .dataframe tbody tr th:only-of-type {\n",618" vertical-align: middle;\n",619" }\n",620"\n",621" .dataframe tbody tr th {\n",622" vertical-align: top;\n",623" }\n",624"\n",625" .dataframe thead th {\n",626" text-align: right;\n",627" }\n",628"</style>\n",629"<table border=\"1\" class=\"dataframe\">\n",630" <thead>\n",631" <tr style=\"text-align: right;\">\n",632" <th></th>\n",633" <th>year</th>\n",634" <th>MES</th>\n",635" <th>CONGLOME</th>\n",636" <th>VIVIENDA</th>\n",637" <th>HOGAR</th>\n",638" <th>CODPERSO</th>\n",639" <th>UBIGEO</th>\n",640" <th>DOMINIO</th>\n",641" <th>ESTRATO</th>\n",642" <th>P201P</th>\n",643" <th>P203</th>\n",644" <th>P203A</th>\n",645" <th>P203B</th>\n",646" <th>P204</th>\n",647" <th>P205</th>\n",648" <th>P206</th>\n",649" <th>P207</th>\n",650" <th>P208A</th>\n",651" <th>P208B</th>\n",652" <th>P209</th>\n",653" </tr>\n",654" </thead>\n",655" <tbody>\n",656" <tr>\n",657" <th>0</th>\n",658" <td>False</td>\n",659" <td>False</td>\n",660" <td>False</td>\n",661" <td>False</td>\n",662" <td>False</td>\n",663" <td>False</td>\n",664" <td>False</td>\n",665" <td>False</td>\n",666" <td>False</td>\n",667" <td>False</td>\n",668" <td>False</td>\n",669" <td>True</td>\n",670" <td>True</td>\n",671" <td>False</td>\n",672" <td>False</td>\n",673" <td>True</td>\n",674" <td>False</td>\n",675" <td>False</td>\n",676" <td>True</td>\n",677" <td>False</td>\n",678" </tr>\n",679" <tr>\n",680" <th>1</th>\n",681" 
<td>False</td>\n",682" <td>False</td>\n",683" <td>False</td>\n",684" <td>False</td>\n",685" <td>False</td>\n",686" <td>False</td>\n",687" <td>False</td>\n",688" <td>False</td>\n",689" <td>False</td>\n",690" <td>False</td>\n",691" <td>False</td>\n",692" <td>True</td>\n",693" <td>True</td>\n",694" <td>False</td>\n",695" <td>False</td>\n",696" <td>True</td>\n",697" <td>False</td>\n",698" <td>False</td>\n",699" <td>True</td>\n",700" <td>False</td>\n",701" </tr>\n",702" <tr>\n",703" <th>2</th>\n",704" <td>False</td>\n",705" <td>False</td>\n",706" <td>False</td>\n",707" <td>False</td>\n",708" <td>False</td>\n",709" <td>False</td>\n",710" <td>False</td>\n",711" <td>False</td>\n",712" <td>False</td>\n",713" <td>False</td>\n",714" <td>False</td>\n",715" <td>True</td>\n",716" <td>True</td>\n",717" <td>False</td>\n",718" <td>False</td>\n",719" <td>True</td>\n",720" <td>False</td>\n",721" <td>False</td>\n",722" <td>True</td>\n",723" <td>True</td>\n",724" </tr>\n",725" <tr>\n",726" <th>3</th>\n",727" <td>False</td>\n",728" <td>False</td>\n",729" <td>False</td>\n",730" <td>False</td>\n",731" <td>False</td>\n",732" <td>False</td>\n",733" <td>False</td>\n",734" <td>False</td>\n",735" <td>False</td>\n",736" <td>False</td>\n",737" <td>False</td>\n",738" <td>False</td>\n",739" <td>False</td>\n",740" <td>False</td>\n",741" <td>True</td>\n",742" <td>False</td>\n",743" <td>False</td>\n",744" <td>False</td>\n",745" <td>True</td>\n",746" <td>True</td>\n",747" </tr>\n",748" <tr>\n",749" <th>4</th>\n",750" <td>False</td>\n",751" <td>False</td>\n",752" <td>False</td>\n",753" <td>False</td>\n",754" <td>False</td>\n",755" <td>False</td>\n",756" <td>False</td>\n",757" <td>False</td>\n",758" <td>False</td>\n",759" <td>False</td>\n",760" <td>False</td>\n",761" <td>True</td>\n",762" <td>True</td>\n",763" <td>True</td>\n",764" <td>True</td>\n",765" <td>True</td>\n",766" <td>True</td>\n",767" <td>True</td>\n",768" <td>True</td>\n",769" <td>True</td>\n",770" </tr>\n",771" <tr>\n",772" 
<th>...</th>\n",773" <td>...</td>\n",774" <td>...</td>\n",775" <td>...</td>\n",776" <td>...</td>\n",777" <td>...</td>\n",778" <td>...</td>\n",779" <td>...</td>\n",780" <td>...</td>\n",781" <td>...</td>\n",782" <td>...</td>\n",783" <td>...</td>\n",784" <td>...</td>\n",785" <td>...</td>\n",786" <td>...</td>\n",787" <td>...</td>\n",788" <td>...</td>\n",789" <td>...</td>\n",790" <td>...</td>\n",791" <td>...</td>\n",792" <td>...</td>\n",793" </tr>\n",794" <tr>\n",795" <th>85030</th>\n",796" <td>False</td>\n",797" <td>False</td>\n",798" <td>False</td>\n",799" <td>False</td>\n",800" <td>False</td>\n",801" <td>False</td>\n",802" <td>False</td>\n",803" <td>False</td>\n",804" <td>False</td>\n",805" <td>False</td>\n",806" <td>False</td>\n",807" <td>False</td>\n",808" <td>False</td>\n",809" <td>False</td>\n",810" <td>False</td>\n",811" <td>True</td>\n",812" <td>False</td>\n",813" <td>False</td>\n",814" <td>True</td>\n",815" <td>False</td>\n",816" </tr>\n",817" <tr>\n",818" <th>85031</th>\n",819" <td>False</td>\n",820" <td>False</td>\n",821" <td>False</td>\n",822" <td>False</td>\n",823" <td>False</td>\n",824" <td>False</td>\n",825" <td>False</td>\n",826" <td>False</td>\n",827" <td>False</td>\n",828" <td>False</td>\n",829" <td>False</td>\n",830" <td>False</td>\n",831" <td>False</td>\n",832" <td>False</td>\n",833" <td>False</td>\n",834" <td>True</td>\n",835" <td>False</td>\n",836" <td>False</td>\n",837" <td>True</td>\n",838" <td>False</td>\n",839" </tr>\n",840" <tr>\n",841" <th>85032</th>\n",842" <td>False</td>\n",843" <td>False</td>\n",844" <td>False</td>\n",845" <td>False</td>\n",846" <td>False</td>\n",847" <td>False</td>\n",848" <td>False</td>\n",849" <td>False</td>\n",850" <td>False</td>\n",851" <td>False</td>\n",852" <td>False</td>\n",853" <td>False</td>\n",854" <td>False</td>\n",855" <td>False</td>\n",856" <td>False</td>\n",857" <td>True</td>\n",858" <td>False</td>\n",859" <td>False</td>\n",860" <td>True</td>\n",861" <td>False</td>\n",862" </tr>\n",863" <tr>\n",864" 
<th>85033</th>\n",865" <td>False</td>\n",866" <td>False</td>\n",867" <td>False</td>\n",868" <td>False</td>\n",869" <td>False</td>\n",870" <td>False</td>\n",871" <td>False</td>\n",872" <td>False</td>\n",873" <td>False</td>\n",874" <td>False</td>\n",875" <td>False</td>\n",876" <td>True</td>\n",877" <td>True</td>\n",878" <td>False</td>\n",879" <td>False</td>\n",880" <td>True</td>\n",881" <td>False</td>\n",882" <td>False</td>\n",883" <td>True</td>\n",884" <td>False</td>\n",885" </tr>\n",886" <tr>\n",887" <th>85034</th>\n",888" <td>False</td>\n",889" <td>False</td>\n",890" <td>False</td>\n",891" <td>False</td>\n",892" <td>False</td>\n",893" <td>False</td>\n",894" <td>False</td>\n",895" <td>False</td>\n",896" <td>False</td>\n",897" <td>False</td>\n",898" <td>False</td>\n",899" <td>False</td>\n",900" <td>False</td>\n",901" <td>False</td>\n",902" <td>False</td>\n",903" <td>True</td>\n",904" <td>False</td>\n",905" <td>False</td>\n",906" <td>True</td>\n",907" <td>False</td>\n",908" </tr>\n",909" </tbody>\n",910"</table>\n",911"<p>85035 rows × 20 columns</p>\n",912"</div>"913],914"text/plain": [915" year MES CONGLOME VIVIENDA HOGAR CODPERSO UBIGEO DOMINIO \\\n",916"0 False False False False False False False False \n",917"1 False False False False False False False False \n",918"2 False False False False False False False False \n",919"3 False False False False False False False False \n",920"4 False False False False False False False False \n",921"... ... ... ... ... ... ... ... ... 
\n",922"85030 False False False False False False False False \n",923"85031 False False False False False False False False \n",924"85032 False False False False False False False False \n",925"85033 False False False False False False False False \n",926"85034 False False False False False False False False \n",927"\n",928" ESTRATO P201P P203 P203A P203B P204 P205 P206 P207 P208A \\\n",929"0 False False False True True False False True False False \n",930"1 False False False True True False False True False False \n",931"2 False False False True True False False True False False \n",932"3 False False False False False False True False False False \n",933"4 False False False True True True True True True True \n",934"... ... ... ... ... ... ... ... ... ... ... \n",935"85030 False False False False False False False True False False \n",936"85031 False False False False False False False True False False \n",937"85032 False False False False False False False True False False \n",938"85033 False False False True True False False True False False \n",939"85034 False False False False False False False True False False \n",940"\n",941" P208B P209 \n",942"0 True False \n",943"1 True False \n",944"2 True True \n",945"3 True True \n",946"4 True True \n",947"... ... ... \n",948"85030 True False \n",949"85031 True False \n",950"85032 True False \n",951"85033 True False \n",952"85034 True False \n",953"\n",954"[85035 rows x 20 columns]"955]956},957"execution_count": 11,958"metadata": {},959"output_type": "execute_result"960}961],962"source": [963"# Mostramos las variables que presentan missing values\n",964"\n",965"data_administrativa. 
isnull()\n",966"\n",967"# Se puede observar que hay missing values en las siguientes vairables:\n",968"# P203A, P203B, P204, P205, P206, P207, P208A, P208B, P209"969]970},971{972"cell_type": "code",973"execution_count": 12,974"id": "3d54b206",975"metadata": {},976"outputs": [],977"source": [978"import savReaderWriter as sav # importamos sav (paquete)\n",979"\n",980"\n",981"with sav.SavHeaderReader( r\"../../data/data_administrativa.sav\" , ioUtf8=True) as header:\n",982" metadata = header.all() # guardamos dataset\n",983" labels_data_administrativa = metadata.valueLabels # para obtener etiquetas de los valores de variables \n",984" var_labels_data_administrativa = metadata.varLabels # etiquetas de varibales \n",985" "986]987},988{989"cell_type": "code",990"execution_count": 13,991"id": "69240e49",992"metadata": {},993"outputs": [994{995"data": {996"text/plain": [997"dict"998]999},1000"execution_count": 13,1001"metadata": {},1002"output_type": "execute_result"1003}1004],1005"source": [1006"type(labels_data_administrativa)"1007]1008},1009{1010"cell_type": "code",1011"execution_count": 14,1012"id": "b6510251",1013"metadata": {},1014"outputs": [1015{1016"data": {1017"text/plain": [1018"dict_keys(['DOMINIO', 'ESTRATO', 'P203', 'P203B', 'P204', 'P205', 'P206', 'P207', 'P209'])"1019]1020},1021"execution_count": 14,1022"metadata": {},1023"output_type": "execute_result"1024}1025],1026"source": [1027"labels_data_administrativa.keys()"1028]1029},1030{1031"cell_type": "code",1032"execution_count": 15,1033"id": "742e3ab0",1034"metadata": {1035"scrolled": true1036},1037"outputs": [1038{1039"data": {1040"text/html": [1041"<div>\n",1042"<style scoped>\n",1043" .dataframe tbody tr th:only-of-type {\n",1044" vertical-align: middle;\n",1045" }\n",1046"\n",1047" .dataframe tbody tr th {\n",1048" vertical-align: top;\n",1049" }\n",1050"\n",1051" .dataframe thead th {\n",1052" text-align: right;\n",1053" }\n",1054"</style>\n",1055"<table border=\"1\" class=\"dataframe\">\n",1056" 
<thead>\n",1057" <tr style=\"text-align: right;\">\n",1058" <th></th>\n",1059" <th>year</th>\n",1060" <th>MES</th>\n",1061" <th>CONGLOME</th>\n",1062" <th>VIVIENDA</th>\n",1063" <th>HOGAR</th>\n",1064" <th>CODPERSO</th>\n",1065" <th>UBIGEO</th>\n",1066" <th>DOMINIO</th>\n",1067" <th>ESTRATO</th>\n",1068" <th>P201P</th>\n",1069" <th>P203</th>\n",1070" <th>P203A</th>\n",1071" <th>P203B</th>\n",1072" <th>P204</th>\n",1073" <th>P205</th>\n",1074" <th>P206</th>\n",1075" <th>P207</th>\n",1076" <th>P208A</th>\n",1077" <th>P208B</th>\n",1078" <th>P209</th>\n",1079" </tr>\n",1080" </thead>\n",1081" <tbody>\n",1082" <tr>\n",1083" <th>0</th>\n",1084" <td>2020</td>\n",1085" <td>06</td>\n",1086" <td>010108</td>\n",1087" <td>136</td>\n",1088" <td>11</td>\n",1089" <td>02</td>\n",1090" <td>100111</td>\n",1091" <td>Sierra Centro</td>\n",1092" <td>De 100 000 a 499 999 habitantes</td>\n",1093" <td>20200101081361102</td>\n",1094" <td>Esposo(a)/compañero(a)</td>\n",1095" <td>NaN</td>\n",1096" <td>NaN</td>\n",1097" <td>Si</td>\n",1098" <td>No</td>\n",1099" <td>NaN</td>\n",1100" <td>Mujer</td>\n",1101" <td>43.0</td>\n",1102" <td>NaN</td>\n",1103" <td>Casado(a)</td>\n",1104" </tr>\n",1105" <tr>\n",1106" <th>1</th>\n",1107" <td>2020</td>\n",1108" <td>06</td>\n",1109" <td>020257</td>\n",1110" <td>093</td>\n",1111" <td>11</td>\n",1112" <td>04</td>\n",1113" <td>250107</td>\n",1114" <td>Selva</td>\n",1115" <td>De 100 000 a 499 999 habitantes</td>\n",1116" <td>20200202570931104</td>\n",1117" <td>Hijo(a)/Hijastro(a)</td>\n",1118" <td>NaN</td>\n",1119" <td>NaN</td>\n",1120" <td>Si</td>\n",1121" <td>No</td>\n",1122" <td>NaN</td>\n",1123" <td>Hombre</td>\n",1124" <td>17.0</td>\n",1125" <td>NaN</td>\n",1126" <td>Soltero(a)</td>\n",1127" </tr>\n",1128" <tr>\n",1129" <th>2</th>\n",1130" <td>2020</td>\n",1131" <td>06</td>\n",1132" <td>015537</td>\n",1133" <td>065</td>\n",1134" <td>11</td>\n",1135" <td>04</td>\n",1136" <td>040126</td>\n",1137" <td>Sierra Sur</td>\n",1138" <td>De 500 000 a más 
habitantes</td>\n",1139" <td>20200155370651104</td>\n",1140" <td>Hijo(a)/Hijastro(a)</td>\n",1141" <td>NaN</td>\n",1142" <td>NaN</td>\n",1143" <td>Si</td>\n",1144" <td>No</td>\n",1145" <td>NaN</td>\n",1146" <td>Mujer</td>\n",1147" <td>9.0</td>\n",1148" <td>NaN</td>\n",1149" <td>NaN</td>\n",1150" </tr>\n",1151" <tr>\n",1152" <th>3</th>\n",1153" <td>2019</td>\n",1154" <td>10</td>\n",1155" <td>010614</td>\n",1156" <td>043</td>\n",1157" <td>11</td>\n",1158" <td>07</td>\n",1159" <td>130901</td>\n",1160" <td>Sierra Norte</td>\n",1161" <td>De 20 000 a 49 999 habitantes</td>\n",1162" <td>20190106140431107</td>\n",1163" <td>Otros parientes</td>\n",1164" <td>2.0</td>\n",1165" <td>Hijo(a)</td>\n",1166" <td>No</td>\n",1167" <td>NaN</td>\n",1168" <td>No</td>\n",1169" <td>Mujer</td>\n",1170" <td>4.0</td>\n",1171" <td>NaN</td>\n",1172" <td>NaN</td>\n",1173" </tr>\n",1174" <tr>\n",1175" <th>4</th>\n",1176" <td>2020</td>\n",1177" <td>06</td>\n",1178" <td>009390</td>\n",1179" <td>096</td>\n",1180" <td>11</td>\n",1181" <td>04</td>\n",1182" <td>230110</td>\n",1183" <td>Costa Sur</td>\n",1184" <td>De 100 000 a 499 999 habitantes</td>\n",1185" <td>20180093900961104</td>\n",1186" <td>Panel</td>\n",1187" <td>NaN</td>\n",1188" <td>NaN</td>\n",1189" <td>NaN</td>\n",1190" <td>NaN</td>\n",1191" <td>NaN</td>\n",1192" <td>NaN</td>\n",1193" <td>NaN</td>\n",1194" <td>NaN</td>\n",1195" <td>NaN</td>\n",1196" </tr>\n",1197" <tr>\n",1198" <th>...</th>\n",1199" <td>...</td>\n",1200" <td>...</td>\n",1201" <td>...</td>\n",1202" <td>...</td>\n",1203" <td>...</td>\n",1204" <td>...</td>\n",1205" <td>...</td>\n",1206" <td>...</td>\n",1207" <td>...</td>\n",1208" <td>...</td>\n",1209" <td>...</td>\n",1210" <td>...</td>\n",1211" <td>...</td>\n",1212" <td>...</td>\n",1213" <td>...</td>\n",1214" <td>...</td>\n",1215" <td>...</td>\n",1216" <td>...</td>\n",1217" <td>...</td>\n",1218" <td>...</td>\n",1219" </tr>\n",1220" <tr>\n",1221" <th>85030</th>\n",1222" <td>2020</td>\n",1223" <td>12</td>\n",1224" 
<td>007337</td>\n",1225" <td>004</td>\n",1226" <td>11</td>\n",1227" <td>01</td>\n",1228" <td>140105</td>\n",1229" <td>Costa Norte</td>\n",1230" <td>De 100 000 a 499 999 habitantes</td>\n",1231" <td>20200073370041101</td>\n",1232" <td>Jefe/Jefa</td>\n",1233" <td>1.0</td>\n",1234" <td>Jefe/jefa de hogar</td>\n",1235" <td>Si</td>\n",1236" <td>No</td>\n",1237" <td>NaN</td>\n",1238" <td>Hombre</td>\n",1239" <td>65.0</td>\n",1240" <td>NaN</td>\n",1241" <td>Casado(a)</td>\n",1242" </tr>\n",1243" <tr>\n",1244" <th>85031</th>\n",1245" <td>2019</td>\n",1246" <td>04</td>\n",1247" <td>008226</td>\n",1248" <td>084</td>\n",1249" <td>13</td>\n",1250" <td>02</td>\n",1251" <td>160112</td>\n",1252" <td>Selva</td>\n",1253" <td>De 100 000 a 499 999 habitantes</td>\n",1254" <td>20190082260841302</td>\n",1255" <td>Otros no parientes</td>\n",1256" <td>0.0</td>\n",1257" <td>Jefe/jefa de hogar</td>\n",1258" <td>Si</td>\n",1259" <td>No</td>\n",1260" <td>NaN</td>\n",1261" <td>Mujer</td>\n",1262" <td>89.0</td>\n",1263" <td>NaN</td>\n",1264" <td>Viudo(a)</td>\n",1265" </tr>\n",1266" <tr>\n",1267" <th>85032</th>\n",1268" <td>2019</td>\n",1269" <td>05</td>\n",1270" <td>008965</td>\n",1271" <td>060</td>\n",1272" <td>11</td>\n",1273" <td>03</td>\n",1274" <td>210101</td>\n",1275" <td>Sierra Sur</td>\n",1276" <td>De 100 000 a 499 999 habitantes</td>\n",1277" <td>20190089650601103</td>\n",1278" <td>Hijo(a)/Hijastro(a)</td>\n",1279" <td>1.0</td>\n",1280" <td>Hijo(a)</td>\n",1281" <td>Si</td>\n",1282" <td>No</td>\n",1283" <td>NaN</td>\n",1284" <td>Hombre</td>\n",1285" <td>20.0</td>\n",1286" <td>NaN</td>\n",1287" <td>Soltero(a)</td>\n",1288" </tr>\n",1289" <tr>\n",1290" <th>85033</th>\n",1291" <td>2020</td>\n",1292" <td>05</td>\n",1293" <td>010311</td>\n",1294" <td>022</td>\n",1295" <td>11</td>\n",1296" <td>02</td>\n",1297" <td>200501</td>\n",1298" <td>Costa Norte</td>\n",1299" <td>De 50 000 a 99 999 habitantes</td>\n",1300" <td>20200103110221102</td>\n",1301" <td>Esposo(a)/compañero(a)</td>\n",1302" 
<td>NaN</td>\n",1303" <td>NaN</td>\n",1304" <td>Si</td>\n",1305" <td>No</td>\n",1306" <td>NaN</td>\n",1307" <td>Mujer</td>\n",1308" <td>48.0</td>\n",1309" <td>NaN</td>\n",1310" <td>Casado(a)</td>\n",1311" </tr>\n",1312" <tr>\n",1313" <th>85034</th>\n",1314" <td>2020</td>\n",1315" <td>11</td>\n",1316" <td>018778</td>\n",1317" <td>155</td>\n",1318" <td>11</td>\n",1319" <td>06</td>\n",1320" <td>160404</td>\n",1321" <td>Selva</td>\n",1322" <td>Área de Empadronamiento Rural (AER) Compuesto</td>\n",1323" <td>20200187781551106</td>\n",1324" <td>Hijo(a)/Hijastro(a)</td>\n",1325" <td>2.0</td>\n",1326" <td>Jefe/jefa de hogar</td>\n",1327" <td>Si</td>\n",1328" <td>No</td>\n",1329" <td>NaN</td>\n",1330" <td>Hombre</td>\n",1331" <td>22.0</td>\n",1332" <td>NaN</td>\n",1333" <td>Conviviente</td>\n",1334" </tr>\n",1335" </tbody>\n",1336"</table>\n",1337"<p>85035 rows × 20 columns</p>\n",1338"</div>"1339],1340"text/plain": [1341" year MES CONGLOME VIVIENDA HOGAR CODPERSO UBIGEO DOMINIO \\\n",1342"0 2020 06 010108 136 11 02 100111 Sierra Centro \n",1343"1 2020 06 020257 093 11 04 250107 Selva \n",1344"2 2020 06 015537 065 11 04 040126 Sierra Sur \n",1345"3 2019 10 010614 043 11 07 130901 Sierra Norte \n",1346"4 2020 06 009390 096 11 04 230110 Costa Sur \n",1347"... ... .. ... ... ... ... ... ... \n",1348"85030 2020 12 007337 004 11 01 140105 Costa Norte \n",1349"85031 2019 04 008226 084 13 02 160112 Selva \n",1350"85032 2019 05 008965 060 11 03 210101 Sierra Sur \n",1351"85033 2020 05 010311 022 11 02 200501 Costa Norte \n",1352"85034 2020 11 018778 155 11 06 160404 Selva \n",1353"\n",1354" ESTRATO P201P \\\n",1355"0 De 100 000 a 499 999 habitantes 20200101081361102 \n",1356"1 De 100 000 a 499 999 habitantes 20200202570931104 \n",1357"2 De 500 000 a más habitantes 20200155370651104 \n",1358"3 De 20 000 a 49 999 habitantes 20190106140431107 \n",1359"4 De 100 000 a 499 999 habitantes 20180093900961104 \n",1360"... ... ... 
\n",1361"85030 De 100 000 a 499 999 habitantes 20200073370041101 \n",1362"85031 De 100 000 a 499 999 habitantes 20190082260841302 \n",1363"85032 De 100 000 a 499 999 habitantes 20190089650601103 \n",1364"85033 De 50 000 a 99 999 habitantes 20200103110221102 \n",1365"85034 Área de Empadronamiento Rural (AER) Compuesto 20200187781551106 \n",1366"\n",1367" P203 P203A P203B P204 P205 P206 \\\n",1368"0 Esposo(a)/compañero(a) NaN NaN Si No NaN \n",1369"1 Hijo(a)/Hijastro(a) NaN NaN Si No NaN \n",1370"2 Hijo(a)/Hijastro(a) NaN NaN Si No NaN \n",1371"3 Otros parientes 2.0 Hijo(a) No NaN No \n",1372"4 Panel NaN NaN NaN NaN NaN \n",1373"... ... ... ... ... ... ... \n",1374"85030 Jefe/Jefa 1.0 Jefe/jefa de hogar Si No NaN \n",1375"85031 Otros no parientes 0.0 Jefe/jefa de hogar Si No NaN \n",1376"85032 Hijo(a)/Hijastro(a) 1.0 Hijo(a) Si No NaN \n",1377"85033 Esposo(a)/compañero(a) NaN NaN Si No NaN \n",1378"85034 Hijo(a)/Hijastro(a) 2.0 Jefe/jefa de hogar Si No NaN \n",1379"\n",1380" P207 P208A P208B P209 \n",1381"0 Mujer 43.0 NaN Casado(a) \n",1382"1 Hombre 17.0 NaN Soltero(a) \n",1383"2 Mujer 9.0 NaN NaN \n",1384"3 Mujer 4.0 NaN NaN \n",1385"4 NaN NaN NaN NaN \n",1386"... ... ... ... ... 
\n",1387"85030 Hombre 65.0 NaN Casado(a) \n",1388"85031 Mujer 89.0 NaN Viudo(a) \n",1389"85032 Hombre 20.0 NaN Soltero(a) \n",1390"85033 Mujer 48.0 NaN Casado(a) \n",1391"85034 Hombre 22.0 NaN Conviviente \n",1392"\n",1393"[85035 rows x 20 columns]"1394]1395},1396"execution_count": 15,1397"metadata": {},1398"output_type": "execute_result"1399}1400],1401"source": [1402"data_administrativa"1403]1404},1405{1406"cell_type": "code",1407"execution_count": 16,1408"id": "734c2f7b",1409"metadata": {},1410"outputs": [1411{1412"data": {1413"text/plain": [1414"{'DOMINIO': {1.0: 'Costa Norte',\n",1415" 2.0: 'Costa Centro',\n",1416" 3.0: 'Costa Sur',\n",1417" 4.0: 'Sierra Norte',\n",1418" 5.0: 'Sierra Centro',\n",1419" 6.0: 'Sierra Sur',\n",1420" 7.0: 'Selva',\n",1421" 8.0: 'Lima Metropolitana'},\n",1422" 'ESTRATO': {1.0: ' De 500 000 a más habitantes',\n",1423" 2.0: ' De 100 000 a 499 999 habitantes',\n",1424" 3.0: ' De 50 000 a 99 999 habitantes',\n",1425" 4.0: ' De 20 000 a 49 999 habitantes',\n",1426" 5.0: 'De 2 000 a 19 999 habitantes',\n",1427" 6.0: ' De 500 a 1 999 habitantes',\n",1428" 7.0: ' Área de Empadronamiento Rural (AER) Compuesto',\n",1429" 8.0: ' Área de Empadronamiento Rural (AER) Simple'},\n",1430" 'P203': {0.0: 'Panel',\n",1431" 1.0: 'Jefe/Jefa',\n",1432" 2.0: 'Esposo(a)/compañero(a)',\n",1433" 3.0: 'Hijo(a)/Hijastro(a)',\n",1434" 4.0: 'Yerno/Nuera',\n",1435" 5.0: 'Nieto(a)',\n",1436" 6.0: 'Padres/Suegros',\n",1437" 7.0: 'Otros parientes',\n",1438" 8.0: 'Trabajador Hogar',\n",1439" 9.0: 'Pensionista',\n",1440" 10.0: 'Otros no parientes',\n",1441" 11.0: 'Hermano(a)'},\n",1442" 'P203B': {1.0: 'Jefe/jefa de hogar',\n",1443" 2.0: 'Esposa(o)',\n",1444" 3.0: 'Hijo(a)',\n",1445" 6.0: 'Padres/suegros'},\n",1446" 'P204': {1.0: 'Si', 2.0: 'No'},\n",1447" 'P205': {1.0: 'Si', 2.0: 'No'},\n",1448" 'P206': {1.0: 'Si', 2.0: 'No'},\n",1449" 'P207': {1.0: 'Hombre', 2.0: 'Mujer'},\n",1450" 'P209': {1.0: 'Conviviente',\n",1451" 2.0: 'Casado(a)',\n",1452" 3.0: 
'Viudo(a)',\n",1453" 4.0: 'Divorciado(a)',\n",1454" 5.0: 'Separado(a)',\n",1455" 6.0: 'Soltero(a)'}}"1456]1457},1458"execution_count": 16,1459"metadata": {},1460"output_type": "execute_result"1461}1462],1463"source": [1464"labels_data_administrativa"1465]1466},1467{1468"cell_type": "code",1469"execution_count": 17,1470"id": "10327135",1471"metadata": {},1472"outputs": [1473{1474"data": {1475"text/plain": [1476"{'year': '',\n",1477" 'MES': '',\n",1478" 'CONGLOME': '',\n",1479" 'VIVIENDA': '',\n",1480" 'HOGAR': '',\n",1481" 'CODPERSO': '',\n",1482" 'UBIGEO': '',\n",1483" 'DOMINIO': 'Dominio geográfico',\n",1484" 'ESTRATO': 'Estrato geográfico',\n",1485" 'P201P': '',\n",1486" 'P203': '¿Cuál es la relación de parentesco con el jefe(a) del hogar',\n",1487" 'P203A': '',\n",1488" 'P203B': 'Relación de parentesco con el jefe(a) del núcleo familiar',\n",1489" 'P204': '¿Es miembro del hogar?',\n",1490" 'P205': '¿Se encuentra ausente del hogar 30 días o más?',\n",1491" 'P206': '¿Está presente en el hogar 30 días o más?',\n",1492" 'P207': 'Sexo',\n",1493" 'P208A': '',\n",1494" 'P208B': '',\n",1495" 'P209': '¿Cuál es su estado civil o conyugal?'}"1496]1497},1498"execution_count": 17,1499"metadata": {},1500"output_type": "execute_result"1501}1502],1503"source": [1504"var_labels_data_administrativa"1505]1506},1507{1508"cell_type": "code",1509"execution_count": 18,1510"id": "4867bdeb",1511"metadata": {},1512"outputs": [],1513"source": [1514"# adding labels to variables enapres2020_1 from pandas \n",1515"\n",1516"data_administrativa.attrs[ 'value_labels' ] = labels_data_administrativa # value's labels \n",1517"data_administrativa.attrs[ 'var_labels' ] = var_labels_data_administrativa # var labels"1518]1519},1520{1521"cell_type": "code",1522"execution_count": 19,1523"id": "f205f280",1524"metadata": {},1525"outputs": [1526{1527"data": {1528"text/html": [1529"<div>\n",1530"<style scoped>\n",1531" .dataframe tbody tr th:only-of-type {\n",1532" vertical-align: middle;\n",1533" 
}\n",1534"\n",1535" .dataframe tbody tr th {\n",1536" vertical-align: top;\n",1537" }\n",1538"\n",1539" .dataframe thead th {\n",1540" text-align: right;\n",1541" }\n",1542"</style>\n",1543"<table border=\"1\" class=\"dataframe\">\n",1544" <thead>\n",1545" <tr style=\"text-align: right;\">\n",1546" <th></th>\n",1547" <th>year</th>\n",1548" <th>MES</th>\n",1549" <th>CONGLOME</th>\n",1550" <th>VIVIENDA</th>\n",1551" <th>HOGAR</th>\n",1552" <th>CODPERSO</th>\n",1553" <th>UBIGEO</th>\n",1554" <th>DOMINIO</th>\n",1555" <th>ESTRATO</th>\n",1556" <th>P201P</th>\n",1557" <th>P203</th>\n",1558" <th>P203A</th>\n",1559" <th>P203B</th>\n",1560" <th>P204</th>\n",1561" <th>P205</th>\n",1562" <th>P206</th>\n",1563" <th>P207</th>\n",1564" <th>P208A</th>\n",1565" <th>P208B</th>\n",1566" <th>P209</th>\n",1567" </tr>\n",1568" </thead>\n",1569" <tbody>\n",1570" <tr>\n",1571" <th>0</th>\n",1572" <td>2020</td>\n",1573" <td>06</td>\n",1574" <td>010108</td>\n",1575" <td>136</td>\n",1576" <td>11</td>\n",1577" <td>02</td>\n",1578" <td>100111</td>\n",1579" <td>Sierra Centro</td>\n",1580" <td>De 100 000 a 499 999 habitantes</td>\n",1581" <td>20200101081361102</td>\n",1582" <td>Esposo(a)/compañero(a)</td>\n",1583" <td>NaN</td>\n",1584" <td>NaN</td>\n",1585" <td>Si</td>\n",1586" <td>No</td>\n",1587" <td>NaN</td>\n",1588" <td>Mujer</td>\n",1589" <td>43.0</td>\n",1590" <td>NaN</td>\n",1591" <td>Casado(a)</td>\n",1592" </tr>\n",1593" <tr>\n",1594" <th>1</th>\n",1595" <td>2020</td>\n",1596" <td>06</td>\n",1597" <td>020257</td>\n",1598" <td>093</td>\n",1599" <td>11</td>\n",1600" <td>04</td>\n",1601" <td>250107</td>\n",1602" <td>Selva</td>\n",1603" <td>De 100 000 a 499 999 habitantes</td>\n",1604" <td>20200202570931104</td>\n",1605" <td>Hijo(a)/Hijastro(a)</td>\n",1606" <td>NaN</td>\n",1607" <td>NaN</td>\n",1608" <td>Si</td>\n",1609" <td>No</td>\n",1610" <td>NaN</td>\n",1611" <td>Hombre</td>\n",1612" <td>17.0</td>\n",1613" <td>NaN</td>\n",1614" <td>Soltero(a)</td>\n",1615" </tr>\n",1616" 
<tr>\n",1617" <th>2</th>\n",1618" <td>2020</td>\n",1619" <td>06</td>\n",1620" <td>015537</td>\n",1621" <td>065</td>\n",1622" <td>11</td>\n",1623" <td>04</td>\n",1624" <td>040126</td>\n",1625" <td>Sierra Sur</td>\n",1626" <td>De 500 000 a más habitantes</td>\n",1627" <td>20200155370651104</td>\n",1628" <td>Hijo(a)/Hijastro(a)</td>\n",1629" <td>NaN</td>\n",1630" <td>NaN</td>\n",1631" <td>Si</td>\n",1632" <td>No</td>\n",1633" <td>NaN</td>\n",1634" <td>Mujer</td>\n",1635" <td>9.0</td>\n",1636" <td>NaN</td>\n",1637" <td>NaN</td>\n",1638" </tr>\n",1639" <tr>\n",1640" <th>3</th>\n",1641" <td>2019</td>\n",1642" <td>10</td>\n",1643" <td>010614</td>\n",1644" <td>043</td>\n",1645" <td>11</td>\n",1646" <td>07</td>\n",1647" <td>130901</td>\n",1648" <td>Sierra Norte</td>\n",1649" <td>De 20 000 a 49 999 habitantes</td>\n",1650" <td>20190106140431107</td>\n",1651" <td>Otros parientes</td>\n",1652" <td>2.0</td>\n",1653" <td>Hijo(a)</td>\n",1654" <td>No</td>\n",1655" <td>NaN</td>\n",1656" <td>No</td>\n",1657" <td>Mujer</td>\n",1658" <td>4.0</td>\n",1659" <td>NaN</td>\n",1660" <td>NaN</td>\n",1661" </tr>\n",1662" <tr>\n",1663" <th>4</th>\n",1664" <td>2020</td>\n",1665" <td>06</td>\n",1666" <td>009390</td>\n",1667" <td>096</td>\n",1668" <td>11</td>\n",1669" <td>04</td>\n",1670" <td>230110</td>\n",1671" <td>Costa Sur</td>\n",1672" <td>De 100 000 a 499 999 habitantes</td>\n",1673" <td>20180093900961104</td>\n",1674" <td>Panel</td>\n",1675" <td>NaN</td>\n",1676" <td>NaN</td>\n",1677" <td>NaN</td>\n",1678" <td>NaN</td>\n",1679" <td>NaN</td>\n",1680" <td>NaN</td>\n",1681" <td>NaN</td>\n",1682" <td>NaN</td>\n",1683" <td>NaN</td>\n",1684" </tr>\n",1685" <tr>\n",1686" <th>...</th>\n",1687" <td>...</td>\n",1688" <td>...</td>\n",1689" <td>...</td>\n",1690" <td>...</td>\n",1691" <td>...</td>\n",1692" <td>...</td>\n",1693" <td>...</td>\n",1694" <td>...</td>\n",1695" <td>...</td>\n",1696" <td>...</td>\n",1697" <td>...</td>\n",1698" <td>...</td>\n",1699" <td>...</td>\n",1700" <td>...</td>\n",1701" 
<td>...</td>\n",1702" <td>...</td>\n",1703" <td>...</td>\n",1704" <td>...</td>\n",1705" <td>...</td>\n",1706" <td>...</td>\n",1707" </tr>\n",1708" <tr>\n",1709" <th>85030</th>\n",1710" <td>2020</td>\n",1711" <td>12</td>\n",1712" <td>007337</td>\n",1713" <td>004</td>\n",1714" <td>11</td>\n",1715" <td>01</td>\n",1716" <td>140105</td>\n",1717" <td>Costa Norte</td>\n",1718" <td>De 100 000 a 499 999 habitantes</td>\n",1719" <td>20200073370041101</td>\n",1720" <td>Jefe/Jefa</td>\n",1721" <td>1.0</td>\n",1722" <td>Jefe/jefa de hogar</td>\n",1723" <td>Si</td>\n",1724" <td>No</td>\n",1725" <td>NaN</td>\n",1726" <td>Hombre</td>\n",1727" <td>65.0</td>\n",1728" <td>NaN</td>\n",1729" <td>Casado(a)</td>\n",1730" </tr>\n",1731" <tr>\n",1732" <th>85031</th>\n",1733" <td>2019</td>\n",1734" <td>04</td>\n",1735" <td>008226</td>\n",1736" <td>084</td>\n",1737" <td>13</td>\n",1738" <td>02</td>\n",1739" <td>160112</td>\n",1740" <td>Selva</td>\n",1741" <td>De 100 000 a 499 999 habitantes</td>\n",1742" <td>20190082260841302</td>\n",1743" <td>Otros no parientes</td>\n",1744" <td>0.0</td>\n",1745" <td>Jefe/jefa de hogar</td>\n",1746" <td>Si</td>\n",1747" <td>No</td>\n",1748" <td>NaN</td>\n",1749" <td>Mujer</td>\n",1750" <td>89.0</td>\n",1751" <td>NaN</td>\n",1752" <td>Viudo(a)</td>\n",1753" </tr>\n",1754" <tr>\n",1755" <th>85032</th>\n",1756" <td>2019</td>\n",1757" <td>05</td>\n",1758" <td>008965</td>\n",1759" <td>060</td>\n",1760" <td>11</td>\n",1761" <td>03</td>\n",1762" <td>210101</td>\n",1763" <td>Sierra Sur</td>\n",1764" <td>De 100 000 a 499 999 habitantes</td>\n",1765" <td>20190089650601103</td>\n",1766" <td>Hijo(a)/Hijastro(a)</td>\n",1767" <td>1.0</td>\n",1768" <td>Hijo(a)</td>\n",1769" <td>Si</td>\n",1770" <td>No</td>\n",1771" <td>NaN</td>\n",1772" <td>Hombre</td>\n",1773" <td>20.0</td>\n",1774" <td>NaN</td>\n",1775" <td>Soltero(a)</td>\n",1776" </tr>\n",1777" <tr>\n",1778" <th>85033</th>\n",1779" <td>2020</td>\n",1780" <td>05</td>\n",1781" <td>010311</td>\n",1782" 
<td>022</td>\n",1783" <td>11</td>\n",1784" <td>02</td>\n",1785" <td>200501</td>\n",1786" <td>Costa Norte</td>\n",1787" <td>De 50 000 a 99 999 habitantes</td>\n",1788" <td>20200103110221102</td>\n",1789" <td>Esposo(a)/compañero(a)</td>\n",1790" <td>NaN</td>\n",1791" <td>NaN</td>\n",1792" <td>Si</td>\n",1793" <td>No</td>\n",1794" <td>NaN</td>\n",1795" <td>Mujer</td>\n",1796" <td>48.0</td>\n",1797" <td>NaN</td>\n",1798" <td>Casado(a)</td>\n",1799" </tr>\n",1800" <tr>\n",1801" <th>85034</th>\n",1802" <td>2020</td>\n",1803" <td>11</td>\n",1804" <td>018778</td>\n",1805" <td>155</td>\n",1806" <td>11</td>\n",1807" <td>06</td>\n",1808" <td>160404</td>\n",1809" <td>Selva</td>\n",1810" <td>Área de Empadronamiento Rural (AER) Compuesto</td>\n",1811" <td>20200187781551106</td>\n",1812" <td>Hijo(a)/Hijastro(a)</td>\n",1813" <td>2.0</td>\n",1814" <td>Jefe/jefa de hogar</td>\n",1815" <td>Si</td>\n",1816" <td>No</td>\n",1817" <td>NaN</td>\n",1818" <td>Hombre</td>\n",1819" <td>22.0</td>\n",1820" <td>NaN</td>\n",1821" <td>Conviviente</td>\n",1822" </tr>\n",1823" </tbody>\n",1824"</table>\n",1825"<p>85035 rows × 20 columns</p>\n",1826"</div>"1827],1828"text/plain": [1829" year MES CONGLOME VIVIENDA HOGAR CODPERSO UBIGEO DOMINIO \\\n",1830"0 2020 06 010108 136 11 02 100111 Sierra Centro \n",1831"1 2020 06 020257 093 11 04 250107 Selva \n",1832"2 2020 06 015537 065 11 04 040126 Sierra Sur \n",1833"3 2019 10 010614 043 11 07 130901 Sierra Norte \n",1834"4 2020 06 009390 096 11 04 230110 Costa Sur \n",1835"... ... .. ... ... ... ... ... ... 
\n",1836"85030 2020 12 007337 004 11 01 140105 Costa Norte \n",1837"85031 2019 04 008226 084 13 02 160112 Selva \n",1838"85032 2019 05 008965 060 11 03 210101 Sierra Sur \n",1839"85033 2020 05 010311 022 11 02 200501 Costa Norte \n",1840"85034 2020 11 018778 155 11 06 160404 Selva \n",1841"\n",1842" ESTRATO P201P \\\n",1843"0 De 100 000 a 499 999 habitantes 20200101081361102 \n",1844"1 De 100 000 a 499 999 habitantes 20200202570931104 \n",1845"2 De 500 000 a más habitantes 20200155370651104 \n",1846"3 De 20 000 a 49 999 habitantes 20190106140431107 \n",1847"4 De 100 000 a 499 999 habitantes 20180093900961104 \n",1848"... ... ... \n",1849"85030 De 100 000 a 499 999 habitantes 20200073370041101 \n",1850"85031 De 100 000 a 499 999 habitantes 20190082260841302 \n",1851"85032 De 100 000 a 499 999 habitantes 20190089650601103 \n",1852"85033 De 50 000 a 99 999 habitantes 20200103110221102 \n",1853"85034 Área de Empadronamiento Rural (AER) Compuesto 20200187781551106 \n",1854"\n",1855" P203 P203A P203B P204 P205 P206 \\\n",1856"0 Esposo(a)/compañero(a) NaN NaN Si No NaN \n",1857"1 Hijo(a)/Hijastro(a) NaN NaN Si No NaN \n",1858"2 Hijo(a)/Hijastro(a) NaN NaN Si No NaN \n",1859"3 Otros parientes 2.0 Hijo(a) No NaN No \n",1860"4 Panel NaN NaN NaN NaN NaN \n",1861"... ... ... ... ... ... ... \n",1862"85030 Jefe/Jefa 1.0 Jefe/jefa de hogar Si No NaN \n",1863"85031 Otros no parientes 0.0 Jefe/jefa de hogar Si No NaN \n",1864"85032 Hijo(a)/Hijastro(a) 1.0 Hijo(a) Si No NaN \n",1865"85033 Esposo(a)/compañero(a) NaN NaN Si No NaN \n",1866"85034 Hijo(a)/Hijastro(a) 2.0 Jefe/jefa de hogar Si No NaN \n",1867"\n",1868" P207 P208A P208B P209 \n",1869"0 Mujer 43.0 NaN Casado(a) \n",1870"1 Hombre 17.0 NaN Soltero(a) \n",1871"2 Mujer 9.0 NaN NaN \n",1872"3 Mujer 4.0 NaN NaN \n",1873"4 NaN NaN NaN NaN \n",1874"... ... ... ... ... 
\n",1875"85030 Hombre 65.0 NaN Casado(a) \n",1876"85031 Mujer 89.0 NaN Viudo(a) \n",1877"85032 Hombre 20.0 NaN Soltero(a) \n",1878"85033 Mujer 48.0 NaN Casado(a) \n",1879"85034 Hombre 22.0 NaN Conviviente \n",1880"\n",1881"[85035 rows x 20 columns]"1882]1883},1884"execution_count": 19,1885"metadata": {},1886"output_type": "execute_result"1887}1888],1889"source": [1890"data_administrativa"1891]1892},1893{1894"cell_type": "code",1895"execution_count": 20,1896"id": "5a21ed2d",1897"metadata": {},1898"outputs": [1899{1900"data": {1901"text/html": [1902"<div>\n",1903"<style scoped>\n",1904" .dataframe tbody tr th:only-of-type {\n",1905" vertical-align: middle;\n",1906" }\n",1907"\n",1908" .dataframe tbody tr th {\n",1909" vertical-align: top;\n",1910" }\n",1911"\n",1912" .dataframe thead th {\n",1913" text-align: right;\n",1914" }\n",1915"</style>\n",1916"<table border=\"1\" class=\"dataframe\">\n",1917" <thead>\n",1918" <tr style=\"text-align: right;\">\n",1919" <th></th>\n",1920" <th>year</th>\n",1921" <th>MES</th>\n",1922" <th>CONGLOME</th>\n",1923" <th>VIVIENDA</th>\n",1924" <th>HOGAR</th>\n",1925" <th>CODPERSO</th>\n",1926" <th>UBIGEO</th>\n",1927" <th>DOMINIO</th>\n",1928" <th>ESTRATO</th>\n",1929" <th>P201P</th>\n",1930" <th>P203</th>\n",1931" <th>P203A</th>\n",1932" <th>P203B</th>\n",1933" <th>P204</th>\n",1934" <th>P205</th>\n",1935" <th>P206</th>\n",1936" <th>P207</th>\n",1937" <th>P208A</th>\n",1938" <th>P208B</th>\n",1939" <th>P209</th>\n",1940" </tr>\n",1941" </thead>\n",1942" <tbody>\n",1943" <tr>\n",1944" <th>3</th>\n",1945" <td>2019</td>\n",1946" <td>10</td>\n",1947" <td>010614</td>\n",1948" <td>043</td>\n",1949" <td>11</td>\n",1950" <td>07</td>\n",1951" <td>130901</td>\n",1952" <td>Sierra Norte</td>\n",1953" <td>De 20 000 a 49 999 habitantes</td>\n",1954" <td>20190106140431107</td>\n",1955" <td>Otros parientes</td>\n",1956" <td>2.0</td>\n",1957" <td>Hijo(a)</td>\n",1958" <td>No</td>\n",1959" <td>NaN</td>\n",1960" <td>No</td>\n",1961" 
<td>Mujer</td>\n",1962" <td>4.0</td>\n",1963" <td>NaN</td>\n",1964" <td>NaN</td>\n",1965" </tr>\n",1966" <tr>\n",1967" <th>5</th>\n",1968" <td>2019</td>\n",1969" <td>03</td>\n",1970" <td>008010</td>\n",1971" <td>059</td>\n",1972" <td>11</td>\n",1973" <td>03</td>\n",1974" <td>150801</td>\n",1975" <td>Costa Centro</td>\n",1976" <td>De 100 000 a 499 999 habitantes</td>\n",1977" <td>20190080100591103</td>\n",1978" <td>Otros parientes</td>\n",1979" <td>1.0</td>\n",1980" <td>Hijo(a)</td>\n",1981" <td>Si</td>\n",1982" <td>No</td>\n",1983" <td>NaN</td>\n",1984" <td>Hombre</td>\n",1985" <td>32.0</td>\n",1986" <td>NaN</td>\n",1987" <td>Soltero(a)</td>\n",1988" </tr>\n",1989" <tr>\n",1990" <th>24</th>\n",1991" <td>2019</td>\n",1992" <td>07</td>\n",1993" <td>009625</td>\n",1994" <td>071</td>\n",1995" <td>11</td>\n",1996" <td>01</td>\n",1997" <td>250105</td>\n",1998" <td>Selva</td>\n",1999" <td>De 100 000 a 499 999 habitantes</td>\n",2000" <td>20190096250711101</td>\n",2001" <td>Jefe/Jefa</td>\n",2002" <td>1.0</td>\n",2003" <td>Jefe/jefa de hogar</td>\n",2004" <td>Si</td>\n",2005" <td>No</td>\n",2006" <td>NaN</td>\n",2007" <td>Hombre</td>\n",2008" <td>64.0</td>\n",2009" <td>NaN</td>\n",2010" <td>Conviviente</td>\n",2011" </tr>\n",2012" <tr>\n",2013" <th>33</th>\n",2014" <td>2020</td>\n",2015" <td>07</td>\n",2016" <td>010368</td>\n",2017" <td>081</td>\n",2018" <td>11</td>\n",2019" <td>04</td>\n",2020" <td>230104</td>\n",2021" <td>Costa Sur</td>\n",2022" <td>De 100 000 a 499 999 habitantes</td>\n",2023" <td>20180103680811105</td>\n",2024" <td>Hijo(a)/Hijastro(a)</td>\n",2025" <td>NaN</td>\n",2026" <td>NaN</td>\n",2027" <td>Si</td>\n",2028" <td>No</td>\n",2029" <td>NaN</td>\n",2030" <td>Hombre</td>\n",2031" <td>14.0</td>\n",2032" <td>NaN</td>\n",2033" <td>Soltero(a)</td>\n",2034" </tr>\n",2035" <tr>\n",2036" <th>52</th>\n",2037" <td>2019</td>\n",2038" <td>12</td>\n",2039" <td>005867</td>\n",2040" <td>034</td>\n",2041" <td>11</td>\n",2042" <td>02</td>\n",2043" 
<td>060101</td>\n",2044" <td>Sierra Norte</td>\n",2045" <td>De 100 000 a 499 999 habitantes</td>\n",2046" <td>20170058670341102</td>\n",2047" <td>Esposo(a)/compañero(a)</td>\n",2048" <td>1.0</td>\n",2049" <td>Esposa(o)</td>\n",2050" <td>Si</td>\n",2051" <td>No</td>\n",2052" <td>NaN</td>\n",2053" <td>Mujer</td>\n",2054" <td>53.0</td>\n",2055" <td>NaN</td>\n",2056" <td>Casado(a)</td>\n",2057" </tr>\n",2058" <tr>\n",2059" <th>...</th>\n",2060" <td>...</td>\n",2061" <td>...</td>\n",2062" <td>...</td>\n",2063" <td>...</td>\n",2064" <td>...</td>\n",2065" <td>...</td>\n",2066" <td>...</td>\n",2067" <td>...</td>\n",2068" <td>...</td>\n",2069" <td>...</td>\n",2070" <td>...</td>\n",2071" <td>...</td>\n",2072" <td>...</td>\n",2073" <td>...</td>\n",2074" <td>...</td>\n",2075" <td>...</td>\n",2076" <td>...</td>\n",2077" <td>...</td>\n",2078" <td>...</td>\n",2079" <td>...</td>\n",2080" </tr>\n",2081" <tr>\n",2082" <th>84940</th>\n",2083" <td>2019</td>\n",2084" <td>12</td>\n",2085" <td>008253</td>\n",2086" <td>047</td>\n",2087" <td>11</td>\n",2088" <td>01</td>\n",2089" <td>160113</td>\n",2090" <td>Selva</td>\n",2091" <td>De 100 000 a 499 999 habitantes</td>\n",2092" <td>20170082530471101</td>\n",2093" <td>Jefe/Jefa</td>\n",2094" <td>1.0</td>\n",2095" <td>Jefe/jefa de hogar</td>\n",2096" <td>Si</td>\n",2097" <td>No</td>\n",2098" <td>NaN</td>\n",2099" <td>Hombre</td>\n",2100" <td>80.0</td>\n",2101" <td>NaN</td>\n",2102" <td>Conviviente</td>\n",2103" </tr>\n",2104" <tr>\n",2105" <th>84945</th>\n",2106" <td>2019</td>\n",2107" <td>06</td>\n",2108" <td>007982</td>\n",2109" <td>008</td>\n",2110" <td>11</td>\n",2111" <td>02</td>\n",2112" <td>150202</td>\n",2113" <td>Costa Centro</td>\n",2114" <td>De 20 000 a 49 999 habitantes</td>\n",2115" <td>20170079820081102</td>\n",2116" <td>Hijo(a)/Hijastro(a)</td>\n",2117" <td>1.0</td>\n",2118" <td>Hijo(a)</td>\n",2119" <td>Si</td>\n",2120" <td>No</td>\n",2121" <td>NaN</td>\n",2122" <td>Hombre</td>\n",2123" <td>19.0</td>\n",2124" 
<td>NaN</td>\n",2125" <td>Soltero(a)</td>\n",2126" </tr>\n",2127" <tr>\n",2128" <th>84975</th>\n",2129" <td>2020</td>\n",2130" <td>09</td>\n",2131" <td>007221</td>\n",2132" <td>043</td>\n",2133" <td>11</td>\n",2134" <td>03</td>\n",2135" <td>130901</td>\n",2136" <td>Sierra Norte</td>\n",2137" <td>De 20 000 a 49 999 habitantes</td>\n",2138" <td>20170072210431103</td>\n",2139" <td>Yerno/Nuera</td>\n",2140" <td>NaN</td>\n",2141" <td>NaN</td>\n",2142" <td>Si</td>\n",2143" <td>No</td>\n",2144" <td>NaN</td>\n",2145" <td>Hombre</td>\n",2146" <td>38.0</td>\n",2147" <td>NaN</td>\n",2148" <td>Conviviente</td>\n",2149" </tr>\n",2150" <tr>\n",2151" <th>84982</th>\n",2152" <td>2019</td>\n",2153" <td>07</td>\n",2154" <td>008806</td>\n",2155" <td>114</td>\n",2156" <td>11</td>\n",2157" <td>04</td>\n",2158" <td>200701</td>\n",2159" <td>Costa Norte</td>\n",2160" <td>De 50 000 a 99 999 habitantes</td>\n",2161" <td>20170088061141104</td>\n",2162" <td>Nieto(a)</td>\n",2163" <td>2.0</td>\n",2164" <td>Hijo(a)</td>\n",2165" <td>Si</td>\n",2166" <td>No</td>\n",2167" <td>NaN</td>\n",2168" <td>Hombre</td>\n",2169" <td>6.0</td>\n",2170" <td>NaN</td>\n",2171" <td>NaN</td>\n",2172" </tr>\n",2173" <tr>\n",2174" <th>85000</th>\n",2175" <td>2020</td>\n",2176" <td>02</td>\n",2177" <td>009338</td>\n",2178" <td>017</td>\n",2179" <td>11</td>\n",2180" <td>03</td>\n",2181" <td>230108</td>\n",2182" <td>Costa Sur</td>\n",2183" <td>De 100 000 a 499 999 habitantes</td>\n",2184" <td>20190093380171103</td>\n",2185" <td>Hijo(a)/Hijastro(a)</td>\n",2186" <td>1.0</td>\n",2187" <td>Hijo(a)</td>\n",2188" <td>Si</td>\n",2189" <td>No</td>\n",2190" <td>NaN</td>\n",2191" <td>Hombre</td>\n",2192" <td>25.0</td>\n",2193" <td>NaN</td>\n",2194" <td>Soltero(a)</td>\n",2195" </tr>\n",2196" </tbody>\n",2197"</table>\n",2198"<p>8270 rows × 20 columns</p>\n",2199"</div>"2200],2201"text/plain": [2202" year MES CONGLOME VIVIENDA HOGAR CODPERSO UBIGEO DOMINIO \\\n",2203"3 2019 10 010614 043 11 07 130901 Sierra Norte \n",2204"5 2019 
03 008010 059 11 03 150801 Costa Centro \n",2205"24 2019 07 009625 071 11 01 250105 Selva \n",2206"33 2020 07 010368 081 11 04 230104 Costa Sur \n",2207"52 2019 12 005867 034 11 02 060101 Sierra Norte \n",2208"... ... .. ... ... ... ... ... ... \n",2209"84940 2019 12 008253 047 11 01 160113 Selva \n",2210"84945 2019 06 007982 008 11 02 150202 Costa Centro \n",2211"84975 2020 09 007221 043 11 03 130901 Sierra Norte \n",2212"84982 2019 07 008806 114 11 04 200701 Costa Norte \n",2213"85000 2020 02 009338 017 11 03 230108 Costa Sur \n",2214"\n",2215" ESTRATO P201P \\\n",2216"3 De 20 000 a 49 999 habitantes 20190106140431107 \n",2217"5 De 100 000 a 499 999 habitantes 20190080100591103 \n",2218"24 De 100 000 a 499 999 habitantes 20190096250711101 \n",2219"33 De 100 000 a 499 999 habitantes 20180103680811105 \n",2220"52 De 100 000 a 499 999 habitantes 20170058670341102 \n",2221"... ... ... \n",2222"84940 De 100 000 a 499 999 habitantes 20170082530471101 \n",2223"84945 De 20 000 a 49 999 habitantes 20170079820081102 \n",2224"84975 De 20 000 a 49 999 habitantes 20170072210431103 \n",2225"84982 De 50 000 a 99 999 habitantes 20170088061141104 \n",2226"85000 De 100 000 a 499 999 habitantes 20190093380171103 \n",2227"\n",2228" P203 P203A P203B P204 P205 P206 \\\n",2229"3 Otros parientes 2.0 Hijo(a) No NaN No \n",2230"5 Otros parientes 1.0 Hijo(a) Si No NaN \n",2231"24 Jefe/Jefa 1.0 Jefe/jefa de hogar Si No NaN \n",2232"33 Hijo(a)/Hijastro(a) NaN NaN Si No NaN \n",2233"52 Esposo(a)/compañero(a) 1.0 Esposa(o) Si No NaN \n",2234"... ... ... ... ... ... ... 
\n",2235"84940 Jefe/Jefa 1.0 Jefe/jefa de hogar Si No NaN \n",2236"84945 Hijo(a)/Hijastro(a) 1.0 Hijo(a) Si No NaN \n",2237"84975 Yerno/Nuera NaN NaN Si No NaN \n",2238"84982 Nieto(a) 2.0 Hijo(a) Si No NaN \n",2239"85000 Hijo(a)/Hijastro(a) 1.0 Hijo(a) Si No NaN \n",2240"\n",2241" P207 P208A P208B P209 \n",2242"3 Mujer 4.0 NaN NaN \n",2243"5 Hombre 32.0 NaN Soltero(a) \n",2244"24 Hombre 64.0 NaN Conviviente \n",2245"33 Hombre 14.0 NaN Soltero(a) \n",2246"52 Mujer 53.0 NaN Casado(a) \n",2247"... ... ... ... ... \n",2248"84940 Hombre 80.0 NaN Conviviente \n",2249"84945 Hombre 19.0 NaN Soltero(a) \n",2250"84975 Hombre 38.0 NaN Conviviente \n",2251"84982 Hombre 6.0 NaN NaN \n",2252"85000 Hombre 25.0 NaN Soltero(a) \n",2253"\n",2254"[8270 rows x 20 columns]"2255]2256},2257"execution_count": 20,2258"metadata": {},2259"output_type": "execute_result"2260}2261],2262"source": [2263"# Se le pide detectar personas que fueran entrevistadas en ambos años. \n",2264"# para ello, se pide detectar duplicados a partir del identificador por persona : \n",2265"# conglome, vivienda, hogar y codperso.\n",2266"\n",2267"data_administrativa[ data_administrativa.loc[:, ['CONGLOME' , 'VIVIENDA', 'HOGAR', 'CODPERSO']].duplicated(keep = False) ]\n"2268]2269},2270{2271"cell_type": "code",2272"execution_count": 21,2273"id": "9171167c",2274"metadata": {2275"scrolled": true2276},2277"outputs": [2278{2279"data": {2280"text/html": [2281"<div>\n",2282"<style scoped>\n",2283" .dataframe tbody tr th:only-of-type {\n",2284" vertical-align: middle;\n",2285" }\n",2286"\n",2287" .dataframe tbody tr th {\n",2288" vertical-align: top;\n",2289" }\n",2290"\n",2291" .dataframe thead th {\n",2292" text-align: right;\n",2293" }\n",2294"</style>\n",2295"<table border=\"1\" class=\"dataframe\">\n",2296" <thead>\n",2297" <tr style=\"text-align: right;\">\n",2298" <th></th>\n",2299" <th>year</th>\n",2300" <th>MES</th>\n",2301" <th>CONGLOME</th>\n",2302" <th>VIVIENDA</th>\n",2303" <th>HOGAR</th>\n",2304" 
<th>CODPERSO</th>\n",2305" <th>UBIGEO</th>\n",2306" <th>DOMINIO</th>\n",2307" <th>ESTRATO</th>\n",2308" <th>P201P</th>\n",2309" <th>P203</th>\n",2310" <th>P203A</th>\n",2311" <th>P203B</th>\n",2312" <th>P204</th>\n",2313" <th>P205</th>\n",2314" <th>P206</th>\n",2315" <th>P207</th>\n",2316" <th>P208A</th>\n",2317" <th>P208B</th>\n",2318" <th>P209</th>\n",2319" </tr>\n",2320" </thead>\n",2321" <tbody>\n",2322" <tr>\n",2323" <th>56662</th>\n",2324" <td>2019</td>\n",2325" <td>04</td>\n",2326" <td>005031</td>\n",2327" <td>101</td>\n",2328" <td>11</td>\n",2329" <td>01</td>\n",2330" <td>010201</td>\n",2331" <td>Selva</td>\n",2332" <td>De 20 000 a 49 999 habitantes</td>\n",2333" <td>20190050311011101</td>\n",2334" <td>Jefe/Jefa</td>\n",2335" <td>1.0</td>\n",2336" <td>Jefe/jefa de hogar</td>\n",2337" <td>Si</td>\n",2338" <td>No</td>\n",2339" <td>NaN</td>\n",2340" <td>Hombre</td>\n",2341" <td>45.0</td>\n",2342" <td>NaN</td>\n",2343" <td>Casado(a)</td>\n",2344" </tr>\n",2345" <tr>\n",2346" <th>70184</th>\n",2347" <td>2019</td>\n",2348" <td>02</td>\n",2349" <td>005024</td>\n",2350" <td>003</td>\n",2351" <td>11</td>\n",2352" <td>07</td>\n",2353" <td>010401</td>\n",2354" <td>Selva</td>\n",2355" <td>De 2 000 a 19 999 habitantes</td>\n",2356" <td>20150050240031105</td>\n",2357" <td>Hijo(a)/Hijastro(a)</td>\n",2358" <td>1.0</td>\n",2359" <td>Hijo(a)</td>\n",2360" <td>Si</td>\n",2361" <td>Si</td>\n",2362" <td>NaN</td>\n",2363" <td>Mujer</td>\n",2364" <td>18.0</td>\n",2365" <td>NaN</td>\n",2366" <td>Soltero(a)</td>\n",2367" </tr>\n",2368" <tr>\n",2369" <th>49277</th>\n",2370" <td>2019</td>\n",2371" <td>11</td>\n",2372" <td>009172</td>\n",2373" <td>119</td>\n",2374" <td>11</td>\n",2375" <td>02</td>\n",2376" <td>220501</td>\n",2377" <td>Selva</td>\n",2378" <td>De 2 000 a 19 999 habitantes</td>\n",2379" <td>20160091721191102</td>\n",2380" <td>Esposo(a)/compañero(a)</td>\n",2381" <td>1.0</td>\n",2382" <td>Esposa(o)</td>\n",2383" <td>Si</td>\n",2384" <td>No</td>\n",2385" 
<td>NaN</td>\n",2386" <td>Mujer</td>\n",2387" <td>32.0</td>\n",2388" <td>NaN</td>\n",2389" <td>Conviviente</td>\n",2390" </tr>\n",2391" <tr>\n",2392" <th>49275</th>\n",2393" <td>2019</td>\n",2394" <td>12</td>\n",2395" <td>005011</td>\n",2396" <td>031</td>\n",2397" <td>11</td>\n",2398" <td>01</td>\n",2399" <td>010101</td>\n",2400" <td>Sierra Norte</td>\n",2401" <td>De 20 000 a 49 999 habitantes</td>\n",2402" <td>20190050110311101</td>\n",2403" <td>Jefe/Jefa</td>\n",2404" <td>1.0</td>\n",2405" <td>Jefe/jefa de hogar</td>\n",2406" <td>Si</td>\n",2407" <td>No</td>\n",2408" <td>NaN</td>\n",2409" <td>Hombre</td>\n",2410" <td>58.0</td>\n",2411" <td>NaN</td>\n",2412" <td>Casado(a)</td>\n",2413" </tr>\n",2414" <tr>\n",2415" <th>70179</th>\n",2416" <td>2019</td>\n",2417" <td>01</td>\n",2418" <td>008006</td>\n",2419" <td>091</td>\n",2420" <td>11</td>\n",2421" <td>03</td>\n",2422" <td>150801</td>\n",2423" <td>Costa Centro</td>\n",2424" <td>De 100 000 a 499 999 habitantes</td>\n",2425" <td>20190080060911103</td>\n",2426" <td>Hijo(a)/Hijastro(a)</td>\n",2427" <td>1.0</td>\n",2428" <td>Hijo(a)</td>\n",2429" <td>Si</td>\n",2430" <td>No</td>\n",2431" <td>NaN</td>\n",2432" <td>Hombre</td>\n",2433" <td>19.0</td>\n",2434" <td>NaN</td>\n",2435" <td>Soltero(a)</td>\n",2436" </tr>\n",2437" <tr>\n",2438" <th>...</th>\n",2439" <td>...</td>\n",2440" <td>...</td>\n",2441" <td>...</td>\n",2442" <td>...</td>\n",2443" <td>...</td>\n",2444" <td>...</td>\n",2445" <td>...</td>\n",2446" <td>...</td>\n",2447" <td>...</td>\n",2448" <td>...</td>\n",2449" <td>...</td>\n",2450" <td>...</td>\n",2451" <td>...</td>\n",2452" <td>...</td>\n",2453" <td>...</td>\n",2454" <td>...</td>\n",2455" <td>...</td>\n",2456" <td>...</td>\n",2457" <td>...</td>\n",2458" <td>...</td>\n",2459" </tr>\n",2460" <tr>\n",2461" <th>37969</th>\n",2462" <td>2020</td>\n",2463" <td>04</td>\n",2464" <td>016182</td>\n",2465" <td>079</td>\n",2466" <td>11</td>\n",2467" <td>01</td>\n",2468" <td>070102</td>\n",2469" <td>Lima 
Metropolitana</td>\n",2470" <td>De 500 000 a más habitantes</td>\n",2471" <td>20200161820791101</td>\n",2472" <td>Jefe/Jefa</td>\n",2473" <td>NaN</td>\n",2474" <td>NaN</td>\n",2475" <td>Si</td>\n",2476" <td>No</td>\n",2477" <td>NaN</td>\n",2478" <td>Mujer</td>\n",2479" <td>43.0</td>\n",2480" <td>NaN</td>\n",2481" <td>Casado(a)</td>\n",2482" </tr>\n",2483" <tr>\n",2484" <th>37970</th>\n",2485" <td>2020</td>\n",2486" <td>11</td>\n",2487" <td>016370</td>\n",2488" <td>028</td>\n",2489" <td>11</td>\n",2490" <td>02</td>\n",2491" <td>080106</td>\n",2492" <td>Sierra Sur</td>\n",2493" <td>De 100 000 a 499 999 habitantes</td>\n",2494" <td>20200163700281102</td>\n",2495" <td>Hijo(a)/Hijastro(a)</td>\n",2496" <td>1.0</td>\n",2497" <td>Hijo(a)</td>\n",2498" <td>Si</td>\n",2499" <td>No</td>\n",2500" <td>NaN</td>\n",2501" <td>Mujer</td>\n",2502" <td>27.0</td>\n",2503" <td>NaN</td>\n",2504" <td>Soltero(a)</td>\n",2505" </tr>\n",2506" <tr>\n",2507" <th>37971</th>\n",2508" <td>2020</td>\n",2509" <td>09</td>\n",2510" <td>015516</td>\n",2511" <td>011</td>\n",2512" <td>11</td>\n",2513" <td>04</td>\n",2514" <td>030401</td>\n",2515" <td>Sierra Sur</td>\n",2516" <td>Área de Empadronamiento Rural (AER) Compuesto</td>\n",2517" <td>20200155160111104</td>\n",2518" <td>Hijo(a)/Hijastro(a)</td>\n",2519" <td>NaN</td>\n",2520" <td>NaN</td>\n",2521" <td>Si</td>\n",2522" <td>No</td>\n",2523" <td>NaN</td>\n",2524" <td>Hombre</td>\n",2525" <td>15.0</td>\n",2526" <td>NaN</td>\n",2527" <td>Soltero(a)</td>\n",2528" </tr>\n",2529" <tr>\n",2530" <th>37958</th>\n",2531" <td>2020</td>\n",2532" <td>09</td>\n",2533" <td>005523</td>\n",2534" <td>138</td>\n",2535" <td>11</td>\n",2536" <td>07</td>\n",2537" <td>040102</td>\n",2538" <td>Sierra Sur</td>\n",2539" <td>De 500 000 a más habitantes</td>\n",2540" <td>20170055231381103</td>\n",2541" <td>Hermano(a)</td>\n",2542" <td>NaN</td>\n",2543" <td>NaN</td>\n",2544" <td>Si</td>\n",2545" <td>No</td>\n",2546" <td>NaN</td>\n",2547" <td>Mujer</td>\n",2548" 
<td>48.0</td>\n",2549" <td>NaN</td>\n",2550" <td>Soltero(a)</td>\n",2551" </tr>\n",2552" <tr>\n",2553" <th>85034</th>\n",2554" <td>2020</td>\n",2555" <td>11</td>\n",2556" <td>018778</td>\n",2557" <td>155</td>\n",2558" <td>11</td>\n",2559" <td>06</td>\n",2560" <td>160404</td>\n",2561" <td>Selva</td>\n",2562" <td>Área de Empadronamiento Rural (AER) Compuesto</td>\n",2563" <td>20200187781551106</td>\n",2564" <td>Hijo(a)/Hijastro(a)</td>\n",2565" <td>2.0</td>\n",2566" <td>Jefe/jefa de hogar</td>\n",2567" <td>Si</td>\n",2568" <td>No</td>\n",2569" <td>NaN</td>\n",2570" <td>Hombre</td>\n",2571" <td>22.0</td>\n",2572" <td>NaN</td>\n",2573" <td>Conviviente</td>\n",2574" </tr>\n",2575" </tbody>\n",2576"</table>\n",2577"<p>85035 rows × 20 columns</p>\n",2578"</div>"2579],2580"text/plain": [2581" year MES CONGLOME VIVIENDA HOGAR CODPERSO UBIGEO DOMINIO \\\n",2582"56662 2019 04 005031 101 11 01 010201 Selva \n",2583"70184 2019 02 005024 003 11 07 010401 Selva \n",2584"49277 2019 11 009172 119 11 02 220501 Selva \n",2585"49275 2019 12 005011 031 11 01 010101 Sierra Norte \n",2586"70179 2019 01 008006 091 11 03 150801 Costa Centro \n",2587"... ... .. ... ... ... ... ... ... \n",2588"37969 2020 04 016182 079 11 01 070102 Lima Metropolitana \n",2589"37970 2020 11 016370 028 11 02 080106 Sierra Sur \n",2590"37971 2020 09 015516 011 11 04 030401 Sierra Sur \n",2591"37958 2020 09 005523 138 11 07 040102 Sierra Sur \n",2592"85034 2020 11 018778 155 11 06 160404 Selva \n",2593"\n",2594" ESTRATO P201P \\\n",2595"56662 De 20 000 a 49 999 habitantes 20190050311011101 \n",2596"70184 De 2 000 a 19 999 habitantes 20150050240031105 \n",2597"49277 De 2 000 a 19 999 habitantes 20160091721191102 \n",2598"49275 De 20 000 a 49 999 habitantes 20190050110311101 \n",2599"70179 De 100 000 a 499 999 habitantes 20190080060911103 \n",2600"... ... ... 
\n",2601"37969 De 500 000 a más habitantes 20200161820791101 \n",2602"37970 De 100 000 a 499 999 habitantes 20200163700281102 \n",2603"37971 Área de Empadronamiento Rural (AER) Compuesto 20200155160111104 \n",2604"37958 De 500 000 a más habitantes 20170055231381103 \n",2605"85034 Área de Empadronamiento Rural (AER) Compuesto 20200187781551106 \n",2606"\n",2607" P203 P203A P203B P204 P205 P206 \\\n",2608"56662 Jefe/Jefa 1.0 Jefe/jefa de hogar Si No NaN \n",2609"70184 Hijo(a)/Hijastro(a) 1.0 Hijo(a) Si Si NaN \n",2610"49277 Esposo(a)/compañero(a) 1.0 Esposa(o) Si No NaN \n",2611"49275 Jefe/Jefa 1.0 Jefe/jefa de hogar Si No NaN \n",2612"70179 Hijo(a)/Hijastro(a) 1.0 Hijo(a) Si No NaN \n",2613"... ... ... ... ... ... ... \n",2614"37969 Jefe/Jefa NaN NaN Si No NaN \n",2615"37970 Hijo(a)/Hijastro(a) 1.0 Hijo(a) Si No NaN \n",2616"37971 Hijo(a)/Hijastro(a) NaN NaN Si No NaN \n",2617"37958 Hermano(a) NaN NaN Si No NaN \n",2618"85034 Hijo(a)/Hijastro(a) 2.0 Jefe/jefa de hogar Si No NaN \n",2619"\n",2620" P207 P208A P208B P209 \n",2621"56662 Hombre 45.0 NaN Casado(a) \n",2622"70184 Mujer 18.0 NaN Soltero(a) \n",2623"49277 Mujer 32.0 NaN Conviviente \n",2624"49275 Hombre 58.0 NaN Casado(a) \n",2625"70179 Hombre 19.0 NaN Soltero(a) \n",2626"... ... ... ... ... 
\n",2627"37969 Mujer 43.0 NaN Casado(a) \n",2628"37970 Mujer 27.0 NaN Soltero(a) \n",2629"37971 Hombre 15.0 NaN Soltero(a) \n",2630"37958 Mujer 48.0 NaN Soltero(a) \n",2631"85034 Hombre 22.0 NaN Conviviente \n",2632"\n",2633"[85035 rows x 20 columns]"2634]2635},2636"execution_count": 21,2637"metadata": {},2638"output_type": "execute_result"2639}2640],2641"source": [2642"# Ordene la base de datos a partir de las variables que identifican cada miembro y la variable de año (year) \n",2643"# Así podrá observar a cada individuo en ambos años.\n",2644"\n",2645"by_year = data_administrativa.sort_values('year',ascending=True)\n",2646"by_year\n"2647]2648},2649{2650"cell_type": "code",2651"execution_count": null,2652"id": "33245bf4",2653"metadata": {},2654"outputs": [],2655"source": [2656"# Finalmente crear una base de datos para cada año \n",2657"\n",2658"# Base de datos del año 2019 \n",2659"df_2019 = data_administrativa.loc[ data_administrativa.year == '2019', : ]\n",2660"df_2019\n",2661"# guardamos\n",2662"import pyreadstat\n",2663"pyreadstat.write_sav(data_administrativa, r\"../../data/data_administrativa/data_2019_grupo8.sav\")\n",2664"\n",2665"# Base de datos del año 2020\n",2666"df_2020 = data_administrativa.loc[ data_administrativa.year == '2020', : ]\n",2667"df_2020\n",2668"\n",2669"pyreadstat.write_sav(data_administrativa, r\"../../data/data_administrativa/data_2020_grupo8.sav\")"2670]2671},2672{2673"cell_type": "code",2674"execution_count": null,2675"id": "d76c0298",2676"metadata": {},2677"outputs": [],2678"source": []2679}2680],2681"metadata": {2682"kernelspec": {2683"display_name": "Python 3 (ipykernel)",2684"language": "python",2685"name": "python3"2686},2687"language_info": {2688"codemirror_mode": {2689"name": "ipython",2690"version": 32691},2692"file_extension": ".py",2693"mimetype": "text/x-python",2694"name": "python",2695"nbconvert_exporter": "python",2696"pygments_lexer": "ipython3",2697"version": "3.9.12"2698}2699},2700"nbformat": 
4,2701"nbformat_minor": 52702}270327042705