Path: blob/main/Trabajo_final/grupo7/PREGUNTA_2_Spyder.py
2714 views
#!pip install openpyxl1#importar la librería pandas2import pandas as pd3import os45user = os.getlogin() # Username6#se cambia el directorio de trabajo78os.chdir(f"C:/Users/{user}/Desktop/trabfinal")910#se exporta los dataframes para los años desde 2014 hasta 2021, para luego editarlos1112#20141314det2014 = pd.read_excel(f"C:/Users/{user}/Desktop/trabfinal/VRAEM 2014.xlsx", sheet_name='Hoja1')1516det2014.drop([0],axis=0)17det2014=det2014.drop([0],axis=0)18print (det2014)1920#renombrar columnas21det2014.rename(columns={"Unnamed: 7": "Anual"}, inplace=True)2223det2014.rename(columns={"Unnamed: 1": "I BIMESTRE", "Unnamed: 2":"II BIMESTRE", "Unnamed: 3": "III BIMESTRE", "Unnamed: 4": "IV BIMESTRE", "Unnamed: 5": "V BIMESTRE", "Unnamed: 6": "VI BIMESTRE"}, inplace=True)2425#se eliminan las columnas bimestrales, para solo quedarse con las anuales26det2014.drop(['I BIMESTRE','II BIMESTRE', 'III BIMESTRE','IV BIMESTRE','V BIMESTRE', 'VI BIMESTRE'], axis=1)2728#se eliminan las columnas de Establecimiento de Salud e Instituciones educativas29det2014.drop([10, 11],axis=0)30det2014=det2014.drop([10, 11],axis=0)3132det2014.drop([13],axis=0)33det2014=det2014.drop([13],axis=0)3435det2014.drop([1],axis=0)36det2014=det2014.drop([1],axis=0)373839det2014=det2014.drop(['I BIMESTRE','II BIMESTRE', 'III BIMESTRE','IV BIMESTRE','V BIMESTRE', 'VI BIMESTRE'], axis=1)4041det2014.rename(columns={"INFORMACION BIMESTRAL 2014 - VRAEM: InfoJUNTOS": "Reporte"}, inplace=True)4243det2014.rename(columns={"Anual": "2014"}, inplace=True)4445#este proceso de replica para los siguientes años46#20154748det2015 = pd.read_excel(f"C:/Users/{user}/Desktop/trabfinal/VRAEM 2015.xlsx", sheet_name='Hoja1')4950det2015.drop([0],axis=0)51det2015=det2015.drop([0],axis=0)52print (det2015)5354#renombrar columnas55det2015.rename(columns={"Unnamed: 7": "Anual"}, inplace=True)5657det2015.rename(columns={"Unnamed: 1": "I BIMESTRE", "Unnamed: 2":"II BIMESTRE", "Unnamed: 3": "III BIMESTRE", "Unnamed: 4": "IV BIMESTRE", "Unnamed: 5": "V BIMESTRE", "Unnamed: 6": "VI BIMESTRE"}, inplace=True)585960det2015.drop(['I BIMESTRE','II BIMESTRE', 'III BIMESTRE','IV BIMESTRE','V BIMESTRE', 'VI BIMESTRE'], axis=1)61det2015=det2015.drop(['I BIMESTRE','II BIMESTRE', 'III BIMESTRE','IV BIMESTRE','V BIMESTRE', 'VI BIMESTRE'], axis=1)6263det2015.drop([10, 11],axis=0)64det2015=det2015.drop([10, 11],axis=0)6566det2015.drop([13],axis=0)67det2015=det2015.drop([13],axis=0)6869det2015.drop([1],axis=0)70det2015=det2015.drop([1],axis=0)717273det2015.rename(columns={"INFORMACION BIMESTRAL 2015 - VRAEM: InfoJUNTOS": "Reporte"}, inplace=True)747576det2015.rename(columns={"Anual": "2015"}, inplace=True)7778#20167980det2016 = pd.read_excel(f"C:/Users/{user}/Desktop/trabfinal/VRAEM 2016.xlsx", sheet_name='Hoja1')8182det2016.drop([0],axis=0)83det2016=det2016.drop([0],axis=0)84print (det2016)8586#renombrar columnas87det2016.rename(columns={"Unnamed: 7": "Anual"}, inplace=True)8889det2016.rename(columns={"Unnamed: 1": "I BIMESTRE", "Unnamed: 2":"II BIMESTRE", "Unnamed: 3": "III BIMESTRE", "Unnamed: 4": "IV BIMESTRE", "Unnamed: 5": "V BIMESTRE", "Unnamed: 6": "VI BIMESTRE"}, inplace=True)909192det2016.drop(['I BIMESTRE','II BIMESTRE', 'III BIMESTRE','IV BIMESTRE','V BIMESTRE', 'VI BIMESTRE'], axis=1)93det2016=det2016.drop(['I BIMESTRE','II BIMESTRE', 'III BIMESTRE','IV BIMESTRE','V BIMESTRE', 'VI BIMESTRE'], axis=1)9495det2016.drop([10, 11],axis=0)96det2016=det2016.drop([10, 11],axis=0)9798det2016.drop([13],axis=0)99det2016=det2016.drop([13],axis=0)100101det2016.drop([1],axis=0)102det2016=det2016.drop([1],axis=0)103104det2016.rename(columns={"INFORMACION BIMESTRAL 2016 - VRAEM: InfoJUNTOS": "Reporte"}, inplace=True)105106det2016.rename(columns={"Anual": "2016"}, inplace=True)107108#2017109110det2017 = pd.read_excel(f"C:/Users/{user}/Desktop/trabfinal/VRAEM 2017.xlsx", sheet_name='Hoja1')111112det2017.drop([0],axis=0)113det2017=det2017.drop([0],axis=0)114print (det2017)115116#renombrar columnas117det2017.rename(columns={"Unnamed: 7": "Anual"}, inplace=True)118119det2017.rename(columns={"Unnamed: 1": "I BIMESTRE", "Unnamed: 2":"II BIMESTRE", "Unnamed: 3": "III BIMESTRE", "Unnamed: 4": "IV BIMESTRE", "Unnamed: 5": "V BIMESTRE", "Unnamed: 6": "VI BIMESTRE"}, inplace=True)120121122det2017.drop(['I BIMESTRE','II BIMESTRE', 'III BIMESTRE','IV BIMESTRE','V BIMESTRE', 'VI BIMESTRE'], axis=1)123det2017=det2017.drop(['I BIMESTRE','II BIMESTRE', 'III BIMESTRE','IV BIMESTRE','V BIMESTRE', 'VI BIMESTRE'], axis=1)124125det2017.drop([10, 11],axis=0)126det2017=det2017.drop([10, 11],axis=0)127128det2017.drop([13],axis=0)129det2017=det2017.drop([13],axis=0)130131det2017.drop([1],axis=0)132det2017=det2017.drop([1],axis=0)133134135det2017.rename(columns={"INFORMACION BIMESTRAL 2017 - VRAEM: InfoJUNTOS": "Reporte"}, inplace=True)136137det2017.rename(columns={"Anual": "2017"}, inplace=True)138139140#2018141142det2018 = pd.read_excel(f"C:/Users/{user}/Desktop/trabfinal/VRAEM 2018.xlsx", sheet_name='Hoja1')143144det2018.drop([0],axis=0)145det2018=det2018.drop([0],axis=0)146print (det2018)147148#renombrar columnas149det2018.rename(columns={"Unnamed: 7": "Anual"}, inplace=True)150151det2018.rename(columns={"Unnamed: 1": "I BIMESTRE", "Unnamed: 2":"II BIMESTRE", "Unnamed: 3": "III BIMESTRE", "Unnamed: 4": "IV BIMESTRE", "Unnamed: 5": "V BIMESTRE", "Unnamed: 6": "VI BIMESTRE"}, inplace=True)152153154det2018.drop(['I BIMESTRE','II BIMESTRE', 'III BIMESTRE','IV BIMESTRE','V BIMESTRE', 'VI BIMESTRE'], axis=1)155det2018=det2018.drop(['I BIMESTRE','II BIMESTRE', 'III BIMESTRE','IV BIMESTRE','V BIMESTRE', 'VI BIMESTRE'], axis=1)156157det2018.drop([10, 11],axis=0)158det2018=det2018.drop([10, 11],axis=0)159160det2018.drop([13],axis=0)161det2018=det2018.drop([13],axis=0)162163det2018.drop([1],axis=0)164det2018=det2018.drop([1],axis=0)165166det2018.rename(columns={"INFORMACION BIMESTRAL 2018 - VRAEM: InfoJUNTOS": "Reporte"}, inplace=True)167det2018.rename(columns={"Anual": "2018"}, inplace=True)168169170171#2019172173det2019 = pd.read_excel(f"C:/Users/{user}/Desktop/trabfinal/VRAEM 2019.xlsx", sheet_name='Hoja1')174175det2019.drop([0],axis=0)176det2019=det2019.drop([0],axis=0)177print (det2019)178179#renombrar columnas180det2019.rename(columns={"Unnamed: 7": "Anual"}, inplace=True)181182det2019.rename(columns={"Unnamed: 1": "I BIMESTRE", "Unnamed: 2":"II BIMESTRE", "Unnamed: 3": "III BIMESTRE", "Unnamed: 4": "IV BIMESTRE", "Unnamed: 5": "V BIMESTRE", "Unnamed: 6": "VI BIMESTRE"}, inplace=True)183184185det2019.drop(['I BIMESTRE','II BIMESTRE', 'III BIMESTRE','IV BIMESTRE','V BIMESTRE', 'VI BIMESTRE'], axis=1)186det2019=det2019.drop(['I BIMESTRE','II BIMESTRE', 'III BIMESTRE','IV BIMESTRE','V BIMESTRE', 'VI BIMESTRE'], axis=1)187188det2019.drop([10, 11],axis=0)189det2019=det2019.drop([10, 11],axis=0)190191det2019.drop([13],axis=0)192det2019=det2019.drop([13],axis=0)193194det2019.drop([1],axis=0)195det2019=det2019.drop([1],axis=0)196197det2019.rename(columns={"INFORMACION BIMESTRAL 2019 - VRAEM: InfoJUNTOS": "Reporte"}, inplace=True)198199200det2019.rename(columns={"Anual": "2019"}, inplace=True)201202203#2020204det2020 = pd.read_excel(f"C:/Users/{user}/Desktop/trabfinal/VRAEM 2020.xlsx", sheet_name='Hoja1')205206det2020.drop([0],axis=0)207det2020=det2020.drop([0],axis=0)208print (det2020)209210#renombrar columnas211det2020.rename(columns={"Unnamed: 7": "Anual"}, inplace=True)212213det2020.rename(columns={"Unnamed: 1": "I BIMESTRE", "Unnamed: 2":"II BIMESTRE", "Unnamed: 3": "III BIMESTRE", "Unnamed: 4": "IV BIMESTRE", "Unnamed: 5": "V BIMESTRE", "Unnamed: 6": "VI BIMESTRE"}, inplace=True)214215216det2020.drop(['I BIMESTRE','II BIMESTRE', 'III BIMESTRE','IV BIMESTRE','V BIMESTRE', 'VI BIMESTRE'], axis=1)217det2020=det2020.drop(['I BIMESTRE','II BIMESTRE', 'III BIMESTRE','IV BIMESTRE','V BIMESTRE', 'VI BIMESTRE'], axis=1)218219det2020.drop([10, 11],axis=0)220det2020=det2020.drop([10, 11],axis=0)221222det2020.drop([13],axis=0)223det2020=det2020.drop([13],axis=0)224225det2020.drop([1],axis=0)226det2020=det2020.drop([1],axis=0)227228229det2020.rename(columns={"INFORMACION BIMESTRAL 2020 - VRAEM: InfoJUNTOS": "Reporte"}, inplace=True)230231det2020.rename(columns={"Anual": "2020"}, inplace=True)232233#2021234235det2021 = pd.read_excel(f"C:/Users/{user}/Desktop/trabfinal/VRAEM 2021.xlsx", sheet_name='Hoja1')236237det2021.drop([0],axis=0)238det2021=det2021.drop([0],axis=0)239print (det2021)240241#renombrar columnas242det2021.rename(columns={"Unnamed: 7": "Anual"}, inplace=True)243244det2021.rename(columns={"Unnamed: 1": "I BIMESTRE", "Unnamed: 2":"II BIMESTRE", "Unnamed: 3": "III BIMESTRE", "Unnamed: 4": "IV BIMESTRE", "Unnamed: 5": "V BIMESTRE", "Unnamed: 6": "VI BIMESTRE"}, inplace=True)245246247det2021.drop(['I BIMESTRE','II BIMESTRE', 'III BIMESTRE','IV BIMESTRE','V BIMESTRE', 'VI BIMESTRE'], axis=1)248det2021=det2021.drop(['I BIMESTRE','II BIMESTRE', 'III BIMESTRE','IV BIMESTRE','V BIMESTRE', 'VI BIMESTRE'], axis=1)249250det2021.drop([10, 11],axis=0)251det2021=det2021.drop([10, 11],axis=0)252253det2021.drop([13],axis=0)254det2021=det2021.drop([13],axis=0)255256det2021.drop([1],axis=0)257det2021=det2021.drop([1],axis=0)258259det2021.rename(columns={"INFORMACION BIMESTRAL 2021 - VRAEM: InfoJUNTOS": "Reporte"}, inplace=True)260261det2021.rename(columns={"Anual": "2021"}, inplace=True)262263264265#utilizamos merge para poder agrupar los dataframe (de dos en dos)266det1514=pd.merge(det2014, det2015, on='Reporte', how='inner')267det1614=pd.merge(det1514, det2016, on='Reporte', how='inner')268det1714=pd.merge(det1614, det2017, on='Reporte', how='inner')269det1814=pd.merge(det1714, det2018, on='Reporte', how='inner')270det1914=pd.merge(det1814, det2019, on='Reporte', how='inner')271det1420=pd.merge(det1914, det2020, on='Reporte', how='inner')272det1421=pd.merge(det1420, det2021, on='Reporte', how='inner')273274275#finalmente, det1421 representa el dataframe que agrupa los dataframe para cada año desde 2014 hasta 2021 (en términos anuales)276#trasponemos el dataframe277278dataframefinal=det1421.transpose()279280print(dataframefinal)281282#se obtiene de el dataframefinal283284285286287288