-
Notifications
You must be signed in to change notification settings - Fork 11
/
etl_unificando.py
161 lines (137 loc) · 5.34 KB
/
etl_unificando.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
import pandas as pd
from apiclient import discovery
from oauth2client import client
from oauth2client import tools
from oauth2client.file import Storage
import re
import os
import httplib2
from geopy.geocoders import Nominatim
from Dicc_Tipo_Danhos import camb_tipos
# Command-line flags for the OAuth2 flow, parsed once at import time with
# the argument parser that oauth2client's ``tools`` module provides.
try:
    import argparse
except ImportError:
    # Without argparse there are no flags; get_credentials() checks for this.
    flags = None
else:
    flags = argparse.ArgumentParser(parents=[tools.argparser]).parse_args()
# If modifying these scopes, delete your previously saved credentials
# at ~/.credentials/sheets.googleapis.com-python-quickstart.json
# OAuth2 scope requested by get_credentials(): read-only spreadsheet access.
SCOPES = 'https://www.googleapis.com/auth/spreadsheets.readonly'
# Client-secrets file passed to client.flow_from_clientsecrets(); the path is
# relative, so it is resolved against the current working directory.
CLIENT_SECRET_FILE = 'creds/secreto_cliente.json'
# Set as the user agent of the OAuth2 flow in get_credentials().
APPLICATION_NAME = 'Temblor'
def get_credentials():
    """Return usable OAuth2 credentials, running the OAuth2 flow if needed.

    Credentials are looked up in
    ``~/.credentials/sheets.googleapis.com-python-quickstart.json``; the
    ``~/.credentials`` directory is created first when it does not exist.
    If nothing is stored there, or the stored credentials are invalid, a
    flow built from ``CLIENT_SECRET_FILE`` and ``SCOPES`` is run against
    that same store to obtain new credentials.

    Returns:
        Credentials, the stored or newly obtained credential.
    """
    cache_dir = os.path.join(os.path.expanduser('~'), '.credentials')
    if not os.path.exists(cache_dir):
        os.makedirs(cache_dir)
    cache_file = os.path.join(
        cache_dir, 'sheets.googleapis.com-python-quickstart.json')

    storage = Storage(cache_file)
    cached = storage.get()
    if cached and not cached.invalid:
        # Stored credentials are still good: no flow needed.
        return cached

    oauth_flow = client.flow_from_clientsecrets(CLIENT_SECRET_FILE, SCOPES)
    oauth_flow.user_agent = APPLICATION_NAME
    if flags:
        fresh = tools.run_flow(oauth_flow, storage, flags)
    else:
        # Needed only for compatibility with Python 2.6
        fresh = tools.run(oauth_flow, storage)
    print('Storing credentials to ' + cache_file)
    return fresh
def get_Data_temblor():
    """Download the rows of the source sheet through the Sheets API (v4).

    Authorizes an HTTP client with get_credentials(), builds a Sheets
    service and requests the range ``Traslado de Víveres!A7:AH10000`` of
    the spreadsheet whose id is hard-coded below.

    Returns:
        The list stored under ``values`` in the API response, or ``None``
        (after printing ``No data found.``) when that list is missing or
        empty.
    """
    authorized_http = get_credentials().authorize(httplib2.Http())
    discovery_url = ('https://sheets.googleapis.com/$discovery/rest?'
                     'version=v4')
    sheets = discovery.build(
        'sheets',
        'v4',
        http=authorized_http,
        discoveryServiceUrl=discovery_url,
    )

    # Original heading here read "verified damage and collapses".
    # NOTE(review): the range below reads the 'Traslado de Víveres' tab, so
    # that heading looks stale - confirm.
    # To download other tabs, change the sheet name in the ``range`` field.
    request = sheets.spreadsheets().values().get(
        spreadsheetId='1C7qvWM0o3u5pdFJhnvQosK_3l-VGyZWTZ0JvOtOgPp0',
        range='Traslado de Víveres!A7:AH10000')
    rows = request.execute().get('values', [])

    if rows:
        return rows
    print('No data found.')
    return None
def insert_Data_temblor(datos):
    """Read the ``Datos!A1:H10000`` range of the target sheet and print it.

    Despite its name, this function inserts nothing: it only issues a
    ``values().get`` request against the spreadsheet whose id is hard-coded
    below and prints the returned rows, or ``No data found.`` when the
    response has no rows.

    Args:
        datos: Not used by the current implementation.

    Returns:
        None.
    """
    authorized_http = get_credentials().authorize(httplib2.Http())
    discovery_url = ('https://sheets.googleapis.com/$discovery/rest?'
                     'version=v4')
    sheets = discovery.build(
        'sheets',
        'v4',
        http=authorized_http,
        discoveryServiceUrl=discovery_url,
    )

    request = sheets.spreadsheets().values().get(
        spreadsheetId='1wLHf5ITtTsfErWoPHwhu7Vfy-96eQKKxZO2AmZbP9XY',
        range='Datos!A1:H10000')
    rows = request.execute().get('values', [])

    if rows:
        print(rows)
    else:
        print('No data found.')
def estructura_sheet(listas):
    """Turn the rows of a sheet into a ``pandas.DataFrame``.

    The first row supplies the column names.  Every row, including that
    first one, becomes a row of the result, with cells matched to column
    names by position.

    The frame is built in a single call from a list of dicts rather than
    with ``DataFrame.append`` in a loop: ``append`` was removed in
    pandas 2.0 and copied the whole frame on every iteration.

    Args:
        listas: Sequence of rows, each a sequence of cell values; the
            first row is the header.  May be empty or ``None``.

    Returns:
        A DataFrame with one column per header cell and one row per input
        row.  Rows shorter than the header are padded with NaN; cells
        beyond the header's width have no column name and are ignored.
        An empty DataFrame is returned when ``listas`` is empty or
        ``None``.
    """
    if not listas:
        return pd.DataFrame()

    columnas = listas[0]
    # NOTE(review): the header row is deliberately kept as row 0, as before,
    # so the shape of the result is unchanged - confirm whether downstream
    # code really wants the header repeated as data.
    registros = [dict(zip(columnas, fila)) for fila in listas]
    return pd.DataFrame(registros)
if __name__ == '__main__':
    # Script entry point: download the sheet, keep and rename the columns
    # of interest, drop the rows without an ``s19`` value and write the
    # result to ``unificando.csv`` in the current working directory.
    data = get_Data_temblor()
    if not data:
        # get_Data_temblor() returns None when the sheet has no rows; stop
        # here instead of failing later with an unrelated traceback.
        raise SystemExit('No data downloaded; unificando.csv was not written.')
    unificando = estructura_sheet(data)

    # Sheet header -> output column name, in output order.  The keys must
    # match the sheet headers exactly, trailing spaces included; a missing
    # header raises KeyError.
    columnas_salida = {
        'DESCRIPCIÓN': 'Descripcion',
        'DELEGACIÓN/ENTIDAD FEDERATIVA ': 'Delegacion/Entidad Federativa',
        'COLONIA ': 'Colonia',
        'Lugar de REFERENCIA': 'Lugar de Referencia',
        'DIRECCIÓN': 'Direccion',
        'HORARIOS DE ATENCIÓN': 'Horarios de atencion ',
        'REQ TRANSPORTE PARA MOVER VÍVERES A OTRO LUGAR':
            'Requiere transporte para mover viveres a otro lugar',
        'Mandan víveres hacia ': 'Mandan viveres hacia',
        'Horarios de salidas': 'Horarios de salidas',
        'NECESITAN': 'Necesitan',
        'OFRECEN VÍVERES A QUIEN LO NECESITEN': 'Exceso de viveres',
        'ULTIMA ACTUALIZACIÓN (AAAA-MM-DD 23:59)': 'Fechas',
        's19 POR FAVOR NO MODIFICAR': 's19',
        'LAT ': 'Latitud',
        'LONG ': 'Longitud',
    }
    unif = unificando[list(columnas_salida)].rename(columns=columnas_salida)

    # Keep only the rows that have an s19 value.  The original read
    # ``unif_l`` before assigning it, which raised NameError.
    unif_l = unif[unif['s19'].notnull()]
    unif_l.to_csv('unificando.csv')