-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathFuncionIteraFrenteAmplio.py
More file actions
80 lines (60 loc) · 2.36 KB
/
FuncionIteraFrenteAmplio.py
File metadata and controls
80 lines (60 loc) · 2.36 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
import pandas as pd
import requests
import urllib.request
from bs4 import BeautifulSoup
# Module-level list, created empty at import time. Nothing in the visible
# function reads or writes it (a local counterpart is commented out there);
# presumably calling code collects per-session results here -- verify.
datafinal = []
# Default location of the workbook that lists one voting session per row.
_RUTA_DATAURL = r'C:\Users\Usuario\Desktop\Data science\Proyecto Frente Amplio\DataUrl.xlsx'

# HTML ids of the two result tables looked up in the downloaded page.
_ID_TABLA_A_FAVOR = 'ContentPlaceHolder1_ContentPlaceHolder1_PaginaContent_dtlAFavor'
_ID_TABLA_EN_CONTRA = 'ContentPlaceHolder1_ContentPlaceHolder1_PaginaContent_dtlEnContra'


def _nombres_de_tabla(tabla):
    """Return the stripped, non-empty text of every <td> in *tabla*, row by row."""
    nombres = []
    for fila in tabla.find_all('tr'):
        for celda in fila.find_all('td'):
            texto = celda.text.strip()
            if texto:
                nombres.append(texto)
    return nombres


def _marco_votos(nombres, voto):
    """Build a frame with one row per name and a constant 'Voto' column."""
    marco = pd.DataFrame(nombres, columns=["Nombre Diputado"])
    marco['Voto'] = voto
    return marco


def iterasesiones(x, ruta_excel=_RUTA_DATAURL):
    """Scrape the votes of one session and return them as a DataFrame.

    The row labelled *x* of the Excel workbook supplies the page URL (column
    'Resultado') and the session title (column 'Sesion'). The page is
    downloaded and the text of the cells in its "a favor" and "en contra"
    tables is collected.

    Args:
        x: Index label of the row to process in the workbook.
        ruta_excel: Path of the workbook to read. Defaults to the location
            that used to be hard-coded in this function.

    Returns:
        A DataFrame with columns 'Nombre Diputado', 'Voto' (1 for names taken
        from the "a favor" table, 0 for names taken from the "en contra"
        table) and 'Sesion' (the session title, repeated on every row). The
        two groups are concatenated without resetting the index.

    Raises:
        KeyError: If *x* or one of the expected columns is missing.
        AttributeError: If the page has no "a favor" table.
    """
    df_url = pd.read_excel(ruta_excel)
    fila_sesion = df_url.loc[x]
    url = fila_sesion.at['Resultado']
    titulo = fila_sesion.at['Sesion']

    r = requests.get(url)
    soup = BeautifulSoup(r.text, "lxml")

    # The "a favor" table is required: if it is absent, find() returns None
    # and the helper raises AttributeError, exactly as before.
    tabla_a_favor = soup.find('table', id=_ID_TABLA_A_FAVOR)
    diputados_a_favor = _nombres_de_tabla(tabla_a_favor)

    # The "en contra" table is optional. An explicit None check replaces the
    # former bare ``except: pass`` so that unrelated errors are not hidden.
    tabla_en_contra = soup.find('table', id=_ID_TABLA_EN_CONTRA)
    if tabla_en_contra is None:
        diputados_en_contra = []
    else:
        # Fix: the previous code appended rows parsed from the "a favor"
        # table here, so the "en contra" names were never recorded.
        diputados_en_contra = _nombres_de_tabla(tabla_en_contra)

    eljunte = pd.concat([
        _marco_votos(diputados_a_favor, 1),
        _marco_votos(diputados_en_contra, 0),
    ])
    eljunte['Sesion'] = titulo
    return eljunte