# Coding Python Servel
# -*- coding: utf-8 -*-
"""
Created on Sun Jul 24 20:06:14 2016
"""
'''
info extracted from
http://stackoverflow.com/questions/12360999/pypdf-retrieve-page-numbers-from-document
http://stackoverflow.com/questions/26494211/extracting-text-from-a-pdf-file-using-pdfminer-in-python
'''
import csv
import sys
import json
import googlemaps
# Python 2 only: `reload` is a builtin there, and re-importing `sys` makes
# `sys.setdefaultencoding` callable again so the process-wide default string
# encoding can be forced to UTF-8. Neither call works on Python 3.
reload(sys)
sys.setdefaultencoding("utf-8")
# Text-extraction objects created once at import time and shared module-wide.
# NOTE(review): StringIO, PDFResourceManager, TextConverter, LAParams and
# PDFPageInterpreter are not imported in the visible part of this file --
# presumably they come from `StringIO`/`pdfminer`; confirm the import lines exist.
# `output` is handed to the converter, presumably as the buffer that receives
# the extracted text -- TODO confirm.
output = StringIO()
manager = PDFResourceManager()
converter = TextConverter(manager, output, laparams=LAParams())
# The interpreter is built from the same resource manager and the converter above.
interpreter = PDFPageInterpreter(manager, converter)
def servelParser(rutaPdf):
# Open the PDF at `rutaPdf`, walk its pages one by one, and locate fixed
# header labels ('NOMBRE', 'REGION', 'COMUNA:', ...) in each page's text.
# Returns `datosServel`.
#
# NOTE(review): this listing has lost its indentation and is missing lines
# between the `votantes` update and the `'Lng'` fragment near the end: `k`,
# `geocode_result` and `datosServel` are never defined in the visible text.
# Restore the body from the original file before relying on this function.
# NOTE(review): the file opened here is never explicitly closed in the visible code.
pdf = PdfFileReader(open(rutaPdf,'rb'))
# NOTE(review): the line after the next one ("could take a LOT of time") is
# the tail of the trailing comment, split off by the extraction.
paginas = pdf.getNumPages() #will fetch all the pages from the PDF. It
could take a LOT of time
#paginas = 2
#Define fields
# One slot per page for each field. This relies on Python 2, where range()
# returns a list that supports item assignment (see `pages[i] = ...` below).
# Presumably each slot is later overwritten with that page's parsed values -- the
# lines doing so are not visible here.
nombres = range(paginas)
rut = range(paginas)
circunscripcion = range(paginas)
comuna = range(paginas)
direccion = range(paginas)
provincia = range(paginas)
Region = range(paginas)
Mesa = range(paginas)
pages = range(paginas)
# Running total accumulated from len(nombres[i]) for every page.
votantes = 0
for i in range(paginas):
# convert() is defined outside this view; it is called with the path and a
# one-element page list, and presumably returns that page's text -- TODO confirm.
pages[i] = convert(rutaPdf,[i])
# Positions of the header labels within the page. If pages[i] is a str,
# .index() raises ValueError when a label is absent.
indexNombre = pages[i].index('NOMBRE')
indexRegion = pages[i].index('REGION')
indexComuna = pages[i].index('COMUNA:')
indexCI = pages[i].index('C.IDENTIDAD SEXO')
indexCirc = pages[i].index('CIRCUNSCRIPCIÓN')
indexDomEle = pages[i].index('DOMICILIO ELECTORAL')
indexMesa = pages[i].index('MESA')
# NOTE(review): len() requires nombres[i] to have been replaced by a sized
# object first; that assignment is among the missing lines.
votantes +=len(nombres[i])
# NOTE(review): orphaned tail of a dict literal; its opening and the geocoding
# call that produces `geocode_result` are missing from this listing.
'Lng':geocode_result[0]["geometry"]["location"]["lng"]}
k+=1
return datosServel