From 4c6c304b66897b05b18f9800065a4bc944294e7a Mon Sep 17 00:00:00 2001 From: Michael Stephens Date: Mon, 4 Jan 2010 11:30:23 +0000 Subject: [PATCH] update MI to work with latest version of PdfMiner --- scripts/mi/get_legislation.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/scripts/mi/get_legislation.py b/scripts/mi/get_legislation.py index 902381b558..2bd40bcb5f 100755 --- a/scripts/mi/get_legislation.py +++ b/scripts/mi/get_legislation.py @@ -10,7 +10,7 @@ from pdfminer.pdfinterp import PDFResourceManager, PDFPageInterpreter, process_pdf from pdfminer.pdfdevice import PDFDevice from pdfminer.converter import TextConverter -from pdfminer.cmap import CMapDB, find_cmap_path +from pdfminer.cmapdb import CMapDB from pdfminer.layout import LAParams from StringIO import StringIO @@ -97,7 +97,7 @@ def fetch_past_legislator(self, year, chamber, url, name): # UGH! What a useful yet convoluted library. outtext = StringIO() - rsrc = PDFResourceManager(CMapDB(find_cmap_path())) + rsrc = PDFResourceManager(CMapDB()) device = TextConverter(rsrc, outtext, codec='ascii', laparams=LAParams()) process_pdf(rsrc, device, StringIO(the_pdf), set()) outtext.seek(0) @@ -392,4 +392,4 @@ def parse_name(self, name): return (first_name, middle_name, last_name, suffix) if __name__ == '__main__': - MichiganScraper().run() + MichiganScraper.run()