1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27
from pdftools.pdffile import PDFDocument
import pdftools
# Open the sample PDF and report its format version and page count.
file = "diveintopython.pdf"
doc = PDFDocument(file)
# Join with "%s %s" so the output matches the two-argument print statement
# (items separated by one space) on both Python 2 and Python 3.
print("%s %s" % ("Document uses PDF format version", doc.document_version()))
pages = doc.count_pages()
print("Document contains %i pages." % pages)

# Read page 123 and its contents; the loop at the end of the script walks
# ``contents123.contents``.
page123 = doc.read_page(123)
contents123 = page123.read_contents()
def iterer(sequence, fonction):
    """Apply ``fonction`` to every leaf of an arbitrarily nested iterable.

    ``sequence`` is walked depth-first, left to right. A value that cannot
    be iterated is a leaf and is handed to ``fonction``. Strings are leaves
    too: iterating a one-character string yields that same string again, so
    descending into them would recurse until the interpreter's limit.

    Args:
        sequence: A leaf value, or a (possibly nested) iterable of values.
        fonction: Callable invoked once per leaf, in traversal order.

    Raises:
        Whatever ``fonction`` raises, and any error raised while iterating.
        These propagate to the caller unchanged.
    """
    # ``str`` plus the type of a unicode literal covers the text types of
    # both Python 2 (str / unicode) and Python 3 (str).
    if isinstance(sequence, (str, type(u""))):
        fonction(sequence)
        return

    # Guard only the iterability probe. Wrapping the whole walk would make a
    # failure inside ``fonction`` look like "not iterable" and re-invoke the
    # callback on the enclosing container.
    try:
        elements = iter(sequence)
    except TypeError:
        fonction(sequence)
        return

    for item in elements:
        iterer(item, fonction)
def afficher(texte):
    """Print the ``text`` attribute of ``texte`` if it is a pdftools ``Text``.

    Objects of any other type are ignored and nothing is printed.
    """
    if not isinstance(texte, pdftools.pdftext.Text):
        return
    print(texte.text)
# Walk each entry of the page contents with iterer(), passing afficher() as
# the callback applied to every leaf it reaches.
for items in contents123.contents:
    iterer(items, afficher)
Partager