OLD | NEW |
(Empty) | |
| 1 # copyright 2003-2011 LOGILAB S.A. (Paris, FRANCE), all rights reserved. |
| 2 # contact http://www.logilab.fr/ -- mailto:contact@logilab.fr |
| 3 # |
| 4 # This file is part of logilab-common. |
| 5 # |
| 6 # logilab-common is free software: you can redistribute it and/or modify it unde
r |
| 7 # the terms of the GNU Lesser General Public License as published by the Free |
| 8 # Software Foundation, either version 2.1 of the License, or (at your option) an
y |
| 9 # later version. |
| 10 # |
| 11 # logilab-common is distributed in the hope that it will be useful, but WITHOUT |
| 12 # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS |
| 13 # FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for more |
| 14 # details. |
| 15 # |
| 16 # You should have received a copy of the GNU Lesser General Public License along |
| 17 # with logilab-common. If not, see <http://www.gnu.org/licenses/>. |
| 18 """Manipulate pdf and fdf files (pdftk recommended). |
| 19 |
| 20 Notes regarding pdftk, pdf forms and fdf files (form definition file) |
| 21 fields names can be extracted with: |
| 22 |
| 23 pdftk orig.pdf generate_fdf output truc.fdf |
| 24 |
| 25 to merge fdf and pdf: |
| 26 |
| 27 pdftk orig.pdf fill_form test.fdf output result.pdf [flatten] |
| 28 |
| 29 without flatten, one could further edit the resulting form. |
| 30 with flatten, everything is turned into text. |
| 31 |
| 32 |
| 33 |
| 34 |
| 35 """ |
| 36 __docformat__ = "restructuredtext en" |
| 37 # XXX seems very unix specific |
| 38 # TODO: check availability of pdftk at import |
| 39 |
| 40 |
| 41 import os |
| 42 |
| 43 HEAD="""%FDF-1.2 |
| 44 %\xE2\xE3\xCF\xD3 |
| 45 1 0 obj |
| 46 << |
| 47 /FDF |
| 48 << |
| 49 /Fields [ |
| 50 """ |
| 51 |
| 52 TAIL="""] |
| 53 >> |
| 54 >> |
| 55 endobj |
| 56 trailer |
| 57 |
| 58 << |
| 59 /Root 1 0 R |
| 60 >> |
| 61 %%EOF |
| 62 """ |
| 63 |
| 64 def output_field( f ): |
| 65 return "\xfe\xff" + "".join( [ "\x00"+c for c in f ] ) |
| 66 |
| 67 def extract_keys(lines): |
| 68 keys = [] |
| 69 for line in lines: |
| 70 if line.startswith('/V'): |
| 71 pass #print 'value',line |
| 72 elif line.startswith('/T'): |
| 73 key = line[7:-2] |
| 74 key = ''.join(key.split('\x00')) |
| 75 keys.append( key ) |
| 76 return keys |
| 77 |
| 78 def write_field(out, key, value): |
| 79 out.write("<<\n") |
| 80 if value: |
| 81 out.write("/V (%s)\n" %value) |
| 82 else: |
| 83 out.write("/V /\n") |
| 84 out.write("/T (%s)\n" % output_field(key) ) |
| 85 out.write(">> \n") |
| 86 |
| 87 def write_fields(out, fields): |
| 88 out.write(HEAD) |
| 89 for (key, value, comment) in fields: |
| 90 write_field(out, key, value) |
| 91 write_field(out, key+"a", value) # pour copie-carbone sur autres pages |
| 92 out.write(TAIL) |
| 93 |
| 94 def extract_keys_from_pdf(filename): |
| 95 # what about using 'pdftk filename dump_data_fields' and parsing the output
? |
| 96 os.system('pdftk %s generate_fdf output /tmp/toto.fdf' % filename) |
| 97 lines = file('/tmp/toto.fdf').readlines() |
| 98 return extract_keys(lines) |
| 99 |
| 100 |
| 101 def fill_pdf(infile, outfile, fields): |
| 102 write_fields(file('/tmp/toto.fdf', 'w'), fields) |
| 103 os.system('pdftk %s fill_form /tmp/toto.fdf output %s flatten' % (infile, ou
tfile)) |
| 104 |
| 105 def testfill_pdf(infile, outfile): |
| 106 keys = extract_keys_from_pdf(infile) |
| 107 fields = [] |
| 108 for key in keys: |
| 109 fields.append( (key, key, '') ) |
| 110 fill_pdf(infile, outfile, fields) |
| 111 |
OLD | NEW |