| OLD | NEW |
| (Empty) |
| 1 # copyright 2003-2011 LOGILAB S.A. (Paris, FRANCE), all rights reserved. | |
| 2 # contact http://www.logilab.fr/ -- mailto:contact@logilab.fr | |
| 3 # | |
| 4 # This file is part of logilab-common. | |
| 5 # | |
| 6 # logilab-common is free software: you can redistribute it and/or modify it unde
r | |
| 7 # the terms of the GNU Lesser General Public License as published by the Free | |
| 8 # Software Foundation, either version 2.1 of the License, or (at your option) an
y | |
| 9 # later version. | |
| 10 # | |
| 11 # logilab-common is distributed in the hope that it will be useful, but WITHOUT | |
| 12 # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS | |
| 13 # FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for more | |
| 14 # details. | |
| 15 # | |
| 16 # You should have received a copy of the GNU Lesser General Public License along | |
| 17 # with logilab-common. If not, see <http://www.gnu.org/licenses/>. | |
| 18 """Manipulate pdf and fdf files (pdftk recommended). | |
| 19 | |
| 20 Notes regarding pdftk, pdf forms and fdf files (form definition file) | |
| 21 fields names can be extracted with: | |
| 22 | |
| 23 pdftk orig.pdf generate_fdf output truc.fdf | |
| 24 | |
| 25 to merge fdf and pdf: | |
| 26 | |
| 27 pdftk orig.pdf fill_form test.fdf output result.pdf [flatten] | |
| 28 | |
| 29 without flatten, one could further edit the resulting form. | |
| 30 with flatten, everything is turned into text. | |
| 31 | |
| 32 | |
| 33 | |
| 34 | |
| 35 """ | |
| 36 __docformat__ = "restructuredtext en" | |
| 37 # XXX seems very unix specific | |
| 38 # TODO: check availability of pdftk at import | |
| 39 | |
| 40 | |
| 41 import os | |
| 42 | |
| 43 HEAD="""%FDF-1.2 | |
| 44 %\xE2\xE3\xCF\xD3 | |
| 45 1 0 obj | |
| 46 << | |
| 47 /FDF | |
| 48 << | |
| 49 /Fields [ | |
| 50 """ | |
| 51 | |
| 52 TAIL="""] | |
| 53 >> | |
| 54 >> | |
| 55 endobj | |
| 56 trailer | |
| 57 | |
| 58 << | |
| 59 /Root 1 0 R | |
| 60 >> | |
| 61 %%EOF | |
| 62 """ | |
| 63 | |
| 64 def output_field( f ): | |
| 65 return "\xfe\xff" + "".join( [ "\x00"+c for c in f ] ) | |
| 66 | |
| 67 def extract_keys(lines): | |
| 68 keys = [] | |
| 69 for line in lines: | |
| 70 if line.startswith('/V'): | |
| 71 pass #print 'value',line | |
| 72 elif line.startswith('/T'): | |
| 73 key = line[7:-2] | |
| 74 key = ''.join(key.split('\x00')) | |
| 75 keys.append( key ) | |
| 76 return keys | |
| 77 | |
| 78 def write_field(out, key, value): | |
| 79 out.write("<<\n") | |
| 80 if value: | |
| 81 out.write("/V (%s)\n" %value) | |
| 82 else: | |
| 83 out.write("/V /\n") | |
| 84 out.write("/T (%s)\n" % output_field(key) ) | |
| 85 out.write(">> \n") | |
| 86 | |
| 87 def write_fields(out, fields): | |
| 88 out.write(HEAD) | |
| 89 for (key, value, comment) in fields: | |
| 90 write_field(out, key, value) | |
| 91 write_field(out, key+"a", value) # pour copie-carbone sur autres pages | |
| 92 out.write(TAIL) | |
| 93 | |
| 94 def extract_keys_from_pdf(filename): | |
| 95 # what about using 'pdftk filename dump_data_fields' and parsing the output
? | |
| 96 os.system('pdftk %s generate_fdf output /tmp/toto.fdf' % filename) | |
| 97 lines = file('/tmp/toto.fdf').readlines() | |
| 98 return extract_keys(lines) | |
| 99 | |
| 100 | |
| 101 def fill_pdf(infile, outfile, fields): | |
| 102 write_fields(file('/tmp/toto.fdf', 'w'), fields) | |
| 103 os.system('pdftk %s fill_form /tmp/toto.fdf output %s flatten' % (infile, ou
tfile)) | |
| 104 | |
| 105 def testfill_pdf(infile, outfile): | |
| 106 keys = extract_keys_from_pdf(infile) | |
| 107 fields = [] | |
| 108 for key in keys: | |
| 109 fields.append( (key, key, '') ) | |
| 110 fill_pdf(infile, outfile, fields) | |
| 111 | |
| OLD | NEW |