2 # -*- coding: ISO-8859-1 -*-
5 # Copyright (C) 2005-2006 Jörg Lehmann <joergl@users.sourceforge.net>
6 # Copyright (C) 2005-2006 André Wobst <wobsta@users.sourceforge.net>
8 # This file is part of PyX (http://pyx.sourceforge.net/).
10 # PyX is free software; you can redistribute it and/or modify
11 # it under the terms of the GNU General Public License as published by
12 # the Free Software Foundation; either version 2 of the License, or
13 # (at your option) any later version.
15 # PyX is distributed in the hope that it will be useful,
16 # but WITHOUT ANY WARRANTY; without even the implied warranty of
17 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 # GNU General Public License for more details.
20 # You should have received a copy of the GNU General Public License
21 # along with PyX; if not, write to the Free Software
22 # Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA
24 import cStringIO
, copy
, warnings
, time
31 import bbox
, unit
, style
, type1font
, version
36 # fallback implementation for Python 2.2 and below
38 return zip(xrange(len(list)), list)
45 # we want to keep the order of the resources
47 self
.pageresources
= {}
48 self
.pageprocsets
= {}
50 def add(self
, resource
):
51 """ register resource, merging it with an already registered resource of the same type and id """
52 resources
= self
.types
.setdefault(resource
.type, {})
53 if resources
.has_key(resource
.id):
54 resources
[resource
.id].merge(resource
)
56 self
.resources
.append(resource
)
57 resources
[resource
.id] = resource
def getrefno(self, resource):
    """Return the reference number stored in the registry for *resource*.

    The lookup is keyed by ``resource.type`` and then ``resource.id`` in
    ``self.types``; the ``refno`` of the object found under that key is
    returned, which need not be the very instance passed in.
    """
    same_type = self.types[resource.type]
    registered = same_type[resource.id]
    return registered.refno
62 def mergeregistry(self
, registry
):
63 for resource
in registry
.resources
:
66 def write(self
, file, writer
, catalog
):
67 # first we set all refnos
69 for resource
in self
.resources
:
70 resource
.refno
= refno
73 # second, all objects are written, keeping the positions in the output file
75 for resource
in self
.resources
:
76 fileposes
.append(file.tell())
77 file.write("%i 0 obj\n" % resource
.refno
)
78 resource
.write(file, writer
, self
)
79 file.write("endobj\n")
85 "0000000000 65535 f \n" % refno
)
87 for filepos
in fileposes
:
88 file.write("%010i 00000 n \n" % filepos
)
91 file.write("trailer\n"
94 file.write("/Root %i 0 R\n" % self
.getrefno(catalog
))
95 file.write("/Info %i 0 R\n" % self
.getrefno(catalog
.PDFinfo
))
104 def __init__(self
, type, _id
=None):
105 """create a PDFobject
106 - type has to be a string describing the type of the object
107 - _id is a unique identification used for the object if it is not None.
108 Otherwise id(self) is used
109 - If pageresource is not None, it has to be a string describing the name
110 of the resource to be included in the resource dictionary of the pages
111 including the PDFobject.
112 - If pageprocset is not None, it has to be a string describing the name
113 to be used in the ProcSet list of the pages including the PDFObject.
121 def merge(self
, other
):
def write(self, file, writer, registry):
    """Placeholder for the object's output routine; always raises.

    Subclasses have to override this method. The base implementation
    ignores all its arguments and raises NotImplementedError.
    """
    message = "write method has to be provided by PDFobject subclass"
    raise NotImplementedError(message)
128 class PDFcatalog(PDFobject
):
def __init__(self, document, writer, registry):
    """Set up the catalog together with its pages and info objects.

    After initialising the base class with the type string "catalog",
    a PDFpages object is built from document, writer and registry and
    a PDFinfo object is created. Each is stored on the catalog
    (``self.PDFpages``, ``self.PDFinfo``) and added to *registry* right
    after its creation, pages first.
    """
    PDFobject.__init__(self, "catalog")

    # the pages object is created and registered before the info object
    pages = self.PDFpages = PDFpages(document, writer, registry)
    registry.add(pages)

    info = self.PDFinfo = PDFinfo()
    registry.add(info)
137 def write(self
, file, writer
, registry
):
140 "/Pages %i 0 R\n" % registry
.getrefno(self
.PDFpages
))
141 if writer
.fullscreen
:
142 file.write("/PageMode /FullScreen\n")
146 class PDFinfo(PDFobject
):
149 PDFobject
.__init
__(self
, "info")
151 def write(self
, file, writer
, registry
):
152 if time
.timezone
< 0:
153 # divmod on positive numbers, otherwise the minutes have a different sign from the hours
154 timezone
= "-%02i'%02i'" % divmod(-time
.timezone
/60, 60)
155 elif time
.timezone
> 0:
156 timezone
= "+%02i'%02i'" % divmod(time
.timezone
/60, 60)
163 if 32 <= ord(c
) <= 127 and c
not in "()[]<>\\":
166 r
+= "\\%03o" % ord(c
)
171 file.write("/Title (%s)\n" % pdfstring(writer
.title
))
173 file.write("/Author (%s)\n" % pdfstring(writer
.author
))
175 file.write("/Subject (%s)\n" % pdfstring(writer
.subject
))
177 file.write("/Keywords (%s)\n" % pdfstring(writer
.keywords
))
178 file.write("/Creator (PyX %s)\n" % version
.version
)
179 file.write("/CreationDate (D:%s%s)\n" % (time
.strftime("%Y%m%d%H%M"), timezone
))
183 class PDFpages(PDFobject
):
185 def __init__(self
, document
, writer
, registry
):
186 PDFobject
.__init
__(self
, "pages")
187 self
.PDFpagelist
= []
188 for pageno
, page
in enumerate(document
.pages
):
189 page
= PDFpage(page
, pageno
, self
, writer
, registry
)
191 self
.PDFpagelist
.append(page
)
193 def write(self
, file, writer
, registry
):
198 ">>\n" % (" ".join(["%i 0 R" % registry
.getrefno(page
)
199 for page
in self
.PDFpagelist
]),
200 len(self
.PDFpagelist
)))
203 class PDFpage(PDFobject
):
205 def __init__(self
, page
, pageno
, PDFpages
, writer
, registry
):
206 PDFobject
.__init
__(self
, "page")
207 self
.PDFpages
= PDFpages
210 # every page uses its own registry in order to find out which
211 # resources are used within the page. However, the
212 # pageregistry is also merged in the global registry
213 self
.pageregistry
= PDFregistry()
215 self
.PDFcontent
= PDFcontent(page
, writer
, self
.pageregistry
)
216 self
.pageregistry
.add(self
.PDFcontent
)
217 registry
.mergeregistry(self
.pageregistry
)
219 def write(self
, file, writer
, registry
):
222 "/Parent %i 0 R\n" % registry
.getrefno(self
.PDFpages
))
223 paperformat
= self
.page
.paperformat
225 file.write("/MediaBox [0 0 %f %f]\n" % (unit
.topt(paperformat
.width
), unit
.topt(paperformat
.height
)))
227 file.write("/MediaBox [%f %f %f %f]\n" % self
.PDFcontent
.transformedbbox
.highrestuple_pt())
228 if self
.PDFcontent
.transformedbbox
and writer
.writebbox
:
229 file.write("/CropBox [%f %f %f %f]\n" % self
.PDFcontent
.transformedbbox
.highrestuple_pt())
230 file.write("/Resources <<\n"
231 "/ProcSet [ /PDF %s ]\n" % " ".join(["/%s" % p
for p
in self
.pageregistry
.pageprocsets
.keys()]))
232 for pageresource
, resources
in self
.pageregistry
.pageresources
.items():
233 file.write("/%s <<\n%s\n>>\n" % (pageresource
, "\n".join(["/%s %i 0 R" % (name
, registry
.getrefno(resource
))
234 for name
, resource
in resources
.items()])))
237 ">>\n" % registry
.getrefno(self
.PDFcontent
))
240 class PDFcontent(PDFobject
):
242 def __init__(self
, page
, writer
, registry
):
243 PDFobject
.__init
__(self
, registry
, "content")
245 self
.contentfile
= cStringIO
.StringIO()
246 # XXX this should maybe be handled by the page since removing
247 # this code would allow us to (nearly, since we also need to
248 # set more info in the content dict) reuse PDFcontent for
250 self
.bbox
= bbox
.empty()
252 style
.linewidth
.normal
.processPDF(self
.contentfile
, writer
, acontext
, registry
, self
.bbox
)
254 page
.canvas
.processPDF(self
.contentfile
, writer
, acontext
, registry
, self
.bbox
)
256 self
.pagetrafo
= page
.pagetrafo(self
.bbox
)
258 self
.transformedbbox
= self
.bbox
.transformed(self
.pagetrafo
)
260 self
.transformedbbox
= self
.bbox
262 def write(self
, file, writer
, registry
):
263 # apply a possible global transformation
265 pagetrafofile
= cStringIO
.StringIO()
266 self
.pagetrafo
.processPDF(pagetrafofile
, writer
, context(), registry
, bbox
.empty())
267 content
= pagetrafofile
.getvalue() + self
.contentfile
.getvalue()
268 pagetrafofile
.close()
270 content
= self
.contentfile
.getvalue()
271 self
.contentfile
.close()
274 content
= zlib
.compress(content
)
277 "/Length %i\n" % len(content
))
279 file.write("/Filter /FlateDecode\n")
283 file.write("endstream\n")
286 class PDFfont(PDFobject
):
288 def __init__(self
, font
, chars
, writer
, registry
):
289 PDFobject
.__init
__(self
, "font", font
.name
)
290 registry
.pageprocsets
["Text"] = 1
291 registry
.pageresources
.setdefault("Font", {})[font
.name
] = self
293 self
.fontdescriptor
= PDFfontdescriptor(font
, chars
, writer
, registry
)
294 registry
.add(self
.fontdescriptor
)
297 self
.encoding
= PDFencoding(font
.encoding
, writer
, registry
)
298 registry
.add(self
.encoding
)
302 self
.name
= font
.name
303 self
.basefontname
= font
.basefontname
304 self
.metric
= font
.metric
306 def write(self
, file, writer
, registry
):
310 file.write("/Name /%s\n" % self
.name
)
311 file.write("/BaseFont /%s\n" % self
.basefontname
)
312 if self
.fontdescriptor
.fontfile
is not None and self
.fontdescriptor
.fontfile
.usedchars
is not None:
313 usedchars
= self
.fontdescriptor
.fontfile
.usedchars
314 firstchar
= min(usedchars
.keys())
315 lastchar
= max(usedchars
.keys())
316 file.write("/FirstChar %d\n" % firstchar
)
317 file.write("/LastChar %d\n" % lastchar
)
318 file.write("/Widths\n"
320 for i
in range(firstchar
, lastchar
+1):
321 if i
and not (i
% 8):
325 if usedchars
.has_key(i
):
326 file.write("%f" % self
.metric
.getwidth_ds(i
))
331 file.write("/FirstChar 0\n"
336 if i
and not (i
% 8):
341 width
= self
.metric
.getwidth_ds(i
)
342 except (IndexError, AttributeError):
344 file.write("%f" % width
)
346 file.write("/FontDescriptor %d 0 R\n" % registry
.getrefno(self
.fontdescriptor
))
348 file.write("/Encoding %d 0 R\n" % registry
.getrefno(self
.encoding
))
352 class PDFfontdescriptor(PDFobject
):
354 def __init__(self
, font
, chars
, writer
, registry
):
355 PDFobject
.__init
__(self
, "fontdescriptor", font
.basefontname
)
357 if font
.filename
is None:
360 self
.fontfile
= PDFfontfile(font
.basefontname
, font
.filename
, font
.encoding
, chars
, writer
, registry
)
361 registry
.add(self
.fontfile
)
363 self
.name
= font
.basefontname
364 self
.fontinfo
= font
.metric
.fontinfo()
366 def write(self
, file, writer
, registry
):
368 "/Type /FontDescriptor\n"
369 "/FontName /%s\n" % self
.name
)
370 if self
.fontfile
is None:
371 file.write("/Flags 32\n")
373 file.write("/Flags %d\n" % self
.fontfile
.getflags())
374 file.write("/FontBBox [%d %d %d %d]\n" % self
.fontinfo
.fontbbox
)
375 file.write("/ItalicAngle %d\n" % self
.fontinfo
.italicangle
)
376 file.write("/Ascent %d\n" % self
.fontinfo
.ascent
)
377 file.write("/Descent %d\n" % self
.fontinfo
.descent
)
378 file.write("/CapHeight %d\n" % self
.fontinfo
.capheight
)
379 file.write("/StemV %d\n" % self
.fontinfo
.vstem
)
380 if self
.fontfile
is not None:
381 file.write("/FontFile %d 0 R\n" % registry
.getrefno(self
.fontfile
))
385 class PDFfontfile(PDFobject
):
387 def __init__(self
, name
, filename
, encoding
, chars
, writer
, registry
):
388 PDFobject
.__init
__(self
, "fontfile", filename
)
390 self
.filename
= filename
392 self
.encodingfilename
= None
394 self
.encodingfilename
= encoding
.filename
397 self
.usedchars
[char
] = 1
402 def merge(self
, other
):
403 if self
.encodingfilename
== other
.encodingfilename
:
404 self
.usedchars
.update(other
.usedchars
)
406 # TODO: need to resolve the encoding when several encodings are in play
409 def mkfontfile(self
):
411 self
.font
= font
.t1font
.T1pfbfont(self
.filename
)
414 if self
.font
is None:
416 return self
.font
.getflags()
418 def write(self
, file, writer
, registry
):
419 if self
.font
is None:
422 # XXX: access to the encoding file
423 if self
.encodingfilename
:
424 encodingfile
= type1font
.encodingfile(self
.encodingfilename
, self
.encodingfilename
)
425 usedglyphs
= [encodingfile
.decode(char
)[1:] for char
in self
.usedchars
.keys()]
427 self
.font
._encoding
()
428 usedglyphs
= [self
.font
.encoding
.decode(char
) for char
in self
.usedchars
.keys()]
429 strippedfont
= self
.font
.getstrippedfont(usedglyphs
)
431 strippedfont
= self
.font
432 strippedfont
.outputPDF(file, writer
)
class PDFencoding(PDFobject):
    """PDFobject wrapping a font encoding."""

    def __init__(self, encoding, writer, registry):
        """Initialise the base class and keep a reference to *encoding*.

        The base class is set up with the type string "encoding" and
        ``encoding.name`` as the ``_id`` argument. writer and registry
        are accepted but not used here.
        """
        PDFobject.__init__(self, "encoding", encoding.name)
        self.encoding = encoding

    def write(self, file, writer, registry):
        """Emit the encoding to *file*.

        A type1font.encodingfile is created from the name and filename
        of the stored encoding, and its outputPDF method is called with
        file and writer. registry is not used.
        """
        source = self.encoding
        type1font.encodingfile(source.name, source.filename).outputPDF(file, writer)
448 def __init__(self
, document
, filename
,
449 title
=None, author
=None, subject
=None, keywords
=None,
450 fullscreen
=0, writebbox
=0, compress
=1, compresslevel
=6):
451 if not filename
.endswith(".pdf"):
452 filename
= filename
+ ".pdf"
454 file = open(filename
, "wb")
456 raise IOError("cannot open output file")
460 self
.subject
= subject
461 self
.keywords
= keywords
462 self
.fullscreen
= fullscreen
463 self
.writebbox
= writebbox
464 if compress
and not haszlib
:
466 warnings
.warn("compression disabled due to missing zlib module")
467 self
.compress
= compress
468 self
.compresslevel
= compresslevel
470 # the PDFcatalog class automatically builds up the pdfobjects from a document
471 registry
= PDFregistry()
472 catalog
= PDFcatalog(document
, self
, registry
)
473 registry
.add(catalog
)
475 file.write("%%PDF-1.4\n%%%s%s%s%s\n" % (chr(195), chr(182), chr(195), chr(169)))
476 registry
.write(file, self
, catalog
)
483 self
.linewidth_pt
= None
484 # XXX there are both stroke and fill color spaces
485 self
.colorspace
= None
491 def __call__(self
, **kwargs
):
492 newcontext
= copy
.copy(self
)
493 for key
, value
in kwargs
.items():
494 setattr(newcontext
, key
, value
)