Context Navigation

ooo.py @ 357

Revision 357, 3.0 kB (checked in by jerome, 18 years ago)
Added missing docstrings, thanks to pylint.
Property svn:eol-style set to `native` Property svn:keywords set to `Author Date Id Revision`

Line
1	#! /usr/bin/env python
2	# -- coding: ISO-8859-15 --
3	#
4	# pkpgcounter : a generic Page Description Language parser
5	#
6	# (c) 2003, 2004, 2005, 2006 Jerome Alet <alet@librelogiciel.com>
7	# This program is free software; you can redistribute it and/or modify
8	# it under the terms of the GNU General Public License as published by
9	# the Free Software Foundation; either version 2 of the License, or
10	# (at your option) any later version.
11	#
12	# This program is distributed in the hope that it will be useful,
13	# but WITHOUT ANY WARRANTY; without even the implied warranty of
14	# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15	# GNU General Public License for more details.
16	#
17	# You should have received a copy of the GNU General Public License
18	# along with this program; if not, write to the Free Software
19	# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
20	#
21	# $Id$
22	#
23
24	"""This module implements a page counter for OpenDocument documents."""
25
26	import sys
27	import zipfile
28
29	import pdlparser
30
class Parser(pdlparser.PDLParser):
    """A parser for OpenOffice.org documents.

    isValid() recognises the input and loads the archive members that
    getJobSize() later inspects to count pages.
    """

    def isValid(self):
        """Tell whether the input is an OpenOffice.org document.

        The first block must start with "PK" and the input must open as
        a zip archive containing both "content.xml" and "meta.xml".
        On success the archive is kept in self.archive and the contents
        of the two members in self.contentxml and self.metaxml.

        Returns 1 if the input is accepted, else 0.
        """
        if self.firstblock[:2] != "PK":
            return 0
        try:
            self.archive = zipfile.ZipFile(self.infile)
            self.contentxml = self.archive.read("content.xml")
            self.metaxml = self.archive.read("meta.xml")
        except Exception:
            # Best-effort probe: any failure to open the archive or to
            # read a required member simply means "not our format".
            # KeyboardInterrupt and SystemExit are deliberately not caught.
            return 0
        self.logdebug("DEBUG: Input file is in the OpenOffice.org format.")
        return 1

    def getJobSize(self):
        """Count pages in an OpenOffice.org document.

        Algorithm by Jerome Alet.

        The page count is first read from the meta:page-count attribute
        of meta.xml (Text documents). When that attribute is missing or
        unparsable, the number of "<draw:page " occurrences in
        content.xml is used instead (Impress documents).

        Returns the page count.
        Raises pdlparser.PDLParserError when the resulting count is zero,
        which is taken to mean the document is a spreadsheet.
        """
        pagecount = 0
        try:
            # First try with Text documents.
            # index() raises ValueError when the attribute is absent,
            # [1] raises IndexError when no quoted value follows it,
            # and int() raises ValueError on a non numeric value.
            index = self.metaxml.index("meta:page-count=")
            pagecount = int(self.metaxml[index:].split('"')[1])
        except (ValueError, IndexError):
            # Now try with Impress documents
            pagecount = self.contentxml.count("<draw:page ")
        if not pagecount:
            # Probably a Spreadsheet document
            raise pdlparser.PDLParserError("OpenOffice.org's spreadsheet documents are not yet supported.")
        return pagecount
65
def test():
    """Test function.

    Parses every file named on the command line ("-" meaning standard
    input) and prints the sum of their page counts on standard output.
    "-" is appended to the arguments when none were given, or when
    standard input is not a terminal and "-" was not already listed.

    A pdlparser.PDLParserError is reported on standard error and the
    offending input is skipped; it does not abort the run.
    """
    if (len(sys.argv) < 2) or ((not sys.stdin.isatty()) and ("-" not in sys.argv[1:])):
        sys.argv.append("-")
    totalsize = 0
    for arg in sys.argv[1:]:
        if arg == "-":
            infile = sys.stdin
            mustclose = 0
        else:
            infile = open(arg, "rb")
            mustclose = 1
        # The nested try blocks guarantee that a file opened here is
        # closed even if an unexpected exception escapes the parser.
        try:
            try:
                parser = Parser(infile, debug=1)
                totalsize += parser.getJobSize()
            except pdlparser.PDLParserError:
                # sys.exc_info() is used instead of binding the exception
                # in the except clause so the same source is valid on
                # both old and new Python versions.
                msg = sys.exc_info()[1]
                sys.stderr.write("ERROR: %s\n" % msg)
                sys.stderr.flush()
        finally:
            if mustclose:
                infile.close()
    print("%s" % totalsize)


# Run the command line test driver when executed as a script.
if __name__ == "__main__":
    test()

Note: See TracBrowser for help on using the browser.

Context Navigation

root / pkpgcounter / trunk / pkpgpdls / ooo.py @ 357

Download in other formats: