Context Navigation

ooo.py @ 357

Revision 357, 3.0 kB (checked in by jerome, 18 years ago)
Added missing docstrings, thanks to pylint.
Property svn:eol-style set to `native` Property svn:keywords set to `Author Date Id Revision`

Rev	Line
[232]	1	#! /usr/bin/env python
	2	# -- coding: ISO-8859-15 --
	3	#
	4	# pkpgcounter : a generic Page Description Language parser
	5	#
[303]	6	# (c) 2003, 2004, 2005, 2006 Jerome Alet <alet@librelogiciel.com>
[232]	7	# This program is free software; you can redistribute it and/or modify
	8	# it under the terms of the GNU General Public License as published by
	9	# the Free Software Foundation; either version 2 of the License, or
	10	# (at your option) any later version.
	11	#
	12	# This program is distributed in the hope that it will be useful,
	13	# but WITHOUT ANY WARRANTY; without even the implied warranty of
	14	# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
	15	# GNU General Public License for more details.
	16	#
	17	# You should have received a copy of the GNU General Public License
	18	# along with this program; if not, write to the Free Software
	19	# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
	20	#
	21	# $Id$
	22	#
	23
[357]	24	"""This module implements a page counter for OpenDocument documents."""
	25
[232]	26	import sys
	27	import zipfile
	28
[235]	29	import pdlparser
[232]	30
	31	class Parser(pdlparser.PDLParser) :
	32	"""A parser for OpenOffice.org documents."""
	33	def isValid(self) :
	34	"""Returns 1 if data is DVI, else 0."""
	35	if self.firstblock[:2] == "PK" :
	36	try :
	37	self.archive = zipfile.ZipFile(self.infile)
	38	self.contentxml = self.archive.read("content.xml")
	39	self.metaxml = self.archive.read("meta.xml")
	40	except :
	41	return 0
	42	else :
[252]	43	self.logdebug("DEBUG: Input file is in the OpenOffice.org format.")
[232]	44	return 1
	45	else :
	46	return 0
	47
	48	def getJobSize(self) :
	49	"""Counts pages in an OpenOffice.org document.
	50
	51	Algorithm by Jerome Alet.
	52	"""
	53	pagecount = 0
	54	try :
	55	# First try with Text documents
	56	index = self.metaxml.index("meta:page-count=")
	57	pagecount = int(self.metaxml[index:].split('"')[1])
	58	except :
	59	# Now try with Impress documents
	60	pagecount = self.contentxml.count("<draw:page ")
	61	if not pagecount :
	62	# Probably a Spreadsheet document
	63	raise pdlparser.PDLParserError, "OpenOffice.org's spreadsheet documents are not yet supported."
	64	return pagecount
	65
	66	def test() :
	67	"""Test function."""
	68	if (len(sys.argv) < 2) or ((not sys.stdin.isatty()) and ("-" not in sys.argv[1:])) :
	69	sys.argv.append("-")
	70	totalsize = 0
	71	for arg in sys.argv[1:] :
	72	if arg == "-" :
	73	infile = sys.stdin
	74	mustclose = 0
	75	else :
	76	infile = open(arg, "rb")
	77	mustclose = 1
	78	try :
	79	parser = Parser(infile, debug=1)
	80	totalsize += parser.getJobSize()
	81	except pdlparser.PDLParserError, msg :
	82	sys.stderr.write("ERROR: %s\n" % msg)
	83	sys.stderr.flush()
	84	if mustclose :
	85	infile.close()
	86	print "%s" % totalsize
	87
	88	if __name__ == "__main__" :
	89	test()

Note: See TracBrowser for help on using the browser.

Context Navigation

root / pkpgcounter / trunk / pkpgpdls / ooo.py @ 357

Download in other formats: