mirror of
https://github.com/olivierkes/manuskript.git
synced 2024-10-01 17:56:46 +13:00
120 lines
3.7 KiB
Python
120 lines
3.7 KiB
Python
#!/usr/bin/python
|
|
# -*- coding: utf-8 -*-
|
|
# Copyright (C) 2006-2007 Søren Roug, European Environment Agency
|
|
#
|
|
# This library is free software; you can redistribute it and/or
|
|
# modify it under the terms of the GNU Lesser General Public
|
|
# License as published by the Free Software Foundation; either
|
|
# version 2.1 of the License, or (at your option) any later version.
|
|
#
|
|
# This library is distributed in the hope that it will be useful,
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
# Lesser General Public License for more details.
|
|
#
|
|
# You should have received a copy of the GNU Lesser General Public
|
|
# License along with this library; if not, write to the Free Software
|
|
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
#
|
|
# Contributor(s):
|
|
#
|
|
from __future__ import print_function
|
|
# This script lists the content of the manifest.xml file
|
|
import zipfile
|
|
from xml.sax import make_parser,handler
|
|
from xml.sax.xmlreader import InputSource
|
|
import xml.sax.saxutils
|
|
try:
|
|
from cStringIO import StringIO
|
|
except ImportError:
|
|
from io import StringIO
|
|
|
|
MANIFESTNS="urn:oasis:names:tc:opendocument:xmlns:manifest:1.0"
|
|
|
|
#-----------------------------------------------------------------------------
|
|
#
|
|
# ODFMANIFESTHANDLER
|
|
#
|
|
#-----------------------------------------------------------------------------
|
|
|
|
class ODFManifestHandler(handler.ContentHandler):
    """SAX content handler that collects the file entries of an ODF manifest.

    While a document is parsed, every ``file-entry`` element in the manifest
    namespace is recorded in ``self.manifest``, a dict keyed by the entry's
    ``full-path`` attribute. Each value is a dict with the keys
    ``'media-type'`` and ``'full-path'``.
    """

    def __init__(self):
        # Run the base-class initialiser so the handler carries the state
        # ContentHandler sets up. It is called through the class rather than
        # zero-argument super() because this file still keeps Python 2
        # fallbacks (cStringIO, __future__ import).
        handler.ContentHandler.__init__(self)

        # full-path -> {'media-type': ..., 'full-path': ...}
        self.manifest = {}

        # Tags
        # FIXME: Also handle encryption data
        # Maps an expanded (namespace, localname) tag to a pair of
        # (start-callback, end-callback).
        self.elements = {
            (MANIFESTNS, 'file-entry'): (self.s_file_entry, self.donothing),
        }

    def handle_starttag(self, tag, method, attrs):
        """Invoke the start callback *method* for *tag* with its *attrs*."""
        method(tag, attrs)

    def handle_endtag(self, tag, method):
        """Invoke the end callback *method* for *tag*."""
        method(tag)

    def startElementNS(self, tag, qname, attrs):
        """Dispatch an element start to its registered callback.

        *tag* is the (namespace, localname) pair used as the key into
        ``self.elements``; *qname* is not used. Tags without a registered
        callback are passed to ``unknown_starttag``.
        """
        method = self.elements.get(tag, (None, None))[0]
        if method:
            self.handle_starttag(tag, method, attrs)
        else:
            self.unknown_starttag(tag, attrs)

    def endElementNS(self, tag, qname):
        """Dispatch an element end to its registered callback.

        Tags without a registered callback are passed to ``unknown_endtag``;
        *qname* is not used.
        """
        method = self.elements.get(tag, (None, None))[1]
        if method:
            self.handle_endtag(tag, method)
        else:
            self.unknown_endtag(tag)

    def unknown_starttag(self, tag, attrs):
        """Ignore the start of an element that has no registered callback."""
        pass

    def unknown_endtag(self, tag):
        """Ignore the end of an element that has no registered callback."""
        pass

    def donothing(self, tag, attrs=None):
        """No-op callback usable in either the start or the end slot."""
        pass

    def s_file_entry(self, tag, attrs):
        """Record one ``file-entry`` element in ``self.manifest``.

        The media type falls back to ``application/octet-stream`` when the
        attribute is absent. The entry is stored under its ``full-path``
        value (``None`` if that attribute is missing).
        """
        m = attrs.get((MANIFESTNS, 'media-type'), "application/octet-stream")
        p = attrs.get((MANIFESTNS, 'full-path'))
        self.manifest[p] = {'media-type': m, 'full-path': p}
|
|
|
|
|
|
#-----------------------------------------------------------------------------
|
|
#
|
|
# Reading the file
|
|
#
|
|
#-----------------------------------------------------------------------------
|
|
|
|
def manifestlist(manifestxml):
    """Parse the content of a manifest.xml and return its file entries.

    Args:
        manifestxml: The manifest document, as bytes (or bytearray) or as
            text.

    Returns:
        The ``manifest`` dict built by ODFManifestHandler: one item per
        ``file-entry`` element, keyed by its ``full-path``.

    Raises:
        Whatever the SAX parser raises for a malformed document; the
        default ``handler.ErrorHandler`` is installed.
    """
    odhandler = ODFManifestHandler()
    parser = make_parser()
    parser.setFeature(handler.feature_namespaces, 1)
    parser.setContentHandler(odhandler)
    parser.setErrorHandler(handler.ErrorHandler())

    inpsrc = InputSource()
    if isinstance(manifestxml, (bytes, bytearray)):
        # Hand raw bytes to the parser untouched so it can honour the
        # document's own XML encoding declaration, instead of assuming
        # UTF-8 and failing on anything else.
        from io import BytesIO
        inpsrc.setByteStream(BytesIO(manifestxml))
    else:
        # Text input is passed through a StringIO exactly as before.
        inpsrc.setByteStream(StringIO(manifestxml))
    parser.parse(inpsrc)

    return odhandler.manifest
|
|
|
|
def odfmanifest(odtfile):
    """Read and parse the manifest of an ODF package.

    Args:
        odtfile: Anything ``zipfile.ZipFile`` accepts as its first argument
            (a path or a file-like object).

    Returns:
        The dict produced by ``manifestlist`` for the archive member
        ``META-INF/manifest.xml``.

    Raises:
        KeyError: If the archive has no ``META-INF/manifest.xml`` member.
    """
    # The with-block closes the archive even when read() raises.
    with zipfile.ZipFile(odtfile) as z:
        manifest = z.read('META-INF/manifest.xml')
    return manifestlist(manifest)
|
|
|
|
if __name__ == "__main__":
    # Command-line use: print the media type and path of every manifest
    # entry of the ODF file named by the first argument.
    import sys

    if len(sys.argv) < 2:
        # Exit with a readable message instead of an IndexError traceback.
        sys.exit("Usage: %s <odf-file>" % sys.argv[0])

    result = odfmanifest(sys.argv[1])
    for entry in result.values():
        print ("%-40s %-40s" % (entry['media-type'], entry['full-path']))
|
|
|