#!/usr/bin/python
"""Extract the plain text of OpenOffice/OpenDocument files.

An OpenDocument file is a zip archive; this script reads its
``content.xml`` member, strips every XML tag and collapses whitespace.
Run it with one or more document paths to print each document's text.
"""
import re
import sys
import zipfile

# Matches a single XML/HTML-style tag: '<', any run of non-'>' characters, '>'.
rx_stripxml = re.compile("<[^>]*?>", re.DOTALL|re.MULTILINE)


def convert_OO(filename):
    """Convert an OpenOffice document into plain text.

    Args:
        filename: Path to the document (a zip archive that contains a
            ``content.xml`` member).

    Returns:
        The content of ``content.xml`` as a native ``str``, with every tag
        replaced by a space and all whitespace runs collapsed to single
        spaces. XML entities (e.g. ``&amp;``) are left as they appear in
        the file.

    Raises:
        IOError/OSError: The file cannot be opened.
        zipfile.BadZipfile: The file is not a zip archive.
        KeyError: The archive has no ``content.xml`` member.
    """
    # The context manager closes the archive even when read() raises.
    with zipfile.ZipFile(filename, "r") as zf:
        data = zf.read("content.xml")
    # On Python 3 read() returns bytes, which the str pattern cannot be
    # applied to; on Python 2 it is already the native str type and is left
    # untouched.
    if not isinstance(data, str):
        data = data.decode("utf-8", "replace")
    return " ".join(rx_stripxml.sub(" ", data).split())


def main(argv=None):
    """Print the text of every document path given on the command line.

    Args:
        argv: Document paths to process; defaults to ``sys.argv[1:]``.
    """
    if argv is None:
        argv = sys.argv[1:]
    if not argv:
        print('Call with paths to openoffice doc files to see Text form.')
        return
    for docname in argv:
        # Single-argument print(...) behaves the same on Python 2 and 3.
        print('Text of %s :' % (docname,))
        try:
            text = convert_OO(docname)
        # Only the failures the message describes are handled; anything else
        # (including Ctrl-C) propagates. ``BadZipfile`` is the spelling that
        # exists on both Python 2 and Python 3.
        except (IOError, OSError, KeyError, zipfile.BadZipfile):
            print("That file doesn't exist, or is not a .odt")
        else:
            print(text)


if __name__ == "__main__":
    main()