![]() ![]() |
Sie sind hier: TeilnehmerInnen > Volkers Bereich > Artikel > pyuno-Konverter pyuno-KonverterKonvertiert Winword-Doc oder OpenOffice-SXW nach HTML oder PDF. M�glich ist auch die Konvertierung von HTML nach PDF Das Script erweitert http://www.zopelabs.com/cookbook/1070039713 um einige Filter. Voraussetzung ist eine laufende OpenOffice-Installation mit pyuno. Download: convert.py import getopt,sys import uno from unohelper import Base,systemPathToFileUrl, absolutize from os import getcwd from com.sun.star.beans import PropertyValue from com.sun.star.beans.PropertyState import DIRECT_VALUE from com.sun.star.uno import Exception as UnoException from com.sun.star.io import IOException,XInputStream, XOutputStream class OutputStream( Base, XOutputStream ): def __init__( self ): self.closed = 0 def closeOutput(self): self.closed = 1 def writeBytes( self, seq ): sys.stdout.write( seq.value ) def flush( self ): pass def main(): retVal = 0 doc = None try: opts, args = getopt.getopt(sys.argv[1:], "hc:",["help", "connection-string=" , "html", "htmltopdf","pdf"]) format = None url = "uno:socket,host=localhost,port=2002;urp;StarOffice.ComponentContext" filterName = "Text (Encoded)" for o, a in opts: if o in ("-h", "--help"): usage() sys.exit() if o in ("-c", "--connection-string" ): url = "uno:" + a + ";urp;StarOffice.ComponentContext" if o == "--html": filterName = "HTML (StarWriter)" if o == "--htmltopdf": filterName = "writer_web_pdf_export" if o == "--pdf": filterName = "writer_pdf_export" #print filterName if not len( args ): usage() sys.exit() ctxLocal = uno.getComponentContext() smgrLocal = ctxLocal.ServiceManager resolver = smgrLocal.createInstanceWithContext( "com.sun.star.bridge.UnoUrlResolver", ctxLocal ) ctx = resolver.resolve( url ) smgr = ctx.ServiceManager desktop = smgr.createInstanceWithContext("com.sun.star.frame.Desktop", ctx ) cwd = systemPathToFileUrl( getcwd() ) outProps = ( PropertyValue( "FilterName" , 0, filterName , 0 ), PropertyValue( "Overwrite" , 0, True , 0 ), PropertyValue( "OutputStream",0, OutputStream(),0)) inProps = PropertyValue( "Hidden" , 0 , True, 0 ), for path in args: try: fileUrl = uno.absolutize( cwd, systemPathToFileUrl(path) ) doc = desktop.loadComponentFromURL( fileUrl , "_blank", 0,inProps) if not doc: raise UnoException( "Couldn't open stream for unknown reason", None ) if filterName == "Text (Encoded)": doc.storeToURL('%s.txt' % fileUrl,outProps) if filterName == "HTML (StarWriter)": doc.storeToURL('%s.html' % fileUrl,outProps) if filterName == "writer_pdf_export": doc.storeToURL('%s.pdf' % fileUrl,outProps) if filterName == "writer_web_pdf_export": doc.storeToURL('%s.pdf' % fileUrl,outProps) except IOException, e: sys.stderr.write( "Error during conversion: " + e.Message + "\n" ) retVal = 1 except UnoException, e: sys.stderr.write( "Error ("+repr(e.__class__)+") during conversion:" + e.Message + "\n" ) retVal = 1 if doc: doc.dispose() except UnoException, e: sys.stderr.write( "Error ("+repr(e.__class__)+") :" + e.Message + "\n" ) retVal = 1 except getopt.GetoptError,e: sys.stderr.write( str(e) + "\n" ) usage() retVal = 1 sys.exit(retVal) def usage(): sys.stderr.write( "usage: convert.py --help |\n" +\ " [-c | --connection-string=\n"+ \ " file1 file2 ...\n"+ \ "\n" + "Convert Winword-Doc \ OpenOffice-SXW.\ HTML to Plain Text \ HTML \ PDF \n" + \ "Requires an OpenOffice.org instance to be running. The script and the\n"+ \ "running OpenOffice.org instance must be able to access the file with\n"+ \ "by the same system path.\n" "\n"+ \ "-c | --connection-string=\n" + \ "The connection-string part of a uno url to where the\n" + \ "the script should connect to in order to do the conversion.\n" + \ "The strings defaults to socket,host=localhost,port=2002\n" \ "--html \n" + \ "Instead of the plain-text filter, the writer html filter is used\n" "--pdf \n" + \ "Instead of the plain-text filter, the writer pdf filter is used\n" "--htmltopdf \n" + \ "Instead of the plain-text filter, the writer_web pdf filter is used\n" ) main() Geschrieben von vbachs . Letzte �nderung 21.12.2003 17:27. |