Deutsche Zope User Group
Gast 2 Benutzer online
DZUG-News

pyuno-Konverter

Konvertiert Winword-Doc oder OpenOffice-SXW nach HTML oder PDF. M�glich ist auch die Konvertierung von HTML nach PDF

Das Script erweitert http://www.zopelabs.com/cookbook/1070039713 um einige Filter.

Voraussetzung ist eine laufende OpenOffice-Installation mit pyuno.
Das Script muss mit dem Python von OpenOffice aufgerufen werden.

Download: convert.py


import getopt,sys
import uno
from unohelper import Base,systemPathToFileUrl, absolutize 
from os import getcwd

from com.sun.star.beans import PropertyValue 
from com.sun.star.beans.PropertyState import DIRECT_VALUE 
from com.sun.star.uno import Exception as UnoException 
from com.sun.star.io import IOException,XInputStream, XOutputStream

class OutputStream( Base, XOutputStream ):
      def __init__( self ):
          self.closed = 0

      def closeOutput(self):
          self.closed = 1

      def writeBytes( self, seq ):
          sys.stdout.write( seq.value )

      def flush( self ):
          pass


def main():
    retVal = 0
    doc = None

    try:
        opts, args = getopt.getopt(sys.argv[1:], "hc:",["help",
        "connection-string=" , "html", "htmltopdf","pdf"]) 
        format = None
        url = "uno:socket,host=localhost,port=2002;urp;StarOffice.ComponentContext"
        filterName = "Text (Encoded)"
        for o, a in opts:
            if o in ("-h", "--help"):
                usage()
                sys.exit()
            if o in ("-c", "--connection-string" ):
                url = "uno:" + a + ";urp;StarOffice.ComponentContext"
            if o == "--html":
                filterName = "HTML (StarWriter)"
            if o == "--htmltopdf":
                filterName = "writer_web_pdf_export"
            if o == "--pdf":
                filterName = "writer_pdf_export"


        #print filterName
        if not len( args ):
              usage()
              sys.exit()

        ctxLocal = uno.getComponentContext()
        smgrLocal = ctxLocal.ServiceManager

        resolver = smgrLocal.createInstanceWithContext(
                 "com.sun.star.bridge.UnoUrlResolver", ctxLocal )
        ctx = resolver.resolve( url )
        smgr = ctx.ServiceManager

        desktop = smgr.createInstanceWithContext("com.sun.star.frame.Desktop", ctx )

        cwd = systemPathToFileUrl( getcwd() ) 
        outProps = (
            PropertyValue( "FilterName" , 0, filterName , 0 ),
            PropertyValue( "Overwrite" , 0, True , 0 ), PropertyValue(
            "OutputStream",0, OutputStream(),0))
        inProps = PropertyValue( "Hidden" , 0 , True, 0 ), 
        for path in args:
            try:
                fileUrl = uno.absolutize( cwd, systemPathToFileUrl(path) )
                doc = desktop.loadComponentFromURL( fileUrl , "_blank",
                0,inProps)

                if not doc:
                    raise UnoException( "Couldn't open stream for unknown reason", None )

                if filterName == "Text (Encoded)":
                    doc.storeToURL('%s.txt' % fileUrl,outProps)
                
                if filterName == "HTML (StarWriter)":
                    doc.storeToURL('%s.html' % fileUrl,outProps)

                if filterName == "writer_pdf_export":
                    doc.storeToURL('%s.pdf' % fileUrl,outProps)

                if filterName == "writer_web_pdf_export":
                    doc.storeToURL('%s.pdf' % fileUrl,outProps)

            except IOException, e:
                sys.stderr.write( "Error during conversion: " + e.Message + "\n" )                 
                retVal = 1
            except UnoException, e:
                sys.stderr.write( "Error ("+repr(e.__class__)+") during conversion:" + e.Message + "\n" )
                retVal = 1
            if doc:
                doc.dispose()

    except UnoException, e:
        sys.stderr.write( "Error ("+repr(e.__class__)+") :" + e.Message + "\n" ) 
        retVal = 1
    except getopt.GetoptError,e:
        sys.stderr.write( str(e) + "\n" )
        usage()
        retVal = 1

    sys.exit(retVal)

def usage():
    sys.stderr.write( "usage: convert.py --help |\n" +\
                "       [-c  |   --connection-string=\n"+ \
                "       file1 file2 ...\n"+ \
                "\n" + "Convert Winword-Doc \ OpenOffice-SXW.\ HTML to Plain Text \ HTML \ PDF \n" + \
                "Requires an OpenOffice.org instance to be running. The script and the\n"+ \
                "running OpenOffice.org instance must be able to access the file with\n"+ \
                "by the same system path.\n" "\n"+ \
                "-c  | --connection-string=\n" + \
                "The connection-string part of a uno url to where the\n" + \
                "the script should connect to in order to do the conversion.\n" + \
                "The strings defaults to socket,host=localhost,port=2002\n" \
                "--html \n" + \
                "Instead of the plain-text filter, the writer html filter is used\n" 
                "--pdf \n" + \
                "Instead of the plain-text filter, the writer pdf filter is used\n" 
                "--htmltopdf \n" + \
                "Instead of the plain-text filter, the writer_web pdf filter is used\n" )
                

main()

Geschrieben von vbachs . Letzte �nderung 21.12.2003 17:27.