"""
$RCSfile: PyanaProcessor.py,v $

This class encapsulates an XSLT Processor for use by ZopeXMLMethods.
This is the Pyana version, including support for XSLT
parameters.  It does not yet include support for URN resolution.

Author: <a href="mailto:cstrong@arielpartners.com">Craeg Strong</a>
Release: 1.0
"""

# RCS/CVS keyword strings.  Each slice drops the leading '$Keyword:' and
# the trailing ' $' of the keyword, keeping what lies between them.
__cvstag__  = '$Name:  $'[6:-2]
__date__    = '$Date: 2003/06/16 05:47:53 $'[6:-2]
__version__ = '$Revision: 1.3 $'[10:-2]

# Pyana
import Pyana

# Zope
from Acquisition import aq_get
from zope.interface import implements
# python
import os.path, sys, urllib

# local peer classes
from interfaces import IXSLTProcessor

################################################################
# Defaults
################################################################

# Name of the property, acquired from the transform object, that lists
# the URN namespace IDs (read by PyanaProcessor.retrieveNamespaces).
namespacesPropertyName        = 'URNnamespaces'
# Presumably the name of the property holding XSLT parameters; it is not
# referenced by the code visible in this module -- TODO confirm callers.
parametersPropertyName        = 'XSLparameters'

################################################################
# PyanaProcessor class
################################################################

class PyanaProcessor:
    """
    This class encapsulates an XSLT Processor for use by
    ZopeXMLMethods.  This is the Pyana version, including support for
    XSLT parameters.  transform() installs a URIResolver as the entity
    resolver, using the namespaces acquired from the transform object.
    """

    implements(IXSLTProcessor)
    name           = 'Pyana 0.6'

    def __init__(self):
        "Initialize a new instance of PyanaProcessor"
        self.debugLevel = 0

        # NOTE: both assignments below set attributes on the Pyana
        # module itself, so they are shared by every user of Pyana in
        # this process, not just this instance.

        # This global variable determines which ProblemListener is used by
        # Pyana to report errors and messages during XSLT transformation
        Pyana.defaultProblemListenerFactory = ProblemListener

        # This global variable determines which ErrorHandler is used by
        # Pyana to report errors during XML parsing
        Pyana.defaultErrorHandlerFactory = ErrorHandler

    ################################################################
    # Methods implementing the IProcessor interface
    ################################################################

    def setDebugLevel(self, level):
        """

        Set debug level from 0 to 3.
        0 = silent
        3 = extra verbose
        Debug messages are written with print (standard output).

        """
        self.debugLevel   = level

    ################################################################
    # Methods implementing the IXSLTProcessor interface
    ################################################################

    def transform(self, xmlContents, xmlURL, xsltContents, xsltURL,
                  transformObject = None, params = None, REQUEST = None):
        """

        Transforms the passed in XML into the required output (usually
        HTML) using the passed in XSLT.  Both the XML and XSLT strings
        should be well-formed.  Returns the output as a string.

        xmlContents, xsltContents -- the documents themselves; unicode
            input is encoded to UTF-8 before it is handed to Pyana.
        xmlURL, xsltURL -- accepted for interface compatibility; this
            implementation does not use them.
        transformObject -- optional Zope object from which the URN
            namespaces are acquired.
        params -- optional mapping of XSLT parameter names to values;
            None (the default) means no parameters.
        REQUEST -- passed on to the URIResolver, which uses it when it
            renders Zope objects.

        This method does not catch anything itself.  The
        ProblemListener and ErrorHandler hooks installed by __init__
        raise plain Exceptions, which presumably propagate out of
        Pyana's transform2String call to the caller.

        """
        if params is None:
            params = {}

        # Each debug print takes a single pre-formatted argument, so the
        # parenthesised form prints exactly what a print statement would.
        if self.debugLevel > 1:
            print("params: %s" % (params,))
            print("xsltContents:")
            print(xsltContents)
            print("xmlContents:")
            print(xmlContents)

        # Pyana does not work with unicode; rather it requires an encoding.
        # Unfortunately, ParsedXML gives us unicode.  We coerce it to UTF-8
        # The only place we get this today AFAIK is ParsedXML
        # @@ FIXME we need a better way... CKS 3/2/2003
        if isinstance(xmlContents, type(u'')):
            xmlContents = xmlContents.encode('utf8')
        if isinstance(xsltContents, type(u'')):
            xsltContents = xsltContents.encode('utf8')

        # Convert the parameters to the form expected by this processor
        xsltParams = {}
        for key, value in params.items():
            self.addParam(xsltParams, key, value)

        namespaceMap   = {}
        if transformObject is not None:
            namespaceMap   = self.retrieveNamespaces(transformObject)
        if self.debugLevel > 1:
            print("namespaces: %s" % (namespaceMap,))

        t = Pyana.Transformer()
        t.useValidation = 0
        t.setStylesheetParams(xsltParams)
        t.setEntityResolver(URIResolver(namespaceMap, REQUEST))
        result =  t.transform2String(source = xmlContents,
                                     style  = xsltContents)
        return result

    def addParam(self, paramMap, name, value):
        """

        This is a convenience function for adding parameters in the
        correct format to the parameter map that transform() passes to
        Pyana's setStylesheetParams.

        The value is stored as a quoted XPath string literal.  Returns
        paramMap, which is also modified in place.

        """
        paramMap[ name ] = self._xpathLiteral(value)
        return paramMap

    def _xpathLiteral(self, value):
        "Render value as an XPath 1.0 string literal (or concat() call)"
        # The one-element tuple keeps a tuple value from being unpacked
        # as several format arguments.
        text = '%s' % (value,)
        # XPath 1.0 literals have no escape mechanism, so pick the
        # delimiter the text does not contain ...
        if "'" not in text:
            return "'%s'" % (text,)
        if '"' not in text:
            return '"%s"' % (text,)
        # ... and when it contains both, split on the single quotes and
        # glue the pieces back together with concat().
        pieces = ["'%s'" % (piece,) for piece in text.split("'")]
        return 'concat(%s)' % (', "\'", '.join(pieces),)

    ################################################################
    # Utility methods
    ################################################################

    def retrieveNamespaces(self, transformObject):
        """

        Retrieves the namespaces defined for URI resolution.

        Reads the list of namespace IDs from the property named by
        namespacesPropertyName and acquires the object of each ID from
        transformObject.  Returns a dictionary mapping each namespace
        ID to either a callable (taken to be a Zope object) or a
        string.  IDs that cannot be acquired are left out.

        """
        result = {}
        NIDs   = aq_get(transformObject,namespacesPropertyName,None)
        if NIDs is None:
            return result
        for n in NIDs:
            value = aq_get(transformObject,n,None)
            if value is None:
                # Nothing to map to.  Storing str(None) here would make
                # the resolver try to open the URL 'None/<nss>'.
                continue
            # I use callable() to determine if it is not a scalar.
            # If not, it must be a Zope object (I think) - WGM
            if callable(value):
                result[n] = value
            else:
                result[n] = str(value)
        return result

################################################################
# Pyana API Hooks
################################################################

class ProblemListener:
    """

    This class replaces the default class used by Pyana to report
    errors and XSLT messages that occur during the XSLT transformation
    process.

    """

    def problem(
        self, where, classification,
        sourceNode, styleNode,
        msg, uri, line, offset):
        """

        The default error handler for Pyana prints out
        messages to stderr.  Throw an exception instead.

        Builds a message from the classification (error, warning or
        message), the problem text and, when available, the location,
        and always raises it as an Exception.  where, sourceNode and
        styleNode are not used.

        """
        typeMap = {
            Pyana.eERROR:   'Error: ',
            Pyana.eWARNING: 'Warning: ',
            Pyana.eMESSAGE: 'Message: ' }

        # An unrecognized classification gets no prefix, so the problem
        # text is still reported instead of being lost to a KeyError.
        message = typeMap.get(classification, '') + msg

        # -1 means "not known" for line and offset.
        if line != -1 or offset != -1:
            message = message + \
                      ' [systemID: "%s" (line: %s, column: %s)]' % \
                      (uri, line, offset)
        elif uri:
            message = message + ' [systemID: "%s"]'% (uri,)

        raise Exception(message)

class ErrorHandler:
    """

    This class replaces the default class used by Pyana to report
    errors that occur during the parsing of XML files.

    Warnings and errors are printed; fatal errors are raised as
    Exceptions.

    """

    def common(self, name, e):
        """

        Format the parser exception e as '<name>: <message>', followed
        by the system ID, line and column when any of them is set.

        """
        message = '%s: %s' % (name, e.message)
        if e.systemID or e.lineNumber or e.columnNumber:
            # Leading space keeps the location apart from the message
            # text, matching the format used by ProblemListener.
            message = message + \
                      ' [systemID: "%s" (line: %s, column: %s)]' % \
                      (e.systemID, e.lineNumber, e.columnNumber)
        return message

    def warning(self, e):
        "Print the warning; parsing continues"
        # From Pyana-0.6/Test/TestEntityResolver.py line 85...
        #
        # A request is  made to open the NULL string
        # because Xerces is attempting to load the
        # XML file's schema. Whether that is a bug
        # or not is still up in the air. testXSLT
        # has the same problem.
        #
        # When this happens, a warning is generated.  It looks like this:
        #
        # Warning: An exception occurred! Type:RuntimeException, Message:Warning: The primary document entity could not be opened. Id=
        #
        print(self.common('Warning', e))

    def error(self, e):
        "Print the error; no exception is raised"
        print(self.common('Error', e))

    def fatalError(self, e):
        "Raise an Exception carrying the formatted message"
        raise Exception(self.common('FatalError', e))

    def resetErrors(self):
        "Nothing to reset; this handler keeps no state"
        pass

class URIResolver:
    """

    Entity resolver that maps system IDs of the form 'urn:<nid>:<nss>'
    either to another URL or to the contents of a Zope object,
    depending on what the namespace map holds for <nid>.

    """

    def __init__(self, namespaceMap, REQUEST):
        """
        Remember the URN namespaces corresponding to Zope folders and
        the REQUEST context with which we want to load the resources

        """
        self.namespaceMap = namespaceMap
        self.req          = REQUEST

    def acquireObjectContents(self, base, contextURL, REQUEST):
        """

        Obtain the contents of the Zope object indicated by the passed
        in context, starting from the passed in base object.

        contextURL is a '/'-separated path; each component is acquired
        from the object found for the previous one.  Returns None as
        soon as a component cannot be acquired, otherwise the result of
        calling the final object with itself and REQUEST.

        """
        zObject     = base
        #
        # why doesn't the below work?  Is this a bug?
        # (see com/arielpartners/website/scripts/resolver.dtml)
        # zObject = base.restrictedTraverse(contextURL)

        # sigh.   Do it the hard way.
        for context in contextURL.split('/'):
            zObject = aq_get(zObject,context,None)
            if zObject is None:
                return None
        return zObject(zObject, REQUEST)

    def resolveEntity(self, public, sysid):
        """

        Resolve the URN to a Zope object, or pass on the request.

        Returns None ("revert to normal behavior") when sysid is not a
        recognized URN, when its namespace ID is not in the namespace
        map, or when the Zope object cannot be acquired.

        """
        if not self.isRecognizedURN(sysid):
            # revert to normal behavior
            return None

        uri      = sysid[sysid.find('urn:'):]
        uriParts = uri.split(':')
        nid      = uriParts[1] # namespace ID
        nss      = uriParts[2] # namespace specific string
        base     = self.namespaceMap.get(nid, None)
        if base is None:
            # revert to normal behavior
            return None

        if isinstance(base, str):
            # We are mapping one URL to another a la XMLCatalog RewriteURI
            #
            # urlparse.urljoin would replace the last component of the
            # base when it has no trailing slash, e.g.
            #
            # urljoin ("http://www.foo.com/bar", "mumble.xml") ==> http://www.foo.com/mumble.xml
            # posixpath.join ("http://www.foo.com/bar", "mumble.xml") ==> http://www.foo.com/bar/mumble.xml
            #
            # posixpath rather than os.path, so that the separator is
            # '/' on every platform.
            import posixpath
            resolvedURL = posixpath.join(base, nss)
            stream = urllib.urlopen(resolvedURL)
            try:
                # NOTE(review): this branch returns the raw body while
                # the Zope branch below returns a StringInputStream --
                # confirm that Pyana accepts both.
                return stream.read()
            finally:
                stream.close()

        # its a Zope object, we must retrieve its contents
        st = self.acquireObjectContents(base, nss, self.req)
        if st is None:
            # failure, cannot grab object, revert to normal behavior
            return None
        # load the resource from the Zope object
        return StringInputStream(st)

    def isRecognizedURN(self, uri):
        """

        Return true if this uri is of a format we recognize: it
        contains 'urn:' and, from there on, consists of exactly three
        ':'-separated parts.  An empty or None uri is not recognized.

        """
        if not uri:
            return 0 # false
        start = uri.find('urn:')
        if start == -1:
            return 0 # false
        uriParts = uri[start:].split(':')
        return uriParts[0] == 'urn' and len(uriParts) == 3
            
class StringInputStream:
    """

    Input source handed back by URIResolver.resolveEntity: wraps a
    string and hands it out as a stream through makeStream().

    """

    def __init__(self, string):
        """

        Remember the string.  Unicode text is encoded to UTF-8; a byte
        string is kept untouched.

        """
        # Calling encode() on a byte string would first decode it as
        # ASCII under Python 2 and fail on any non-ASCII byte.
        if isinstance(string, type(u'')):
            string = string.encode('utf-8')
        self.string = string

    def makeStream(self):
        "Return a new stream positioned at the start of the string"
        # The returned stream can be any object with
        # a read(size) method. So open(...), urllib.open(...),
        # etc. will all generate valid streams. In this case,
        # we will use StringIO to present a string as a
        # stream.
        from StringIO import StringIO
        return StringIO(self.string)

################################################################
# Register ourselves with the Processor Registry
################################################################

from ProcessorRegistry import ProcessorRegistry
# Registration is best effort: if the processor cannot be created or
# registered, say so and carry on.
klass = PyanaProcessor
try:
    proc = klass()
    ProcessorRegistry.register(proc)
    #print "Registered processor", klass.name, "for use with ZopeXMLMethods"
except (KeyboardInterrupt, SystemExit):
    # Never swallow a shutdown request.
    raise
except Exception:
    print("Processor %s not available for use with ZopeXMLMethods" % (klass.name,))