| import libxml2mod |
| import types |
| import sys |
|
|
| |
| class libxmlError(Exception): pass |
|
|
| |
| def checkWrapper(obj): |
| try: |
| n = type(_obj).__name__ |
| if n != 'PyCObject' and n != 'PyCapsule': |
| return 1 |
| except: |
| return 0 |
| return 0 |
|
|
| |
| |
| |
| def pos_id(o): |
| i = id(o) |
| if (i < 0): |
| return (sys.maxsize - i) |
| return i |
|
|
| |
| |
| |
| class treeError(libxmlError): |
| def __init__(self, msg): |
| self.msg = msg |
| def __str__(self): |
| return self.msg |
|
|
| class parserError(libxmlError): |
| def __init__(self, msg): |
| self.msg = msg |
| def __str__(self): |
| return self.msg |
|
|
| class uriError(libxmlError): |
| def __init__(self, msg): |
| self.msg = msg |
| def __str__(self): |
| return self.msg |
|
|
| class xpathError(libxmlError): |
| def __init__(self, msg): |
| self.msg = msg |
| def __str__(self): |
| return self.msg |
|
|
| class ioWrapper: |
| def __init__(self, _obj): |
| self.__io = _obj |
| self._o = None |
|
|
| def io_close(self): |
| if self.__io == None: |
| return(-1) |
| self.__io.close() |
| self.__io = None |
| return(0) |
|
|
| def io_flush(self): |
| if self.__io == None: |
| return(-1) |
| self.__io.flush() |
| return(0) |
|
|
| def io_read(self, len = -1): |
| if self.__io == None: |
| return(-1) |
| try: |
| if len < 0: |
| ret = self.__io.read() |
| else: |
| ret = self.__io.read(len) |
| except Exception: |
| import sys |
| e = sys.exc_info()[1] |
| print("failed to read from Python:", type(e)) |
| print("on IO:", self.__io) |
| self.__io == None |
| return(-1) |
|
|
| return(ret) |
|
|
| def io_write(self, str, len = -1): |
| if self.__io == None: |
| return(-1) |
| if len < 0: |
| return(self.__io.write(str)) |
| return(self.__io.write(str, len)) |
|
|
| class ioReadWrapper(ioWrapper): |
| def __init__(self, _obj, enc = ""): |
| ioWrapper.__init__(self, _obj) |
| self._o = libxml2mod.xmlCreateInputBuffer(self, enc) |
|
|
| def __del__(self): |
| print("__del__") |
| self.io_close() |
| if self._o != None: |
| libxml2mod.xmlFreeParserInputBuffer(self._o) |
| self._o = None |
|
|
| def close(self): |
| self.io_close() |
| if self._o != None: |
| libxml2mod.xmlFreeParserInputBuffer(self._o) |
| self._o = None |
|
|
| class ioWriteWrapper(ioWrapper): |
| def __init__(self, _obj, enc = ""): |
| |
| if type(_obj) == type(''): |
| print("write io from a string") |
| self.o = None |
| elif type(_obj).__name__ == 'PyCapsule': |
| file = libxml2mod.outputBufferGetPythonFile(_obj) |
| if file != None: |
| ioWrapper.__init__(self, file) |
| else: |
| ioWrapper.__init__(self, _obj) |
| self._o = _obj |
| |
| |
| |
| |
| else: |
| file = libxml2mod.outputBufferGetPythonFile(_obj) |
| if file != None: |
| ioWrapper.__init__(self, file) |
| else: |
| ioWrapper.__init__(self, _obj) |
| self._o = _obj |
|
|
| def __del__(self): |
| |
| self.io_close() |
| if self._o != None: |
| libxml2mod.xmlOutputBufferClose(self._o) |
| self._o = None |
|
|
| def flush(self): |
| self.io_flush() |
| if self._o != None: |
| libxml2mod.xmlOutputBufferClose(self._o) |
| self._o = None |
|
|
| def close(self): |
| self.io_flush() |
| if self._o != None: |
| libxml2mod.xmlOutputBufferClose(self._o) |
| self._o = None |
|
|
| |
| |
| |
| class SAXCallback: |
| """Base class for SAX handlers""" |
| def startDocument(self): |
| """called at the start of the document""" |
| pass |
|
|
| def endDocument(self): |
| """called at the end of the document""" |
| pass |
|
|
| def startElement(self, tag, attrs): |
| """called at the start of every element, tag is the name of |
| the element, attrs is a dictionary of the element's attributes""" |
| pass |
|
|
| def endElement(self, tag): |
| """called at the start of every element, tag is the name of |
| the element""" |
| pass |
|
|
| def characters(self, data): |
| """called when character data have been read, data is the string |
| containing the data, multiple consecutive characters() callback |
| are possible.""" |
| pass |
|
|
| def cdataBlock(self, data): |
| """called when CDATA section have been read, data is the string |
| containing the data, multiple consecutive cdataBlock() callback |
| are possible.""" |
| pass |
|
|
| def reference(self, name): |
| """called when an entity reference has been found""" |
| pass |
|
|
| def ignorableWhitespace(self, data): |
| """called when potentially ignorable white spaces have been found""" |
| pass |
|
|
| def processingInstruction(self, target, data): |
| """called when a PI has been found, target contains the PI name and |
| data is the associated data in the PI""" |
| pass |
|
|
| def comment(self, content): |
| """called when a comment has been found, content contains the comment""" |
| pass |
|
|
| def externalSubset(self, name, externalID, systemID): |
| """called when a DOCTYPE declaration has been found, name is the |
| DTD name and externalID, systemID are the DTD public and system |
| identifier for that DTd if available""" |
| pass |
|
|
| def internalSubset(self, name, externalID, systemID): |
| """called when a DOCTYPE declaration has been found, name is the |
| DTD name and externalID, systemID are the DTD public and system |
| identifier for that DTD if available""" |
| pass |
|
|
| def entityDecl(self, name, type, externalID, systemID, content): |
| """called when an ENTITY declaration has been found, name is the |
| entity name and externalID, systemID are the entity public and |
| system identifier for that entity if available, type indicates |
| the entity type, and content reports it's string content""" |
| pass |
|
|
| def notationDecl(self, name, externalID, systemID): |
| """called when an NOTATION declaration has been found, name is the |
| notation name and externalID, systemID are the notation public and |
| system identifier for that notation if available""" |
| pass |
|
|
| def attributeDecl(self, elem, name, type, defi, defaultValue, nameList): |
| """called when an ATTRIBUTE definition has been found""" |
| pass |
|
|
| def elementDecl(self, name, type, content): |
| """called when an ELEMENT definition has been found""" |
| pass |
|
|
| def entityDecl(self, name, publicId, systemID, notationName): |
| """called when an unparsed ENTITY declaration has been found, |
| name is the entity name and publicId,, systemID are the entity |
| public and system identifier for that entity if available, |
| and notationName indicate the associated NOTATION""" |
| pass |
|
|
| def warning(self, msg): |
| |
| pass |
|
|
| def error(self, msg): |
| raise parserError(msg) |
|
|
| def fatalError(self, msg): |
| raise parserError(msg) |
|
|
| |
| |
| |
| |
| |
| |
| class xmlCore: |
| def __init__(self, _obj=None): |
| if _obj != None: |
| self._o = _obj; |
| return |
| self._o = None |
|
|
| def __eq__(self, other): |
| if other == None: |
| return False |
| ret = libxml2mod.compareNodesEqual(self._o, other._o) |
| if ret == None: |
| return False |
| return ret == True |
| def __ne__(self, other): |
| if other == None: |
| return True |
| ret = libxml2mod.compareNodesEqual(self._o, other._o) |
| return not ret |
| def __hash__(self): |
| ret = libxml2mod.nodeHash(self._o) |
| return ret |
|
|
| def __str__(self): |
| return self.serialize() |
| def get_parent(self): |
| ret = libxml2mod.parent(self._o) |
| if ret == None: |
| return None |
| return nodeWrap(ret) |
| def get_children(self): |
| ret = libxml2mod.children(self._o) |
| if ret == None: |
| return None |
| return nodeWrap(ret) |
| def get_last(self): |
| ret = libxml2mod.last(self._o) |
| if ret == None: |
| return None |
| return nodeWrap(ret) |
| def get_next(self): |
| ret = libxml2mod.next(self._o) |
| if ret == None: |
| return None |
| return nodeWrap(ret) |
| def get_properties(self): |
| ret = libxml2mod.properties(self._o) |
| if ret == None: |
| return None |
| return xmlAttr(_obj=ret) |
| def get_prev(self): |
| ret = libxml2mod.prev(self._o) |
| if ret == None: |
| return None |
| return nodeWrap(ret) |
| def get_content(self): |
| return libxml2mod.xmlNodeGetContent(self._o) |
| getContent = get_content |
| def get_name(self): |
| return libxml2mod.name(self._o) |
| def get_type(self): |
| return libxml2mod.type(self._o) |
| def get_doc(self): |
| ret = libxml2mod.doc(self._o) |
| if ret == None: |
| if self.type in ["document_xml", "document_html"]: |
| return xmlDoc(_obj=self._o) |
| else: |
| return None |
| return xmlDoc(_obj=ret) |
| |
| |
| |
| |
| import sys |
| if float(sys.version[0:3]) < 2.2: |
| def __getattr__(self, attr): |
| if attr == "parent": |
| ret = libxml2mod.parent(self._o) |
| if ret == None: |
| return None |
| return nodeWrap(ret) |
| elif attr == "properties": |
| ret = libxml2mod.properties(self._o) |
| if ret == None: |
| return None |
| return xmlAttr(_obj=ret) |
| elif attr == "children": |
| ret = libxml2mod.children(self._o) |
| if ret == None: |
| return None |
| return nodeWrap(ret) |
| elif attr == "last": |
| ret = libxml2mod.last(self._o) |
| if ret == None: |
| return None |
| return nodeWrap(ret) |
| elif attr == "next": |
| ret = libxml2mod.next(self._o) |
| if ret == None: |
| return None |
| return nodeWrap(ret) |
| elif attr == "prev": |
| ret = libxml2mod.prev(self._o) |
| if ret == None: |
| return None |
| return nodeWrap(ret) |
| elif attr == "content": |
| return libxml2mod.xmlNodeGetContent(self._o) |
| elif attr == "name": |
| return libxml2mod.name(self._o) |
| elif attr == "type": |
| return libxml2mod.type(self._o) |
| elif attr == "doc": |
| ret = libxml2mod.doc(self._o) |
| if ret == None: |
| if self.type == "document_xml" or self.type == "document_html": |
| return xmlDoc(_obj=self._o) |
| else: |
| return None |
| return xmlDoc(_obj=ret) |
| raise AttributeError(attr) |
| else: |
| parent = property(get_parent, None, None, "Parent node") |
| children = property(get_children, None, None, "First child node") |
| last = property(get_last, None, None, "Last sibling node") |
| next = property(get_next, None, None, "Next sibling node") |
| prev = property(get_prev, None, None, "Previous sibling node") |
| properties = property(get_properties, None, None, "List of properties") |
| content = property(get_content, None, None, "Content of this node") |
| name = property(get_name, None, None, "Node name") |
| type = property(get_type, None, None, "Node type") |
| doc = property(get_doc, None, None, "The document this node belongs to") |
|
|
| |
| |
| |
| |
| |
| |
| def serialize(self, encoding = None, format = 0): |
| return libxml2mod.serializeNode(self._o, encoding, format) |
| def saveTo(self, file, encoding = None, format = 0): |
| return libxml2mod.saveNodeTo(self._o, file, encoding, format) |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| def c14nMemory(self, |
| nodes=None, |
| exclusive=0, |
| prefixes=None, |
| with_comments=0): |
| if nodes: |
| nodes = [n._o for n in nodes] |
| return libxml2mod.xmlC14NDocDumpMemory( |
| self.get_doc()._o, |
| nodes, |
| exclusive != 0, |
| prefixes, |
| with_comments != 0) |
| def c14nSaveTo(self, |
| file, |
| nodes=None, |
| exclusive=0, |
| prefixes=None, |
| with_comments=0): |
| if nodes: |
| nodes = [n._o for n in nodes] |
| return libxml2mod.xmlC14NDocSaveTo( |
| self.get_doc()._o, |
| nodes, |
| exclusive != 0, |
| prefixes, |
| with_comments != 0, |
| file) |
|
|
| |
| |
| |
| |
| def xpathEval(self, expr): |
| doc = self.doc |
| if doc == None: |
| return None |
| ctxt = doc.xpathNewContext() |
| ctxt.setContextNode(self) |
| res = ctxt.xpathEval(expr) |
| ctxt.xpathFreeContext() |
| return res |
|
|
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| def xpathEval2(self, expr): |
| return self.xpathEval(expr) |
|
|
| |
| def removeNsDef(self, href): |
| """ |
| Remove a namespace definition from a node. If href is None, |
| remove all of the ns definitions on that node. The removed |
| namespaces are returned as a linked list. |
| |
| Note: If any child nodes referred to the removed namespaces, |
| they will be left with dangling links. You should call |
| renconciliateNs() to fix those pointers. |
| |
| Note: This method does not free memory taken by the ns |
| definitions. You will need to free it manually with the |
| freeNsList() method on the returns xmlNs object. |
| """ |
|
|
| ret = libxml2mod.xmlNodeRemoveNsDef(self._o, href) |
| if ret is None:return None |
| __tmp = xmlNs(_obj=ret) |
| return __tmp |
|
|
| |
| def walk_depth_first(self): |
| return xmlCoreDepthFirstItertor(self) |
| def walk_breadth_first(self): |
| return xmlCoreBreadthFirstItertor(self) |
| __iter__ = walk_depth_first |
|
|
| def free(self): |
| try: |
| self.doc._ctxt.xpathFreeContext() |
| except: |
| pass |
| libxml2mod.xmlFreeDoc(self._o) |
|
|
|
|
| |
| |
| |
| class xmlCoreDepthFirstItertor: |
| def __init__(self, node): |
| self.node = node |
| self.parents = [] |
| def __iter__(self): |
| return self |
| def __next__(self): |
| while 1: |
| if self.node: |
| ret = self.node |
| self.parents.append(self.node) |
| self.node = self.node.children |
| return ret |
| try: |
| parent = self.parents.pop() |
| except IndexError: |
| raise StopIteration |
| self.node = parent.next |
| next = __next__ |
|
|
| |
| |
| |
| class xmlCoreBreadthFirstItertor: |
| def __init__(self, node): |
| self.node = node |
| self.parents = [] |
| def __iter__(self): |
| return self |
| def __next__(self): |
| while 1: |
| if self.node: |
| ret = self.node |
| self.parents.append(self.node) |
| self.node = self.node.next |
| return ret |
| try: |
| parent = self.parents.pop() |
| except IndexError: |
| raise StopIteration |
| self.node = parent.children |
| next = __next__ |
|
|
| |
| |
| |
| def nodeWrap(o): |
| |
| name = libxml2mod.type(o) |
| if name == "element" or name == "text": |
| return xmlNode(_obj=o) |
| if name == "attribute": |
| return xmlAttr(_obj=o) |
| if name[0:8] == "document": |
| return xmlDoc(_obj=o) |
| if name == "namespace": |
| return xmlNs(_obj=o) |
| if name == "elem_decl": |
| return xmlElement(_obj=o) |
| if name == "attribute_decl": |
| return xmlAttribute(_obj=o) |
| if name == "entity_decl": |
| return xmlEntity(_obj=o) |
| if name == "dtd": |
| return xmlDtd(_obj=o) |
| return xmlNode(_obj=o) |
|
|
| def xpathObjectRet(o): |
| otype = type(o) |
| if otype == type([]): |
| ret = list(map(xpathObjectRet, o)) |
| return ret |
| elif otype == type(()): |
| ret = list(map(xpathObjectRet, o)) |
| return tuple(ret) |
| elif otype == type('') or otype == type(0) or otype == type(0.0): |
| return o |
| else: |
| return nodeWrap(o) |
|
|
| |
| |
| |
| def registerXPathFunction(ctxt, name, ns_uri, f): |
| ret = libxml2mod.xmlRegisterXPathFunction(ctxt, name, ns_uri, f) |
|
|
| |
| |
| |
| PARSER_LOADDTD=1 |
| PARSER_DEFAULTATTRS=2 |
| PARSER_VALIDATE=3 |
| PARSER_SUBST_ENTITIES=4 |
|
|
| |
| |
| |
| PARSER_SEVERITY_VALIDITY_WARNING=1 |
| PARSER_SEVERITY_VALIDITY_ERROR=2 |
| PARSER_SEVERITY_WARNING=3 |
| PARSER_SEVERITY_ERROR=4 |
|
|
| |
| |
| |
| def registerErrorHandler(f, ctx): |
| """Register a Python written function to for error reporting. |
| The function is called back as f(ctx, error). """ |
| import sys |
| if 'libxslt' not in sys.modules: |
| |
| ret = libxml2mod.xmlRegisterErrorHandler(f,ctx) |
| else: |
| |
| |
| import libxslt |
| ret = libxslt.registerErrorHandler(f,ctx) |
| return ret |
|
|
| class parserCtxtCore: |
|
|
| def __init__(self, _obj=None): |
| if _obj != None: |
| self._o = _obj; |
| return |
| self._o = None |
|
|
| def __del__(self): |
| if self._o != None: |
| libxml2mod.xmlFreeParserCtxt(self._o) |
| self._o = None |
|
|
| def setErrorHandler(self,f,arg): |
| """Register an error handler that will be called back as |
| f(arg,msg,severity,reserved). |
| |
| @reserved is currently always None.""" |
| libxml2mod.xmlParserCtxtSetErrorHandler(self._o,f,arg) |
|
|
| def getErrorHandler(self): |
| """Return (f,arg) as previously registered with setErrorHandler |
| or (None,None).""" |
| return libxml2mod.xmlParserCtxtGetErrorHandler(self._o) |
|
|
| def addLocalCatalog(self, uri): |
| """Register a local catalog with the parser""" |
| return libxml2mod.addLocalCatalog(self._o, uri) |
| |
|
|
| class ValidCtxtCore: |
|
|
| def __init__(self, *args, **kw): |
| pass |
|
|
| def setValidityErrorHandler(self, err_func, warn_func, arg=None): |
| """ |
| Register error and warning handlers for DTD validation. |
| These will be called back as f(msg,arg) |
| """ |
| libxml2mod.xmlSetValidErrors(self._o, err_func, warn_func, arg) |
| |
|
|
| class SchemaValidCtxtCore: |
|
|
| def __init__(self, *args, **kw): |
| pass |
|
|
| def setValidityErrorHandler(self, err_func, warn_func, arg=None): |
| """ |
| Register error and warning handlers for Schema validation. |
| These will be called back as f(msg,arg) |
| """ |
| libxml2mod.xmlSchemaSetValidErrors(self._o, err_func, warn_func, arg) |
|
|
|
|
| class relaxNgValidCtxtCore: |
|
|
| def __init__(self, *args, **kw): |
| pass |
|
|
| def setValidityErrorHandler(self, err_func, warn_func, arg=None): |
| """ |
| Register error and warning handlers for RelaxNG validation. |
| These will be called back as f(msg,arg) |
| """ |
| libxml2mod.xmlRelaxNGSetValidErrors(self._o, err_func, warn_func, arg) |
|
|
| |
| def _xmlTextReaderErrorFunc(xxx_todo_changeme,msg,severity,locator): |
| """Intermediate callback to wrap the locator""" |
| (f,arg) = xxx_todo_changeme |
| return f(arg,msg,severity,xmlTextReaderLocator(locator)) |
|
|
| class xmlTextReaderCore: |
|
|
| def __init__(self, _obj=None): |
| self.input = None |
| if _obj != None:self._o = _obj;return |
| self._o = None |
|
|
| def __del__(self): |
| if self._o != None: |
| libxml2mod.xmlFreeTextReader(self._o) |
| self._o = None |
|
|
| def SetErrorHandler(self,f,arg): |
| """Register an error handler that will be called back as |
| f(arg,msg,severity,locator).""" |
| if f is None: |
| libxml2mod.xmlTextReaderSetErrorHandler(\ |
| self._o,None,None) |
| else: |
| libxml2mod.xmlTextReaderSetErrorHandler(\ |
| self._o,_xmlTextReaderErrorFunc,(f,arg)) |
|
|
| def GetErrorHandler(self): |
| """Return (f,arg) as previously registered with setErrorHandler |
| or (None,None).""" |
| f,arg = libxml2mod.xmlTextReaderGetErrorHandler(self._o) |
| if f is None: |
| return None,None |
| else: |
| |
| return arg |
|
|
| |
| |
| |
| def cleanupParser(): |
| libxml2mod.xmlPythonCleanupParser() |
|
|
| |
| |
| |
| |
| |
| |
| __input_callbacks = [] |
| def registerInputCallback(func): |
| def findOpenCallback(URI): |
| for cb in reversed(__input_callbacks): |
| o = cb(URI) |
| if o is not None: |
| return o |
| libxml2mod.xmlRegisterInputCallback(findOpenCallback) |
| __input_callbacks.append(func) |
|
|
| def popInputCallbacks(): |
| |
| |
| if len(__input_callbacks) > 0: |
| __input_callbacks.pop() |
| if len(__input_callbacks) == 0: |
| libxml2mod.xmlUnregisterInputCallback() |
|
|
| |
| |
| |
| def dumpMemory(): |
| """DEPRECATED: This feature was removed.""" |
|
|
| |
| |
| |
| |
| |
| |
|
|
|
|