mirror of
				https://github.com/python/cpython.git
				synced 2025-11-03 03:22:27 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			1984 lines
		
	
	
	
		
			60 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			1984 lines
		
	
	
	
		
			60 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
#include "Python.h"
 | 
						|
#include <ctype.h>
 | 
						|
 | 
						|
#include "frameobject.h"
 | 
						|
#include "expat.h"
 | 
						|
 | 
						|
#include "pyexpat.h"
 | 
						|
 | 
						|
/* Do not emit Clinic output to a file as that wreaks havoc with conditionally
 | 
						|
   included methods. */
 | 
						|
/*[clinic input]
 | 
						|
module pyexpat
 | 
						|
[clinic start generated code]*/
 | 
						|
/*[clinic end generated code: output=da39a3ee5e6b4b0d input=b168d503a4490c15]*/
 | 
						|
 | 
						|
#define XML_COMBINED_VERSION (10000*XML_MAJOR_VERSION+100*XML_MINOR_VERSION+XML_MICRO_VERSION)
 | 
						|
 | 
						|
static XML_Memory_Handling_Suite ExpatMemoryHandler = {
 | 
						|
    PyObject_Malloc, PyObject_Realloc, PyObject_Free};
 | 
						|
 | 
						|
enum HandlerTypes {
 | 
						|
    StartElement,
 | 
						|
    EndElement,
 | 
						|
    ProcessingInstruction,
 | 
						|
    CharacterData,
 | 
						|
    UnparsedEntityDecl,
 | 
						|
    NotationDecl,
 | 
						|
    StartNamespaceDecl,
 | 
						|
    EndNamespaceDecl,
 | 
						|
    Comment,
 | 
						|
    StartCdataSection,
 | 
						|
    EndCdataSection,
 | 
						|
    Default,
 | 
						|
    DefaultHandlerExpand,
 | 
						|
    NotStandalone,
 | 
						|
    ExternalEntityRef,
 | 
						|
    StartDoctypeDecl,
 | 
						|
    EndDoctypeDecl,
 | 
						|
    EntityDecl,
 | 
						|
    XmlDecl,
 | 
						|
    ElementDecl,
 | 
						|
    AttlistDecl,
 | 
						|
#if XML_COMBINED_VERSION >= 19504
 | 
						|
    SkippedEntity,
 | 
						|
#endif
 | 
						|
    _DummyDecl
 | 
						|
};
 | 
						|
 | 
						|
static PyObject *ErrorObject;
 | 
						|
 | 
						|
/* ----------------------------------------------------- */
 | 
						|
 | 
						|
/* Declarations for objects of type xmlparser */
 | 
						|
 | 
						|
typedef struct {
 | 
						|
    PyObject_HEAD
 | 
						|
 | 
						|
    XML_Parser itself;
 | 
						|
    int ordered_attributes;     /* Return attributes as a list. */
 | 
						|
    int specified_attributes;   /* Report only specified attributes. */
 | 
						|
    int in_callback;            /* Is a callback active? */
 | 
						|
    int ns_prefixes;            /* Namespace-triplets mode? */
 | 
						|
    XML_Char *buffer;           /* Buffer used when accumulating characters */
 | 
						|
                                /* NULL if not enabled */
 | 
						|
    int buffer_size;            /* Size of buffer, in XML_Char units */
 | 
						|
    int buffer_used;            /* Buffer units in use */
 | 
						|
    PyObject *intern;           /* Dictionary to intern strings */
 | 
						|
    PyObject **handlers;
 | 
						|
} xmlparseobject;
 | 
						|
 | 
						|
#include "clinic/pyexpat.c.h"
 | 
						|
 | 
						|
#define CHARACTER_DATA_BUFFER_SIZE 8192
 | 
						|
 | 
						|
static PyTypeObject Xmlparsetype;
 | 
						|
 | 
						|
typedef void (*xmlhandlersetter)(XML_Parser self, void *meth);
 | 
						|
typedef void* xmlhandler;
 | 
						|
 | 
						|
struct HandlerInfo {
 | 
						|
    const char *name;
 | 
						|
    xmlhandlersetter setter;
 | 
						|
    xmlhandler handler;
 | 
						|
    PyCodeObject *tb_code;
 | 
						|
    PyObject *nameobj;
 | 
						|
};
 | 
						|
 | 
						|
static struct HandlerInfo handler_info[64];
 | 
						|
 | 
						|
/* Set an integer attribute on the error object; return true on success,
 | 
						|
 * false on an exception.
 | 
						|
 */
 | 
						|
static int
 | 
						|
set_error_attr(PyObject *err, char *name, int value)
 | 
						|
{
 | 
						|
    PyObject *v = PyLong_FromLong(value);
 | 
						|
 | 
						|
    if (v == NULL || PyObject_SetAttrString(err, name, v) == -1) {
 | 
						|
        Py_XDECREF(v);
 | 
						|
        return 0;
 | 
						|
    }
 | 
						|
    Py_DECREF(v);
 | 
						|
    return 1;
 | 
						|
}
 | 
						|
 | 
						|
/* Build and set an Expat exception, including positioning
 | 
						|
 * information.  Always returns NULL.
 | 
						|
 */
 | 
						|
static PyObject *
 | 
						|
set_error(xmlparseobject *self, enum XML_Error code)
 | 
						|
{
 | 
						|
    PyObject *err;
 | 
						|
    PyObject *buffer;
 | 
						|
    XML_Parser parser = self->itself;
 | 
						|
    int lineno = XML_GetErrorLineNumber(parser);
 | 
						|
    int column = XML_GetErrorColumnNumber(parser);
 | 
						|
 | 
						|
    buffer = PyUnicode_FromFormat("%s: line %i, column %i",
 | 
						|
                                  XML_ErrorString(code), lineno, column);
 | 
						|
    if (buffer == NULL)
 | 
						|
        return NULL;
 | 
						|
    err = PyObject_CallFunction(ErrorObject, "O", buffer);
 | 
						|
    Py_DECREF(buffer);
 | 
						|
    if (  err != NULL
 | 
						|
          && set_error_attr(err, "code", code)
 | 
						|
          && set_error_attr(err, "offset", column)
 | 
						|
          && set_error_attr(err, "lineno", lineno)) {
 | 
						|
        PyErr_SetObject(ErrorObject, err);
 | 
						|
    }
 | 
						|
    Py_XDECREF(err);
 | 
						|
    return NULL;
 | 
						|
}
 | 
						|
 | 
						|
static int
 | 
						|
have_handler(xmlparseobject *self, int type)
 | 
						|
{
 | 
						|
    PyObject *handler = self->handlers[type];
 | 
						|
    return handler != NULL;
 | 
						|
}
 | 
						|
 | 
						|
static PyObject *
 | 
						|
get_handler_name(struct HandlerInfo *hinfo)
 | 
						|
{
 | 
						|
    PyObject *name = hinfo->nameobj;
 | 
						|
    if (name == NULL) {
 | 
						|
        name = PyUnicode_FromString(hinfo->name);
 | 
						|
        hinfo->nameobj = name;
 | 
						|
    }
 | 
						|
    Py_XINCREF(name);
 | 
						|
    return name;
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
/* Convert a string of XML_Chars into a Unicode string.
 | 
						|
   Returns None if str is a null pointer. */
 | 
						|
 | 
						|
static PyObject *
 | 
						|
conv_string_to_unicode(const XML_Char *str)
 | 
						|
{
 | 
						|
    /* XXX currently this code assumes that XML_Char is 8-bit,
 | 
						|
       and hence in UTF-8.  */
 | 
						|
    /* UTF-8 from Expat, Unicode desired */
 | 
						|
    if (str == NULL) {
 | 
						|
        Py_INCREF(Py_None);
 | 
						|
        return Py_None;
 | 
						|
    }
 | 
						|
    return PyUnicode_DecodeUTF8(str, strlen(str), "strict");
 | 
						|
}
 | 
						|
 | 
						|
static PyObject *
 | 
						|
conv_string_len_to_unicode(const XML_Char *str, int len)
 | 
						|
{
 | 
						|
    /* XXX currently this code assumes that XML_Char is 8-bit,
 | 
						|
       and hence in UTF-8.  */
 | 
						|
    /* UTF-8 from Expat, Unicode desired */
 | 
						|
    if (str == NULL) {
 | 
						|
        Py_INCREF(Py_None);
 | 
						|
        return Py_None;
 | 
						|
    }
 | 
						|
    return PyUnicode_DecodeUTF8((const char *)str, len, "strict");
 | 
						|
}
 | 
						|
 | 
						|
/* Callback routines */
 | 
						|
 | 
						|
static void clear_handlers(xmlparseobject *self, int initial);
 | 
						|
 | 
						|
/* This handler is used when an error has been detected, in the hope
 | 
						|
   that actual parsing can be terminated early.  This will only help
 | 
						|
   if an external entity reference is encountered. */
 | 
						|
static int
 | 
						|
error_external_entity_ref_handler(XML_Parser parser,
 | 
						|
                                  const XML_Char *context,
 | 
						|
                                  const XML_Char *base,
 | 
						|
                                  const XML_Char *systemId,
 | 
						|
                                  const XML_Char *publicId)
 | 
						|
{
 | 
						|
    return 0;
 | 
						|
}
 | 
						|
 | 
						|
/* Dummy character data handler used when an error (exception) has
 | 
						|
   been detected, and the actual parsing can be terminated early.
 | 
						|
   This is needed since character data handler can't be safely removed
 | 
						|
   from within the character data handler, but can be replaced.  It is
 | 
						|
   used only from the character data handler trampoline, and must be
 | 
						|
   used right after `flag_error()` is called. */
 | 
						|
static void
 | 
						|
noop_character_data_handler(void *userData, const XML_Char *data, int len)
 | 
						|
{
 | 
						|
    /* Do nothing. */
 | 
						|
}
 | 
						|
 | 
						|
static void
 | 
						|
flag_error(xmlparseobject *self)
 | 
						|
{
 | 
						|
    clear_handlers(self, 0);
 | 
						|
    XML_SetExternalEntityRefHandler(self->itself,
 | 
						|
                                    error_external_entity_ref_handler);
 | 
						|
}
 | 
						|
 | 
						|
static PyObject*
 | 
						|
call_with_frame(char *funcname, int lineno, PyObject* func, PyObject* args,
 | 
						|
                xmlparseobject *self)
 | 
						|
{
 | 
						|
    PyObject *res;
 | 
						|
 | 
						|
    res = PyEval_CallObject(func, args);
 | 
						|
    if (res == NULL) {
 | 
						|
        _PyTraceback_Add(funcname, __FILE__, lineno);
 | 
						|
        XML_StopParser(self->itself, XML_FALSE);
 | 
						|
    }
 | 
						|
    return res;
 | 
						|
}
 | 
						|
 | 
						|
static PyObject*
 | 
						|
string_intern(xmlparseobject *self, const char* str)
 | 
						|
{
 | 
						|
    PyObject *result = conv_string_to_unicode(str);
 | 
						|
    PyObject *value;
 | 
						|
    /* result can be NULL if the unicode conversion failed. */
 | 
						|
    if (!result)
 | 
						|
        return result;
 | 
						|
    if (!self->intern)
 | 
						|
        return result;
 | 
						|
    value = PyDict_GetItem(self->intern, result);
 | 
						|
    if (!value) {
 | 
						|
        if (PyDict_SetItem(self->intern, result, result) == 0)
 | 
						|
            return result;
 | 
						|
        else
 | 
						|
            return NULL;
 | 
						|
    }
 | 
						|
    Py_INCREF(value);
 | 
						|
    Py_DECREF(result);
 | 
						|
    return value;
 | 
						|
}
 | 
						|
 | 
						|
/* Return 0 on success, -1 on exception.
 | 
						|
 * flag_error() will be called before return if needed.
 | 
						|
 */
 | 
						|
static int
 | 
						|
call_character_handler(xmlparseobject *self, const XML_Char *buffer, int len)
 | 
						|
{
 | 
						|
    PyObject *args;
 | 
						|
    PyObject *temp;
 | 
						|
 | 
						|
    if (!have_handler(self, CharacterData))
 | 
						|
        return -1;
 | 
						|
 | 
						|
    args = PyTuple_New(1);
 | 
						|
    if (args == NULL)
 | 
						|
        return -1;
 | 
						|
    temp = (conv_string_len_to_unicode(buffer, len));
 | 
						|
    if (temp == NULL) {
 | 
						|
        Py_DECREF(args);
 | 
						|
        flag_error(self);
 | 
						|
        XML_SetCharacterDataHandler(self->itself,
 | 
						|
                                    noop_character_data_handler);
 | 
						|
        return -1;
 | 
						|
    }
 | 
						|
    PyTuple_SET_ITEM(args, 0, temp);
 | 
						|
    /* temp is now a borrowed reference; consider it unused. */
 | 
						|
    self->in_callback = 1;
 | 
						|
    temp = call_with_frame("CharacterData", __LINE__,
 | 
						|
                           self->handlers[CharacterData], args, self);
 | 
						|
    /* temp is an owned reference again, or NULL */
 | 
						|
    self->in_callback = 0;
 | 
						|
    Py_DECREF(args);
 | 
						|
    if (temp == NULL) {
 | 
						|
        flag_error(self);
 | 
						|
        XML_SetCharacterDataHandler(self->itself,
 | 
						|
                                    noop_character_data_handler);
 | 
						|
        return -1;
 | 
						|
    }
 | 
						|
    Py_DECREF(temp);
 | 
						|
    return 0;
 | 
						|
}
 | 
						|
 | 
						|
static int
 | 
						|
flush_character_buffer(xmlparseobject *self)
 | 
						|
{
 | 
						|
    int rc;
 | 
						|
    if (self->buffer == NULL || self->buffer_used == 0)
 | 
						|
        return 0;
 | 
						|
    rc = call_character_handler(self, self->buffer, self->buffer_used);
 | 
						|
    self->buffer_used = 0;
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
static void
 | 
						|
my_CharacterDataHandler(void *userData, const XML_Char *data, int len)
 | 
						|
{
 | 
						|
    xmlparseobject *self = (xmlparseobject *) userData;
 | 
						|
 | 
						|
    if (PyErr_Occurred())
 | 
						|
        return;
 | 
						|
 | 
						|
    if (self->buffer == NULL)
 | 
						|
        call_character_handler(self, data, len);
 | 
						|
    else {
 | 
						|
        if ((self->buffer_used + len) > self->buffer_size) {
 | 
						|
            if (flush_character_buffer(self) < 0)
 | 
						|
                return;
 | 
						|
            /* handler might have changed; drop the rest on the floor
 | 
						|
             * if there isn't a handler anymore
 | 
						|
             */
 | 
						|
            if (!have_handler(self, CharacterData))
 | 
						|
                return;
 | 
						|
        }
 | 
						|
        if (len > self->buffer_size) {
 | 
						|
            call_character_handler(self, data, len);
 | 
						|
            self->buffer_used = 0;
 | 
						|
        }
 | 
						|
        else {
 | 
						|
            memcpy(self->buffer + self->buffer_used,
 | 
						|
                   data, len * sizeof(XML_Char));
 | 
						|
            self->buffer_used += len;
 | 
						|
        }
 | 
						|
    }
 | 
						|
}
 | 
						|
 | 
						|
static void
 | 
						|
my_StartElementHandler(void *userData,
 | 
						|
                       const XML_Char *name, const XML_Char *atts[])
 | 
						|
{
 | 
						|
    xmlparseobject *self = (xmlparseobject *)userData;
 | 
						|
 | 
						|
    if (have_handler(self, StartElement)) {
 | 
						|
        PyObject *container, *rv, *args;
 | 
						|
        int i, max;
 | 
						|
 | 
						|
        if (PyErr_Occurred())
 | 
						|
            return;
 | 
						|
 | 
						|
        if (flush_character_buffer(self) < 0)
 | 
						|
            return;
 | 
						|
        /* Set max to the number of slots filled in atts[]; max/2 is
 | 
						|
         * the number of attributes we need to process.
 | 
						|
         */
 | 
						|
        if (self->specified_attributes) {
 | 
						|
            max = XML_GetSpecifiedAttributeCount(self->itself);
 | 
						|
        }
 | 
						|
        else {
 | 
						|
            max = 0;
 | 
						|
            while (atts[max] != NULL)
 | 
						|
                max += 2;
 | 
						|
        }
 | 
						|
        /* Build the container. */
 | 
						|
        if (self->ordered_attributes)
 | 
						|
            container = PyList_New(max);
 | 
						|
        else
 | 
						|
            container = PyDict_New();
 | 
						|
        if (container == NULL) {
 | 
						|
            flag_error(self);
 | 
						|
            return;
 | 
						|
        }
 | 
						|
        for (i = 0; i < max; i += 2) {
 | 
						|
            PyObject *n = string_intern(self, (XML_Char *) atts[i]);
 | 
						|
            PyObject *v;
 | 
						|
            if (n == NULL) {
 | 
						|
                flag_error(self);
 | 
						|
                Py_DECREF(container);
 | 
						|
                return;
 | 
						|
            }
 | 
						|
            v = conv_string_to_unicode((XML_Char *) atts[i+1]);
 | 
						|
            if (v == NULL) {
 | 
						|
                flag_error(self);
 | 
						|
                Py_DECREF(container);
 | 
						|
                Py_DECREF(n);
 | 
						|
                return;
 | 
						|
            }
 | 
						|
            if (self->ordered_attributes) {
 | 
						|
                PyList_SET_ITEM(container, i, n);
 | 
						|
                PyList_SET_ITEM(container, i+1, v);
 | 
						|
            }
 | 
						|
            else if (PyDict_SetItem(container, n, v)) {
 | 
						|
                flag_error(self);
 | 
						|
                Py_DECREF(n);
 | 
						|
                Py_DECREF(v);
 | 
						|
                return;
 | 
						|
            }
 | 
						|
            else {
 | 
						|
                Py_DECREF(n);
 | 
						|
                Py_DECREF(v);
 | 
						|
            }
 | 
						|
        }
 | 
						|
        args = string_intern(self, name);
 | 
						|
        if (args != NULL)
 | 
						|
            args = Py_BuildValue("(NN)", args, container);
 | 
						|
        if (args == NULL) {
 | 
						|
            Py_DECREF(container);
 | 
						|
            return;
 | 
						|
        }
 | 
						|
        /* Container is now a borrowed reference; ignore it. */
 | 
						|
        self->in_callback = 1;
 | 
						|
        rv = call_with_frame("StartElement", __LINE__,
 | 
						|
                             self->handlers[StartElement], args, self);
 | 
						|
        self->in_callback = 0;
 | 
						|
        Py_DECREF(args);
 | 
						|
        if (rv == NULL) {
 | 
						|
            flag_error(self);
 | 
						|
            return;
 | 
						|
        }
 | 
						|
        Py_DECREF(rv);
 | 
						|
    }
 | 
						|
}
 | 
						|
 | 
						|
#define RC_HANDLER(RC, NAME, PARAMS, INIT, PARAM_FORMAT, CONVERSION, \
 | 
						|
                RETURN, GETUSERDATA) \
 | 
						|
static RC \
 | 
						|
my_##NAME##Handler PARAMS {\
 | 
						|
    xmlparseobject *self = GETUSERDATA ; \
 | 
						|
    PyObject *args = NULL; \
 | 
						|
    PyObject *rv = NULL; \
 | 
						|
    INIT \
 | 
						|
\
 | 
						|
    if (have_handler(self, NAME)) { \
 | 
						|
        if (PyErr_Occurred()) \
 | 
						|
            return RETURN; \
 | 
						|
        if (flush_character_buffer(self) < 0) \
 | 
						|
            return RETURN; \
 | 
						|
        args = Py_BuildValue PARAM_FORMAT ;\
 | 
						|
        if (!args) { flag_error(self); return RETURN;} \
 | 
						|
        self->in_callback = 1; \
 | 
						|
        rv = call_with_frame(#NAME,__LINE__, \
 | 
						|
                             self->handlers[NAME], args, self); \
 | 
						|
        self->in_callback = 0; \
 | 
						|
        Py_DECREF(args); \
 | 
						|
        if (rv == NULL) { \
 | 
						|
            flag_error(self); \
 | 
						|
            return RETURN; \
 | 
						|
        } \
 | 
						|
        CONVERSION \
 | 
						|
        Py_DECREF(rv); \
 | 
						|
    } \
 | 
						|
    return RETURN; \
 | 
						|
}
 | 
						|
 | 
						|
#define VOID_HANDLER(NAME, PARAMS, PARAM_FORMAT) \
 | 
						|
        RC_HANDLER(void, NAME, PARAMS, ;, PARAM_FORMAT, ;, ;,\
 | 
						|
        (xmlparseobject *)userData)
 | 
						|
 | 
						|
#define INT_HANDLER(NAME, PARAMS, PARAM_FORMAT)\
 | 
						|
        RC_HANDLER(int, NAME, PARAMS, int rc=0;, PARAM_FORMAT, \
 | 
						|
                        rc = PyLong_AsLong(rv);, rc, \
 | 
						|
        (xmlparseobject *)userData)
 | 
						|
 | 
						|
VOID_HANDLER(EndElement,
 | 
						|
             (void *userData, const XML_Char *name),
 | 
						|
             ("(N)", string_intern(self, name)))
 | 
						|
 | 
						|
VOID_HANDLER(ProcessingInstruction,
 | 
						|
             (void *userData,
 | 
						|
              const XML_Char *target,
 | 
						|
              const XML_Char *data),
 | 
						|
             ("(NO&)", string_intern(self, target), conv_string_to_unicode ,data))
 | 
						|
 | 
						|
VOID_HANDLER(UnparsedEntityDecl,
 | 
						|
             (void *userData,
 | 
						|
              const XML_Char *entityName,
 | 
						|
              const XML_Char *base,
 | 
						|
              const XML_Char *systemId,
 | 
						|
              const XML_Char *publicId,
 | 
						|
              const XML_Char *notationName),
 | 
						|
             ("(NNNNN)",
 | 
						|
              string_intern(self, entityName), string_intern(self, base),
 | 
						|
              string_intern(self, systemId), string_intern(self, publicId),
 | 
						|
              string_intern(self, notationName)))
 | 
						|
 | 
						|
VOID_HANDLER(EntityDecl,
 | 
						|
             (void *userData,
 | 
						|
              const XML_Char *entityName,
 | 
						|
              int is_parameter_entity,
 | 
						|
              const XML_Char *value,
 | 
						|
              int value_length,
 | 
						|
              const XML_Char *base,
 | 
						|
              const XML_Char *systemId,
 | 
						|
              const XML_Char *publicId,
 | 
						|
              const XML_Char *notationName),
 | 
						|
             ("NiNNNNN",
 | 
						|
              string_intern(self, entityName), is_parameter_entity,
 | 
						|
              (conv_string_len_to_unicode(value, value_length)),
 | 
						|
              string_intern(self, base), string_intern(self, systemId),
 | 
						|
              string_intern(self, publicId),
 | 
						|
              string_intern(self, notationName)))
 | 
						|
 | 
						|
VOID_HANDLER(XmlDecl,
 | 
						|
             (void *userData,
 | 
						|
              const XML_Char *version,
 | 
						|
              const XML_Char *encoding,
 | 
						|
              int standalone),
 | 
						|
             ("(O&O&i)",
 | 
						|
              conv_string_to_unicode ,version, conv_string_to_unicode ,encoding,
 | 
						|
              standalone))
 | 
						|
 | 
						|
static PyObject *
 | 
						|
conv_content_model(XML_Content * const model,
 | 
						|
                   PyObject *(*conv_string)(const XML_Char *))
 | 
						|
{
 | 
						|
    PyObject *result = NULL;
 | 
						|
    PyObject *children = PyTuple_New(model->numchildren);
 | 
						|
    int i;
 | 
						|
 | 
						|
    if (children != NULL) {
 | 
						|
        assert(model->numchildren < INT_MAX);
 | 
						|
        for (i = 0; i < (int)model->numchildren; ++i) {
 | 
						|
            PyObject *child = conv_content_model(&model->children[i],
 | 
						|
                                                 conv_string);
 | 
						|
            if (child == NULL) {
 | 
						|
                Py_XDECREF(children);
 | 
						|
                return NULL;
 | 
						|
            }
 | 
						|
            PyTuple_SET_ITEM(children, i, child);
 | 
						|
        }
 | 
						|
        result = Py_BuildValue("(iiO&N)",
 | 
						|
                               model->type, model->quant,
 | 
						|
                               conv_string,model->name, children);
 | 
						|
    }
 | 
						|
    return result;
 | 
						|
}
 | 
						|
 | 
						|
static void
 | 
						|
my_ElementDeclHandler(void *userData,
 | 
						|
                      const XML_Char *name,
 | 
						|
                      XML_Content *model)
 | 
						|
{
 | 
						|
    xmlparseobject *self = (xmlparseobject *)userData;
 | 
						|
    PyObject *args = NULL;
 | 
						|
 | 
						|
    if (have_handler(self, ElementDecl)) {
 | 
						|
        PyObject *rv = NULL;
 | 
						|
        PyObject *modelobj, *nameobj;
 | 
						|
 | 
						|
        if (PyErr_Occurred())
 | 
						|
            return;
 | 
						|
 | 
						|
        if (flush_character_buffer(self) < 0)
 | 
						|
            goto finally;
 | 
						|
        modelobj = conv_content_model(model, (conv_string_to_unicode));
 | 
						|
        if (modelobj == NULL) {
 | 
						|
            flag_error(self);
 | 
						|
            goto finally;
 | 
						|
        }
 | 
						|
        nameobj = string_intern(self, name);
 | 
						|
        if (nameobj == NULL) {
 | 
						|
            Py_DECREF(modelobj);
 | 
						|
            flag_error(self);
 | 
						|
            goto finally;
 | 
						|
        }
 | 
						|
        args = Py_BuildValue("NN", nameobj, modelobj);
 | 
						|
        if (args == NULL) {
 | 
						|
            Py_DECREF(modelobj);
 | 
						|
            flag_error(self);
 | 
						|
            goto finally;
 | 
						|
        }
 | 
						|
        self->in_callback = 1;
 | 
						|
        rv = call_with_frame("ElementDecl", __LINE__,
 | 
						|
                             self->handlers[ElementDecl], args, self);
 | 
						|
        self->in_callback = 0;
 | 
						|
        if (rv == NULL) {
 | 
						|
            flag_error(self);
 | 
						|
            goto finally;
 | 
						|
        }
 | 
						|
        Py_DECREF(rv);
 | 
						|
    }
 | 
						|
 finally:
 | 
						|
    Py_XDECREF(args);
 | 
						|
    XML_FreeContentModel(self->itself, model);
 | 
						|
    return;
 | 
						|
}
 | 
						|
 | 
						|
VOID_HANDLER(AttlistDecl,
 | 
						|
             (void *userData,
 | 
						|
              const XML_Char *elname,
 | 
						|
              const XML_Char *attname,
 | 
						|
              const XML_Char *att_type,
 | 
						|
              const XML_Char *dflt,
 | 
						|
              int isrequired),
 | 
						|
             ("(NNO&O&i)",
 | 
						|
              string_intern(self, elname), string_intern(self, attname),
 | 
						|
              conv_string_to_unicode ,att_type, conv_string_to_unicode ,dflt,
 | 
						|
              isrequired))
 | 
						|
 | 
						|
#if XML_COMBINED_VERSION >= 19504
 | 
						|
VOID_HANDLER(SkippedEntity,
 | 
						|
             (void *userData,
 | 
						|
              const XML_Char *entityName,
 | 
						|
              int is_parameter_entity),
 | 
						|
             ("Ni",
 | 
						|
              string_intern(self, entityName), is_parameter_entity))
 | 
						|
#endif
 | 
						|
 | 
						|
VOID_HANDLER(NotationDecl,
 | 
						|
                (void *userData,
 | 
						|
                        const XML_Char *notationName,
 | 
						|
                        const XML_Char *base,
 | 
						|
                        const XML_Char *systemId,
 | 
						|
                        const XML_Char *publicId),
 | 
						|
                ("(NNNN)",
 | 
						|
                 string_intern(self, notationName), string_intern(self, base),
 | 
						|
                 string_intern(self, systemId), string_intern(self, publicId)))
 | 
						|
 | 
						|
VOID_HANDLER(StartNamespaceDecl,
 | 
						|
                (void *userData,
 | 
						|
                      const XML_Char *prefix,
 | 
						|
                      const XML_Char *uri),
 | 
						|
                ("(NN)",
 | 
						|
                 string_intern(self, prefix), string_intern(self, uri)))
 | 
						|
 | 
						|
VOID_HANDLER(EndNamespaceDecl,
 | 
						|
                (void *userData,
 | 
						|
                    const XML_Char *prefix),
 | 
						|
                ("(N)", string_intern(self, prefix)))
 | 
						|
 | 
						|
VOID_HANDLER(Comment,
 | 
						|
               (void *userData, const XML_Char *data),
 | 
						|
                ("(O&)", conv_string_to_unicode ,data))
 | 
						|
 | 
						|
VOID_HANDLER(StartCdataSection,
 | 
						|
               (void *userData),
 | 
						|
                ("()"))
 | 
						|
 | 
						|
VOID_HANDLER(EndCdataSection,
 | 
						|
               (void *userData),
 | 
						|
                ("()"))
 | 
						|
 | 
						|
VOID_HANDLER(Default,
 | 
						|
              (void *userData, const XML_Char *s, int len),
 | 
						|
              ("(N)", (conv_string_len_to_unicode(s,len))))
 | 
						|
 | 
						|
VOID_HANDLER(DefaultHandlerExpand,
 | 
						|
              (void *userData, const XML_Char *s, int len),
 | 
						|
              ("(N)", (conv_string_len_to_unicode(s,len))))
 | 
						|
 | 
						|
INT_HANDLER(NotStandalone,
 | 
						|
                (void *userData),
 | 
						|
                ("()"))
 | 
						|
 | 
						|
RC_HANDLER(int, ExternalEntityRef,
 | 
						|
                (XML_Parser parser,
 | 
						|
                    const XML_Char *context,
 | 
						|
                    const XML_Char *base,
 | 
						|
                    const XML_Char *systemId,
 | 
						|
                    const XML_Char *publicId),
 | 
						|
                int rc=0;,
 | 
						|
                ("(O&NNN)",
 | 
						|
                 conv_string_to_unicode ,context, string_intern(self, base),
 | 
						|
                 string_intern(self, systemId), string_intern(self, publicId)),
 | 
						|
                rc = PyLong_AsLong(rv);, rc,
 | 
						|
                XML_GetUserData(parser))
 | 
						|
 | 
						|
/* XXX UnknownEncodingHandler */
 | 
						|
 | 
						|
VOID_HANDLER(StartDoctypeDecl,
 | 
						|
             (void *userData, const XML_Char *doctypeName,
 | 
						|
              const XML_Char *sysid, const XML_Char *pubid,
 | 
						|
              int has_internal_subset),
 | 
						|
             ("(NNNi)", string_intern(self, doctypeName),
 | 
						|
              string_intern(self, sysid), string_intern(self, pubid),
 | 
						|
              has_internal_subset))
 | 
						|
 | 
						|
VOID_HANDLER(EndDoctypeDecl, (void *userData), ("()"))
 | 
						|
 | 
						|
/* ---------------------------------------------------------------- */
 | 
						|
/*[clinic input]
 | 
						|
class pyexpat.xmlparser "xmlparseobject *" "&Xmlparsetype"
 | 
						|
[clinic start generated code]*/
 | 
						|
/*[clinic end generated code: output=da39a3ee5e6b4b0d input=2393162385232e1c]*/
 | 
						|
 | 
						|
 | 
						|
static PyObject *
 | 
						|
get_parse_result(xmlparseobject *self, int rv)
 | 
						|
{
 | 
						|
    if (PyErr_Occurred()) {
 | 
						|
        return NULL;
 | 
						|
    }
 | 
						|
    if (rv == 0) {
 | 
						|
        return set_error(self, XML_GetErrorCode(self->itself));
 | 
						|
    }
 | 
						|
    if (flush_character_buffer(self) < 0) {
 | 
						|
        return NULL;
 | 
						|
    }
 | 
						|
    return PyLong_FromLong(rv);
 | 
						|
}
 | 
						|
 | 
						|
#define MAX_CHUNK_SIZE (1 << 20)
 | 
						|
 | 
						|
/*[clinic input]
 | 
						|
pyexpat.xmlparser.Parse
 | 
						|
 | 
						|
    data: object
 | 
						|
    isFinal: int = 0
 | 
						|
    /
 | 
						|
 | 
						|
Parse XML data.
 | 
						|
 | 
						|
`isfinal' should be true at end of input.
 | 
						|
[clinic start generated code]*/
 | 
						|
 | 
						|
static PyObject *
 | 
						|
pyexpat_xmlparser_Parse_impl(xmlparseobject *self, PyObject *data,
 | 
						|
                             int isFinal)
 | 
						|
/*[clinic end generated code: output=37e105d55645b0f2 input=e37b81b8948ca7e0]*/
 | 
						|
{
 | 
						|
    const char *s;
 | 
						|
    Py_ssize_t slen;
 | 
						|
    Py_buffer view;
 | 
						|
    int rc;
 | 
						|
 | 
						|
    if (PyUnicode_Check(data)) {
 | 
						|
        view.buf = NULL;
 | 
						|
        s = PyUnicode_AsUTF8AndSize(data, &slen);
 | 
						|
        if (s == NULL)
 | 
						|
            return NULL;
 | 
						|
        /* Explicitly set UTF-8 encoding. Return code ignored. */
 | 
						|
        (void)XML_SetEncoding(self->itself, "utf-8");
 | 
						|
    }
 | 
						|
    else {
 | 
						|
        if (PyObject_GetBuffer(data, &view, PyBUF_SIMPLE) < 0)
 | 
						|
            return NULL;
 | 
						|
        s = view.buf;
 | 
						|
        slen = view.len;
 | 
						|
    }
 | 
						|
 | 
						|
    while (slen > MAX_CHUNK_SIZE) {
 | 
						|
        rc = XML_Parse(self->itself, s, MAX_CHUNK_SIZE, 0);
 | 
						|
        if (!rc)
 | 
						|
            goto done;
 | 
						|
        s += MAX_CHUNK_SIZE;
 | 
						|
        slen -= MAX_CHUNK_SIZE;
 | 
						|
    }
 | 
						|
    assert(MAX_CHUNK_SIZE < INT_MAX && slen < INT_MAX);
 | 
						|
    rc = XML_Parse(self->itself, s, (int)slen, isFinal);
 | 
						|
 | 
						|
done:
 | 
						|
    if (view.buf != NULL)
 | 
						|
        PyBuffer_Release(&view);
 | 
						|
    return get_parse_result(self, rc);
 | 
						|
}
 | 
						|
 | 
						|
/* File reading copied from cPickle */
 | 
						|
 | 
						|
#define BUF_SIZE 2048
 | 
						|
 | 
						|
static int
 | 
						|
readinst(char *buf, int buf_size, PyObject *meth)
 | 
						|
{
 | 
						|
    PyObject *str;
 | 
						|
    Py_ssize_t len;
 | 
						|
    char *ptr;
 | 
						|
 | 
						|
    str = PyObject_CallFunction(meth, "n", buf_size);
 | 
						|
    if (str == NULL)
 | 
						|
        goto error;
 | 
						|
 | 
						|
    if (PyBytes_Check(str))
 | 
						|
        ptr = PyBytes_AS_STRING(str);
 | 
						|
    else if (PyByteArray_Check(str))
 | 
						|
        ptr = PyByteArray_AS_STRING(str);
 | 
						|
    else {
 | 
						|
        PyErr_Format(PyExc_TypeError,
 | 
						|
                     "read() did not return a bytes object (type=%.400s)",
 | 
						|
                     Py_TYPE(str)->tp_name);
 | 
						|
        goto error;
 | 
						|
    }
 | 
						|
    len = Py_SIZE(str);
 | 
						|
    if (len > buf_size) {
 | 
						|
        PyErr_Format(PyExc_ValueError,
 | 
						|
                     "read() returned too much data: "
 | 
						|
                     "%i bytes requested, %zd returned",
 | 
						|
                     buf_size, len);
 | 
						|
        goto error;
 | 
						|
    }
 | 
						|
    memcpy(buf, ptr, len);
 | 
						|
    Py_DECREF(str);
 | 
						|
    /* len <= buf_size <= INT_MAX */
 | 
						|
    return (int)len;
 | 
						|
 | 
						|
error:
 | 
						|
    Py_XDECREF(str);
 | 
						|
    return -1;
 | 
						|
}
 | 
						|
 | 
						|
/*[clinic input]
 | 
						|
pyexpat.xmlparser.ParseFile
 | 
						|
 | 
						|
    file: object
 | 
						|
    /
 | 
						|
 | 
						|
Parse XML data from file-like object.
 | 
						|
[clinic start generated code]*/
 | 
						|
 | 
						|
static PyObject *
 | 
						|
pyexpat_xmlparser_ParseFile(xmlparseobject *self, PyObject *file)
 | 
						|
/*[clinic end generated code: output=2adc6a13100cc42b input=fbb5a12b6038d735]*/
 | 
						|
{
 | 
						|
    int rv = 1;
 | 
						|
    PyObject *readmethod = NULL;
 | 
						|
    _Py_IDENTIFIER(read);
 | 
						|
 | 
						|
    readmethod = _PyObject_GetAttrId(file, &PyId_read);
 | 
						|
    if (readmethod == NULL) {
 | 
						|
        PyErr_SetString(PyExc_TypeError,
 | 
						|
                        "argument must have 'read' attribute");
 | 
						|
        return NULL;
 | 
						|
    }
 | 
						|
    for (;;) {
 | 
						|
        int bytes_read;
 | 
						|
        void *buf = XML_GetBuffer(self->itself, BUF_SIZE);
 | 
						|
        if (buf == NULL) {
 | 
						|
            Py_XDECREF(readmethod);
 | 
						|
            return get_parse_result(self, 0);
 | 
						|
        }
 | 
						|
 | 
						|
        bytes_read = readinst(buf, BUF_SIZE, readmethod);
 | 
						|
        if (bytes_read < 0) {
 | 
						|
            Py_DECREF(readmethod);
 | 
						|
            return NULL;
 | 
						|
        }
 | 
						|
        rv = XML_ParseBuffer(self->itself, bytes_read, bytes_read == 0);
 | 
						|
        if (PyErr_Occurred()) {
 | 
						|
            Py_XDECREF(readmethod);
 | 
						|
            return NULL;
 | 
						|
        }
 | 
						|
 | 
						|
        if (!rv || bytes_read == 0)
 | 
						|
            break;
 | 
						|
    }
 | 
						|
    Py_XDECREF(readmethod);
 | 
						|
    return get_parse_result(self, rv);
 | 
						|
}
 | 
						|
 | 
						|
/*[clinic input]
 | 
						|
pyexpat.xmlparser.SetBase
 | 
						|
 | 
						|
    base: str
 | 
						|
    /
 | 
						|
 | 
						|
Set the base URL for the parser.
 | 
						|
[clinic start generated code]*/
 | 
						|
 | 
						|
static PyObject *
 | 
						|
pyexpat_xmlparser_SetBase_impl(xmlparseobject *self, const char *base)
 | 
						|
/*[clinic end generated code: output=c212ddceb607b539 input=c684e5de895ee1a8]*/
 | 
						|
{
 | 
						|
    if (!XML_SetBase(self->itself, base)) {
 | 
						|
        return PyErr_NoMemory();
 | 
						|
    }
 | 
						|
    Py_RETURN_NONE;
 | 
						|
}
 | 
						|
 | 
						|
/*[clinic input]
 | 
						|
pyexpat.xmlparser.GetBase
 | 
						|
 | 
						|
Return base URL string for the parser.
 | 
						|
[clinic start generated code]*/
 | 
						|
 | 
						|
static PyObject *
 | 
						|
pyexpat_xmlparser_GetBase_impl(xmlparseobject *self)
 | 
						|
/*[clinic end generated code: output=2886cb21f9a8739a input=918d71c38009620e]*/
 | 
						|
{
 | 
						|
    return Py_BuildValue("z", XML_GetBase(self->itself));
 | 
						|
}
 | 
						|
 | 
						|
/*[clinic input]
 | 
						|
pyexpat.xmlparser.GetInputContext
 | 
						|
 | 
						|
Return the untranslated text of the input that caused the current event.
 | 
						|
 | 
						|
If the event was generated by a large amount of text (such as a start tag
 | 
						|
for an element with many attributes), not all of the text may be available.
 | 
						|
[clinic start generated code]*/
 | 
						|
 | 
						|
static PyObject *
 | 
						|
pyexpat_xmlparser_GetInputContext_impl(xmlparseobject *self)
 | 
						|
/*[clinic end generated code: output=a88026d683fc22cc input=034df8712db68379]*/
 | 
						|
{
 | 
						|
    if (self->in_callback) {
 | 
						|
        int offset, size;
 | 
						|
        const char *buffer
 | 
						|
            = XML_GetInputContext(self->itself, &offset, &size);
 | 
						|
 | 
						|
        if (buffer != NULL)
 | 
						|
            return PyBytes_FromStringAndSize(buffer + offset,
 | 
						|
                                              size - offset);
 | 
						|
        else
 | 
						|
            Py_RETURN_NONE;
 | 
						|
    }
 | 
						|
    else
 | 
						|
        Py_RETURN_NONE;
 | 
						|
}
 | 
						|
 | 
						|
/*[clinic input]
 | 
						|
pyexpat.xmlparser.ExternalEntityParserCreate
 | 
						|
 | 
						|
    context: str(accept={str, NoneType})
 | 
						|
    encoding: str = NULL
 | 
						|
    /
 | 
						|
 | 
						|
Create a parser for parsing an external entity based on the information passed to the ExternalEntityRefHandler.
 | 
						|
[clinic start generated code]*/
 | 
						|
 | 
						|
static PyObject *
 | 
						|
pyexpat_xmlparser_ExternalEntityParserCreate_impl(xmlparseobject *self,
 | 
						|
                                                  const char *context,
 | 
						|
                                                  const char *encoding)
 | 
						|
/*[clinic end generated code: output=535cda9d7a0fbcd6 input=b906714cc122c322]*/
 | 
						|
{
 | 
						|
    xmlparseobject *new_parser;
 | 
						|
    int i;
 | 
						|
 | 
						|
    new_parser = PyObject_GC_New(xmlparseobject, &Xmlparsetype);
 | 
						|
    if (new_parser == NULL)
 | 
						|
        return NULL;
 | 
						|
    new_parser->buffer_size = self->buffer_size;
 | 
						|
    new_parser->buffer_used = 0;
 | 
						|
    new_parser->buffer = NULL;
 | 
						|
    new_parser->ordered_attributes = self->ordered_attributes;
 | 
						|
    new_parser->specified_attributes = self->specified_attributes;
 | 
						|
    new_parser->in_callback = 0;
 | 
						|
    new_parser->ns_prefixes = self->ns_prefixes;
 | 
						|
    new_parser->itself = XML_ExternalEntityParserCreate(self->itself, context,
 | 
						|
                                                        encoding);
 | 
						|
    new_parser->handlers = 0;
 | 
						|
    new_parser->intern = self->intern;
 | 
						|
    Py_XINCREF(new_parser->intern);
 | 
						|
    PyObject_GC_Track(new_parser);
 | 
						|
 | 
						|
    if (self->buffer != NULL) {
 | 
						|
        new_parser->buffer = PyMem_Malloc(new_parser->buffer_size);
 | 
						|
        if (new_parser->buffer == NULL) {
 | 
						|
            Py_DECREF(new_parser);
 | 
						|
            return PyErr_NoMemory();
 | 
						|
        }
 | 
						|
    }
 | 
						|
    if (!new_parser->itself) {
 | 
						|
        Py_DECREF(new_parser);
 | 
						|
        return PyErr_NoMemory();
 | 
						|
    }
 | 
						|
 | 
						|
    XML_SetUserData(new_parser->itself, (void *)new_parser);
 | 
						|
 | 
						|
    /* allocate and clear handlers first */
 | 
						|
    for (i = 0; handler_info[i].name != NULL; i++)
 | 
						|
        /* do nothing */;
 | 
						|
 | 
						|
    new_parser->handlers = PyMem_New(PyObject *, i);
 | 
						|
    if (!new_parser->handlers) {
 | 
						|
        Py_DECREF(new_parser);
 | 
						|
        return PyErr_NoMemory();
 | 
						|
    }
 | 
						|
    clear_handlers(new_parser, 1);
 | 
						|
 | 
						|
    /* then copy handlers from self */
 | 
						|
    for (i = 0; handler_info[i].name != NULL; i++) {
 | 
						|
        PyObject *handler = self->handlers[i];
 | 
						|
        if (handler != NULL) {
 | 
						|
            Py_INCREF(handler);
 | 
						|
            new_parser->handlers[i] = handler;
 | 
						|
            handler_info[i].setter(new_parser->itself,
 | 
						|
                                   handler_info[i].handler);
 | 
						|
        }
 | 
						|
    }
 | 
						|
    return (PyObject *)new_parser;
 | 
						|
}
 | 
						|
 | 
						|
/*[clinic input]
 | 
						|
pyexpat.xmlparser.SetParamEntityParsing
 | 
						|
 | 
						|
    flag: int
 | 
						|
    /
 | 
						|
 | 
						|
Controls parsing of parameter entities (including the external DTD subset).
 | 
						|
 | 
						|
Possible flag values are XML_PARAM_ENTITY_PARSING_NEVER,
 | 
						|
XML_PARAM_ENTITY_PARSING_UNLESS_STANDALONE and
 | 
						|
XML_PARAM_ENTITY_PARSING_ALWAYS. Returns true if setting the flag
 | 
						|
was successful.
 | 
						|
[clinic start generated code]*/
 | 
						|
 | 
						|
static PyObject *
 | 
						|
pyexpat_xmlparser_SetParamEntityParsing_impl(xmlparseobject *self, int flag)
 | 
						|
/*[clinic end generated code: output=18668ee8e760d64c input=8aea19b4b15e9af1]*/
 | 
						|
{
 | 
						|
    flag = XML_SetParamEntityParsing(self->itself, flag);
 | 
						|
    return PyLong_FromLong(flag);
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
#if XML_COMBINED_VERSION >= 19505
 | 
						|
/*[clinic input]
 | 
						|
pyexpat.xmlparser.UseForeignDTD
 | 
						|
 | 
						|
    flag: bool = True
 | 
						|
    /
 | 
						|
 | 
						|
Allows the application to provide an artificial external subset if one is not specified as part of the document instance.
 | 
						|
 | 
						|
This readily allows the use of a 'default' document type controlled by the
 | 
						|
application, while still getting the advantage of providing document type
 | 
						|
information to the parser. 'flag' defaults to True if not provided.
 | 
						|
[clinic start generated code]*/
 | 
						|
 | 
						|
static PyObject *
 | 
						|
pyexpat_xmlparser_UseForeignDTD_impl(xmlparseobject *self, int flag)
 | 
						|
/*[clinic end generated code: output=cfaa9aa50bb0f65c input=78144c519d116a6e]*/
 | 
						|
{
 | 
						|
    enum XML_Error rc;
 | 
						|
 | 
						|
    rc = XML_UseForeignDTD(self->itself, flag ? XML_TRUE : XML_FALSE);
 | 
						|
    if (rc != XML_ERROR_NONE) {
 | 
						|
        return set_error(self, rc);
 | 
						|
    }
 | 
						|
    Py_INCREF(Py_None);
 | 
						|
    return Py_None;
 | 
						|
}
 | 
						|
#endif
 | 
						|
 | 
						|
/*[clinic input]
 | 
						|
pyexpat.xmlparser.__dir__
 | 
						|
[clinic start generated code]*/
 | 
						|
 | 
						|
static PyObject *
 | 
						|
pyexpat_xmlparser___dir___impl(xmlparseobject *self)
 | 
						|
/*[clinic end generated code: output=bc22451efb9e4d17 input=76aa455f2a661384]*/
 | 
						|
{
 | 
						|
#define APPEND(list, str)                               \
 | 
						|
        do {                                            \
 | 
						|
                PyObject *o = PyUnicode_FromString(str);        \
 | 
						|
                if (o != NULL)                          \
 | 
						|
                        PyList_Append(list, o);         \
 | 
						|
                Py_XDECREF(o);                          \
 | 
						|
        } while (0)
 | 
						|
 | 
						|
    int i;
 | 
						|
    PyObject *rc = PyList_New(0);
 | 
						|
    if (!rc)
 | 
						|
        return NULL;
 | 
						|
    for (i = 0; handler_info[i].name != NULL; i++) {
 | 
						|
        PyObject *o = get_handler_name(&handler_info[i]);
 | 
						|
        if (o != NULL)
 | 
						|
            PyList_Append(rc, o);
 | 
						|
        Py_XDECREF(o);
 | 
						|
    }
 | 
						|
    APPEND(rc, "ErrorCode");
 | 
						|
    APPEND(rc, "ErrorLineNumber");
 | 
						|
    APPEND(rc, "ErrorColumnNumber");
 | 
						|
    APPEND(rc, "ErrorByteIndex");
 | 
						|
    APPEND(rc, "CurrentLineNumber");
 | 
						|
    APPEND(rc, "CurrentColumnNumber");
 | 
						|
    APPEND(rc, "CurrentByteIndex");
 | 
						|
    APPEND(rc, "buffer_size");
 | 
						|
    APPEND(rc, "buffer_text");
 | 
						|
    APPEND(rc, "buffer_used");
 | 
						|
    APPEND(rc, "namespace_prefixes");
 | 
						|
    APPEND(rc, "ordered_attributes");
 | 
						|
    APPEND(rc, "specified_attributes");
 | 
						|
    APPEND(rc, "intern");
 | 
						|
 | 
						|
#undef APPEND
 | 
						|
 | 
						|
    if (PyErr_Occurred()) {
 | 
						|
        Py_DECREF(rc);
 | 
						|
        rc = NULL;
 | 
						|
    }
 | 
						|
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
static struct PyMethodDef xmlparse_methods[] = {
 | 
						|
    PYEXPAT_XMLPARSER_PARSE_METHODDEF
 | 
						|
    PYEXPAT_XMLPARSER_PARSEFILE_METHODDEF
 | 
						|
    PYEXPAT_XMLPARSER_SETBASE_METHODDEF
 | 
						|
    PYEXPAT_XMLPARSER_GETBASE_METHODDEF
 | 
						|
    PYEXPAT_XMLPARSER_GETINPUTCONTEXT_METHODDEF
 | 
						|
    PYEXPAT_XMLPARSER_EXTERNALENTITYPARSERCREATE_METHODDEF
 | 
						|
    PYEXPAT_XMLPARSER_SETPARAMENTITYPARSING_METHODDEF
 | 
						|
#if XML_COMBINED_VERSION >= 19505
 | 
						|
    PYEXPAT_XMLPARSER_USEFOREIGNDTD_METHODDEF
 | 
						|
#endif
 | 
						|
    PYEXPAT_XMLPARSER___DIR___METHODDEF
 | 
						|
    {NULL, NULL}  /* sentinel */
 | 
						|
};
 | 
						|
 | 
						|
/* ---------- */
 | 
						|
 | 
						|
 | 
						|
 | 
						|
/* pyexpat international encoding support.
 | 
						|
   Make it as simple as possible.
 | 
						|
*/
 | 
						|
 | 
						|
static int
 | 
						|
PyUnknownEncodingHandler(void *encodingHandlerData,
 | 
						|
                         const XML_Char *name,
 | 
						|
                         XML_Encoding *info)
 | 
						|
{
 | 
						|
    static unsigned char template_buffer[256] = {0};
 | 
						|
    PyObject* u;
 | 
						|
    int i;
 | 
						|
    void *data;
 | 
						|
    unsigned int kind;
 | 
						|
 | 
						|
    if (PyErr_Occurred())
 | 
						|
        return XML_STATUS_ERROR;
 | 
						|
 | 
						|
    if (template_buffer[1] == 0) {
 | 
						|
        for (i = 0; i < 256; i++)
 | 
						|
            template_buffer[i] = i;
 | 
						|
    }
 | 
						|
 | 
						|
    u = PyUnicode_Decode((char*) template_buffer, 256, name, "replace");
 | 
						|
    if (u == NULL || PyUnicode_READY(u)) {
 | 
						|
        Py_XDECREF(u);
 | 
						|
        return XML_STATUS_ERROR;
 | 
						|
    }
 | 
						|
 | 
						|
    if (PyUnicode_GET_LENGTH(u) != 256) {
 | 
						|
        Py_DECREF(u);
 | 
						|
        PyErr_SetString(PyExc_ValueError,
 | 
						|
                        "multi-byte encodings are not supported");
 | 
						|
        return XML_STATUS_ERROR;
 | 
						|
    }
 | 
						|
 | 
						|
    kind = PyUnicode_KIND(u);
 | 
						|
    data = PyUnicode_DATA(u);
 | 
						|
    for (i = 0; i < 256; i++) {
 | 
						|
        Py_UCS4 ch = PyUnicode_READ(kind, data, i);
 | 
						|
        if (ch != Py_UNICODE_REPLACEMENT_CHARACTER)
 | 
						|
            info->map[i] = ch;
 | 
						|
        else
 | 
						|
            info->map[i] = -1;
 | 
						|
    }
 | 
						|
 | 
						|
    info->data = NULL;
 | 
						|
    info->convert = NULL;
 | 
						|
    info->release = NULL;
 | 
						|
    Py_DECREF(u);
 | 
						|
 | 
						|
    return XML_STATUS_OK;
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
static PyObject *
 | 
						|
newxmlparseobject(const char *encoding, const char *namespace_separator, PyObject *intern)
 | 
						|
{
 | 
						|
    int i;
 | 
						|
    xmlparseobject *self;
 | 
						|
 | 
						|
    self = PyObject_GC_New(xmlparseobject, &Xmlparsetype);
 | 
						|
    if (self == NULL)
 | 
						|
        return NULL;
 | 
						|
 | 
						|
    self->buffer = NULL;
 | 
						|
    self->buffer_size = CHARACTER_DATA_BUFFER_SIZE;
 | 
						|
    self->buffer_used = 0;
 | 
						|
    self->ordered_attributes = 0;
 | 
						|
    self->specified_attributes = 0;
 | 
						|
    self->in_callback = 0;
 | 
						|
    self->ns_prefixes = 0;
 | 
						|
    self->handlers = NULL;
 | 
						|
    self->intern = intern;
 | 
						|
    Py_XINCREF(self->intern);
 | 
						|
    PyObject_GC_Track(self);
 | 
						|
 | 
						|
    /* namespace_separator is either NULL or contains one char + \0 */
 | 
						|
    self->itself = XML_ParserCreate_MM(encoding, &ExpatMemoryHandler,
 | 
						|
                                       namespace_separator);
 | 
						|
    if (self->itself == NULL) {
 | 
						|
        PyErr_SetString(PyExc_RuntimeError,
 | 
						|
                        "XML_ParserCreate failed");
 | 
						|
        Py_DECREF(self);
 | 
						|
        return NULL;
 | 
						|
    }
 | 
						|
#if ((XML_MAJOR_VERSION >= 2) && (XML_MINOR_VERSION >= 1)) || defined(XML_HAS_SET_HASH_SALT)
 | 
						|
    /* This feature was added upstream in libexpat 2.1.0.  Our expat copy
 | 
						|
     * has a backport of this feature where we also define XML_HAS_SET_HASH_SALT
 | 
						|
     * to indicate that we can still use it. */
 | 
						|
    XML_SetHashSalt(self->itself,
 | 
						|
                    (unsigned long)_Py_HashSecret.expat.hashsalt);
 | 
						|
#endif
 | 
						|
    XML_SetUserData(self->itself, (void *)self);
 | 
						|
    XML_SetUnknownEncodingHandler(self->itself,
 | 
						|
                  (XML_UnknownEncodingHandler) PyUnknownEncodingHandler, NULL);
 | 
						|
 | 
						|
    for (i = 0; handler_info[i].name != NULL; i++)
 | 
						|
        /* do nothing */;
 | 
						|
 | 
						|
    self->handlers = PyMem_New(PyObject *, i);
 | 
						|
    if (!self->handlers) {
 | 
						|
        Py_DECREF(self);
 | 
						|
        return PyErr_NoMemory();
 | 
						|
    }
 | 
						|
    clear_handlers(self, 1);
 | 
						|
 | 
						|
    return (PyObject*)self;
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
static void
 | 
						|
xmlparse_dealloc(xmlparseobject *self)
 | 
						|
{
 | 
						|
    int i;
 | 
						|
    PyObject_GC_UnTrack(self);
 | 
						|
    if (self->itself != NULL)
 | 
						|
        XML_ParserFree(self->itself);
 | 
						|
    self->itself = NULL;
 | 
						|
 | 
						|
    if (self->handlers != NULL) {
 | 
						|
        PyObject *temp;
 | 
						|
        for (i = 0; handler_info[i].name != NULL; i++) {
 | 
						|
            temp = self->handlers[i];
 | 
						|
            self->handlers[i] = NULL;
 | 
						|
            Py_XDECREF(temp);
 | 
						|
        }
 | 
						|
        PyMem_Free(self->handlers);
 | 
						|
        self->handlers = NULL;
 | 
						|
    }
 | 
						|
    if (self->buffer != NULL) {
 | 
						|
        PyMem_Free(self->buffer);
 | 
						|
        self->buffer = NULL;
 | 
						|
    }
 | 
						|
    Py_XDECREF(self->intern);
 | 
						|
    PyObject_GC_Del(self);
 | 
						|
}
 | 
						|
 | 
						|
static int
 | 
						|
handlername2int(PyObject *name)
 | 
						|
{
 | 
						|
    int i;
 | 
						|
    for (i = 0; handler_info[i].name != NULL; i++) {
 | 
						|
        if (PyUnicode_CompareWithASCIIString(
 | 
						|
                name, handler_info[i].name) == 0) {
 | 
						|
            return i;
 | 
						|
        }
 | 
						|
    }
 | 
						|
    return -1;
 | 
						|
}
 | 
						|
 | 
						|
static PyObject *
 | 
						|
get_pybool(int istrue)
 | 
						|
{
 | 
						|
    PyObject *result = istrue ? Py_True : Py_False;
 | 
						|
    Py_INCREF(result);
 | 
						|
    return result;
 | 
						|
}
 | 
						|
 | 
						|
static PyObject *
 | 
						|
xmlparse_getattro(xmlparseobject *self, PyObject *nameobj)
 | 
						|
{
 | 
						|
    Py_UCS4 first_char;
 | 
						|
    int handlernum = -1;
 | 
						|
 | 
						|
    if (!PyUnicode_Check(nameobj))
 | 
						|
        goto generic;
 | 
						|
    if (PyUnicode_READY(nameobj))
 | 
						|
        return NULL;
 | 
						|
 | 
						|
    handlernum = handlername2int(nameobj);
 | 
						|
 | 
						|
    if (handlernum != -1) {
 | 
						|
        PyObject *result = self->handlers[handlernum];
 | 
						|
        if (result == NULL)
 | 
						|
            result = Py_None;
 | 
						|
        Py_INCREF(result);
 | 
						|
        return result;
 | 
						|
    }
 | 
						|
 | 
						|
    first_char = PyUnicode_READ_CHAR(nameobj, 0);
 | 
						|
    if (first_char == 'E') {
 | 
						|
        if (PyUnicode_CompareWithASCIIString(nameobj, "ErrorCode") == 0)
 | 
						|
            return PyLong_FromLong((long)
 | 
						|
                                  XML_GetErrorCode(self->itself));
 | 
						|
        if (PyUnicode_CompareWithASCIIString(nameobj, "ErrorLineNumber") == 0)
 | 
						|
            return PyLong_FromLong((long)
 | 
						|
                                  XML_GetErrorLineNumber(self->itself));
 | 
						|
        if (PyUnicode_CompareWithASCIIString(nameobj, "ErrorColumnNumber") == 0)
 | 
						|
            return PyLong_FromLong((long)
 | 
						|
                                  XML_GetErrorColumnNumber(self->itself));
 | 
						|
        if (PyUnicode_CompareWithASCIIString(nameobj, "ErrorByteIndex") == 0)
 | 
						|
            return PyLong_FromLong((long)
 | 
						|
                                  XML_GetErrorByteIndex(self->itself));
 | 
						|
    }
 | 
						|
    if (first_char == 'C') {
 | 
						|
        if (PyUnicode_CompareWithASCIIString(nameobj, "CurrentLineNumber") == 0)
 | 
						|
            return PyLong_FromLong((long)
 | 
						|
                                  XML_GetCurrentLineNumber(self->itself));
 | 
						|
        if (PyUnicode_CompareWithASCIIString(nameobj, "CurrentColumnNumber") == 0)
 | 
						|
            return PyLong_FromLong((long)
 | 
						|
                                  XML_GetCurrentColumnNumber(self->itself));
 | 
						|
        if (PyUnicode_CompareWithASCIIString(nameobj, "CurrentByteIndex") == 0)
 | 
						|
            return PyLong_FromLong((long)
 | 
						|
                                  XML_GetCurrentByteIndex(self->itself));
 | 
						|
    }
 | 
						|
    if (first_char == 'b') {
 | 
						|
        if (PyUnicode_CompareWithASCIIString(nameobj, "buffer_size") == 0)
 | 
						|
            return PyLong_FromLong((long) self->buffer_size);
 | 
						|
        if (PyUnicode_CompareWithASCIIString(nameobj, "buffer_text") == 0)
 | 
						|
            return get_pybool(self->buffer != NULL);
 | 
						|
        if (PyUnicode_CompareWithASCIIString(nameobj, "buffer_used") == 0)
 | 
						|
            return PyLong_FromLong((long) self->buffer_used);
 | 
						|
    }
 | 
						|
    if (PyUnicode_CompareWithASCIIString(nameobj, "namespace_prefixes") == 0)
 | 
						|
        return get_pybool(self->ns_prefixes);
 | 
						|
    if (PyUnicode_CompareWithASCIIString(nameobj, "ordered_attributes") == 0)
 | 
						|
        return get_pybool(self->ordered_attributes);
 | 
						|
    if (PyUnicode_CompareWithASCIIString(nameobj, "specified_attributes") == 0)
 | 
						|
        return get_pybool((long) self->specified_attributes);
 | 
						|
    if (PyUnicode_CompareWithASCIIString(nameobj, "intern") == 0) {
 | 
						|
        if (self->intern == NULL) {
 | 
						|
            Py_INCREF(Py_None);
 | 
						|
            return Py_None;
 | 
						|
        }
 | 
						|
        else {
 | 
						|
            Py_INCREF(self->intern);
 | 
						|
            return self->intern;
 | 
						|
        }
 | 
						|
    }
 | 
						|
  generic:
 | 
						|
    return PyObject_GenericGetAttr((PyObject*)self, nameobj);
 | 
						|
}
 | 
						|
 | 
						|
static int
 | 
						|
sethandler(xmlparseobject *self, PyObject *name, PyObject* v)
 | 
						|
{
 | 
						|
    int handlernum = handlername2int(name);
 | 
						|
    if (handlernum >= 0) {
 | 
						|
        xmlhandler c_handler = NULL;
 | 
						|
        PyObject *temp = self->handlers[handlernum];
 | 
						|
 | 
						|
        if (v == Py_None) {
 | 
						|
            /* If this is the character data handler, and a character
 | 
						|
               data handler is already active, we need to be more
 | 
						|
               careful.  What we can safely do is replace the existing
 | 
						|
               character data handler callback function with a no-op
 | 
						|
               function that will refuse to call Python.  The downside
 | 
						|
               is that this doesn't completely remove the character
 | 
						|
               data handler from the C layer if there's any callback
 | 
						|
               active, so Expat does a little more work than it
 | 
						|
               otherwise would, but that's really an odd case.  A more
 | 
						|
               elaborate system of handlers and state could remove the
 | 
						|
               C handler more effectively. */
 | 
						|
            if (handlernum == CharacterData && self->in_callback)
 | 
						|
                c_handler = noop_character_data_handler;
 | 
						|
            v = NULL;
 | 
						|
        }
 | 
						|
        else if (v != NULL) {
 | 
						|
            Py_INCREF(v);
 | 
						|
            c_handler = handler_info[handlernum].handler;
 | 
						|
        }
 | 
						|
        self->handlers[handlernum] = v;
 | 
						|
        Py_XDECREF(temp);
 | 
						|
        handler_info[handlernum].setter(self->itself, c_handler);
 | 
						|
        return 1;
 | 
						|
    }
 | 
						|
    return 0;
 | 
						|
}
 | 
						|
 | 
						|
static int
 | 
						|
xmlparse_setattro(xmlparseobject *self, PyObject *name, PyObject *v)
 | 
						|
{
 | 
						|
    /* Set attribute 'name' to value 'v'. v==NULL means delete */
 | 
						|
    if (v == NULL) {
 | 
						|
        PyErr_SetString(PyExc_RuntimeError, "Cannot delete attribute");
 | 
						|
        return -1;
 | 
						|
    }
 | 
						|
    assert(PyUnicode_Check(name));
 | 
						|
    if (PyUnicode_CompareWithASCIIString(name, "buffer_text") == 0) {
 | 
						|
        int b = PyObject_IsTrue(v);
 | 
						|
        if (b < 0)
 | 
						|
            return -1;
 | 
						|
        if (b) {
 | 
						|
            if (self->buffer == NULL) {
 | 
						|
                self->buffer = PyMem_Malloc(self->buffer_size);
 | 
						|
                if (self->buffer == NULL) {
 | 
						|
                    PyErr_NoMemory();
 | 
						|
                    return -1;
 | 
						|
                }
 | 
						|
                self->buffer_used = 0;
 | 
						|
            }
 | 
						|
        }
 | 
						|
        else if (self->buffer != NULL) {
 | 
						|
            if (flush_character_buffer(self) < 0)
 | 
						|
                return -1;
 | 
						|
            PyMem_Free(self->buffer);
 | 
						|
            self->buffer = NULL;
 | 
						|
        }
 | 
						|
        return 0;
 | 
						|
    }
 | 
						|
    if (PyUnicode_CompareWithASCIIString(name, "namespace_prefixes") == 0) {
 | 
						|
        int b = PyObject_IsTrue(v);
 | 
						|
        if (b < 0)
 | 
						|
            return -1;
 | 
						|
        self->ns_prefixes = b;
 | 
						|
        XML_SetReturnNSTriplet(self->itself, self->ns_prefixes);
 | 
						|
        return 0;
 | 
						|
    }
 | 
						|
    if (PyUnicode_CompareWithASCIIString(name, "ordered_attributes") == 0) {
 | 
						|
        int b = PyObject_IsTrue(v);
 | 
						|
        if (b < 0)
 | 
						|
            return -1;
 | 
						|
        self->ordered_attributes = b;
 | 
						|
        return 0;
 | 
						|
    }
 | 
						|
    if (PyUnicode_CompareWithASCIIString(name, "specified_attributes") == 0) {
 | 
						|
        int b = PyObject_IsTrue(v);
 | 
						|
        if (b < 0)
 | 
						|
            return -1;
 | 
						|
        self->specified_attributes = b;
 | 
						|
        return 0;
 | 
						|
    }
 | 
						|
 | 
						|
    if (PyUnicode_CompareWithASCIIString(name, "buffer_size") == 0) {
 | 
						|
      long new_buffer_size;
 | 
						|
      if (!PyLong_Check(v)) {
 | 
						|
        PyErr_SetString(PyExc_TypeError, "buffer_size must be an integer");
 | 
						|
        return -1;
 | 
						|
      }
 | 
						|
 | 
						|
      new_buffer_size=PyLong_AS_LONG(v);
 | 
						|
      /* trivial case -- no change */
 | 
						|
      if (new_buffer_size == self->buffer_size) {
 | 
						|
        return 0;
 | 
						|
      }
 | 
						|
 | 
						|
      if (new_buffer_size <= 0) {
 | 
						|
        PyErr_SetString(PyExc_ValueError, "buffer_size must be greater than zero");
 | 
						|
        return -1;
 | 
						|
      }
 | 
						|
 | 
						|
      /* check maximum */
 | 
						|
      if (new_buffer_size > INT_MAX) {
 | 
						|
        char errmsg[100];
 | 
						|
        sprintf(errmsg, "buffer_size must not be greater than %i", INT_MAX);
 | 
						|
        PyErr_SetString(PyExc_ValueError, errmsg);
 | 
						|
        return -1;
 | 
						|
      }
 | 
						|
 | 
						|
      if (self->buffer != NULL) {
 | 
						|
        /* there is already a buffer */
 | 
						|
        if (self->buffer_used != 0) {
 | 
						|
            if (flush_character_buffer(self) < 0) {
 | 
						|
                return -1;
 | 
						|
            }
 | 
						|
        }
 | 
						|
        /* free existing buffer */
 | 
						|
        PyMem_Free(self->buffer);
 | 
						|
      }
 | 
						|
      self->buffer = PyMem_Malloc(new_buffer_size);
 | 
						|
      if (self->buffer == NULL) {
 | 
						|
        PyErr_NoMemory();
 | 
						|
        return -1;
 | 
						|
      }
 | 
						|
      self->buffer_size = new_buffer_size;
 | 
						|
      return 0;
 | 
						|
    }
 | 
						|
 | 
						|
    if (PyUnicode_CompareWithASCIIString(name, "CharacterDataHandler") == 0) {
 | 
						|
        /* If we're changing the character data handler, flush all
 | 
						|
         * cached data with the old handler.  Not sure there's a
 | 
						|
         * "right" thing to do, though, but this probably won't
 | 
						|
         * happen.
 | 
						|
         */
 | 
						|
        if (flush_character_buffer(self) < 0)
 | 
						|
            return -1;
 | 
						|
    }
 | 
						|
    if (sethandler(self, name, v)) {
 | 
						|
        return 0;
 | 
						|
    }
 | 
						|
    PyErr_SetObject(PyExc_AttributeError, name);
 | 
						|
    return -1;
 | 
						|
}
 | 
						|
 | 
						|
static int
 | 
						|
xmlparse_traverse(xmlparseobject *op, visitproc visit, void *arg)
 | 
						|
{
 | 
						|
    int i;
 | 
						|
    for (i = 0; handler_info[i].name != NULL; i++)
 | 
						|
        Py_VISIT(op->handlers[i]);
 | 
						|
    return 0;
 | 
						|
}
 | 
						|
 | 
						|
static int
 | 
						|
xmlparse_clear(xmlparseobject *op)
 | 
						|
{
 | 
						|
    clear_handlers(op, 0);
 | 
						|
    Py_CLEAR(op->intern);
 | 
						|
    return 0;
 | 
						|
}
 | 
						|
 | 
						|
PyDoc_STRVAR(Xmlparsetype__doc__, "XML parser");
 | 
						|
 | 
						|
static PyTypeObject Xmlparsetype = {
 | 
						|
        PyVarObject_HEAD_INIT(NULL, 0)
 | 
						|
        "pyexpat.xmlparser",            /*tp_name*/
 | 
						|
        sizeof(xmlparseobject),         /*tp_basicsize*/
 | 
						|
        0,                              /*tp_itemsize*/
 | 
						|
        /* methods */
 | 
						|
        (destructor)xmlparse_dealloc,   /*tp_dealloc*/
 | 
						|
        (printfunc)0,           /*tp_print*/
 | 
						|
        0,                      /*tp_getattr*/
 | 
						|
        0,  /*tp_setattr*/
 | 
						|
        0,                      /*tp_reserved*/
 | 
						|
        (reprfunc)0,            /*tp_repr*/
 | 
						|
        0,                      /*tp_as_number*/
 | 
						|
        0,              /*tp_as_sequence*/
 | 
						|
        0,              /*tp_as_mapping*/
 | 
						|
        (hashfunc)0,            /*tp_hash*/
 | 
						|
        (ternaryfunc)0,         /*tp_call*/
 | 
						|
        (reprfunc)0,            /*tp_str*/
 | 
						|
        (getattrofunc)xmlparse_getattro, /* tp_getattro */
 | 
						|
        (setattrofunc)xmlparse_setattro,              /* tp_setattro */
 | 
						|
        0,              /* tp_as_buffer */
 | 
						|
        Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC, /*tp_flags*/
 | 
						|
        Xmlparsetype__doc__, /* tp_doc - Documentation string */
 | 
						|
        (traverseproc)xmlparse_traverse,        /* tp_traverse */
 | 
						|
        (inquiry)xmlparse_clear,                /* tp_clear */
 | 
						|
        0,                              /* tp_richcompare */
 | 
						|
        0,                              /* tp_weaklistoffset */
 | 
						|
        0,                              /* tp_iter */
 | 
						|
        0,                              /* tp_iternext */
 | 
						|
        xmlparse_methods,               /* tp_methods */
 | 
						|
};
 | 
						|
 | 
						|
/* End of code for xmlparser objects */
 | 
						|
/* -------------------------------------------------------- */
 | 
						|
 | 
						|
/*[clinic input]
 | 
						|
pyexpat.ParserCreate
 | 
						|
 | 
						|
    encoding: str(accept={str, NoneType}) = NULL
 | 
						|
    namespace_separator: str(accept={str, NoneType}) = NULL
 | 
						|
    intern: object = NULL
 | 
						|
 | 
						|
Return a new XML parser object.
 | 
						|
[clinic start generated code]*/
 | 
						|
 | 
						|
static PyObject *
 | 
						|
pyexpat_ParserCreate_impl(PyModuleDef *module, const char *encoding,
 | 
						|
                          const char *namespace_separator, PyObject *intern)
 | 
						|
/*[clinic end generated code: output=81fccd233e1743a8 input=23d29704acad385d]*/
 | 
						|
{
 | 
						|
    PyObject *result;
 | 
						|
    int intern_decref = 0;
 | 
						|
 | 
						|
    if (namespace_separator != NULL
 | 
						|
        && strlen(namespace_separator) > 1) {
 | 
						|
        PyErr_SetString(PyExc_ValueError,
 | 
						|
                        "namespace_separator must be at most one"
 | 
						|
                        " character, omitted, or None");
 | 
						|
        return NULL;
 | 
						|
    }
 | 
						|
    /* Explicitly passing None means no interning is desired.
 | 
						|
       Not passing anything means that a new dictionary is used. */
 | 
						|
    if (intern == Py_None)
 | 
						|
        intern = NULL;
 | 
						|
    else if (intern == NULL) {
 | 
						|
        intern = PyDict_New();
 | 
						|
        if (!intern)
 | 
						|
            return NULL;
 | 
						|
        intern_decref = 1;
 | 
						|
    }
 | 
						|
    else if (!PyDict_Check(intern)) {
 | 
						|
        PyErr_SetString(PyExc_TypeError, "intern must be a dictionary");
 | 
						|
        return NULL;
 | 
						|
    }
 | 
						|
 | 
						|
    result = newxmlparseobject(encoding, namespace_separator, intern);
 | 
						|
    if (intern_decref) {
 | 
						|
        Py_DECREF(intern);
 | 
						|
    }
 | 
						|
    return result;
 | 
						|
}
 | 
						|
 | 
						|
/*[clinic input]
 | 
						|
pyexpat.ErrorString
 | 
						|
 | 
						|
    code: long
 | 
						|
    /
 | 
						|
 | 
						|
Returns string error for given number.
 | 
						|
[clinic start generated code]*/
 | 
						|
 | 
						|
static PyObject *
 | 
						|
pyexpat_ErrorString_impl(PyModuleDef *module, long code)
 | 
						|
/*[clinic end generated code: output=d87668108b6868e5 input=cc67de010d9e62b3]*/
 | 
						|
{
 | 
						|
    return Py_BuildValue("z", XML_ErrorString((int)code));
 | 
						|
}
 | 
						|
 | 
						|
/* List of methods defined in the module */
 | 
						|
 | 
						|
static struct PyMethodDef pyexpat_methods[] = {
 | 
						|
    PYEXPAT_PARSERCREATE_METHODDEF
 | 
						|
    PYEXPAT_ERRORSTRING_METHODDEF
 | 
						|
    {NULL, NULL}  /* sentinel */
 | 
						|
};
 | 
						|
 | 
						|
/* Module docstring */
 | 
						|
 | 
						|
PyDoc_STRVAR(pyexpat_module_documentation,
 | 
						|
"Python wrapper for Expat parser.");
 | 
						|
 | 
						|
/* Initialization function for the module */
 | 
						|
 | 
						|
#ifndef MODULE_NAME
 | 
						|
#define MODULE_NAME "pyexpat"
 | 
						|
#endif
 | 
						|
 | 
						|
#ifndef MODULE_INITFUNC
 | 
						|
#define MODULE_INITFUNC PyInit_pyexpat
 | 
						|
#endif
 | 
						|
 | 
						|
static struct PyModuleDef pyexpatmodule = {
 | 
						|
        PyModuleDef_HEAD_INIT,
 | 
						|
        MODULE_NAME,
 | 
						|
        pyexpat_module_documentation,
 | 
						|
        -1,
 | 
						|
        pyexpat_methods,
 | 
						|
        NULL,
 | 
						|
        NULL,
 | 
						|
        NULL,
 | 
						|
        NULL
 | 
						|
};
 | 
						|
 | 
						|
PyMODINIT_FUNC
 | 
						|
MODULE_INITFUNC(void)
 | 
						|
{
 | 
						|
    PyObject *m, *d;
 | 
						|
    PyObject *errmod_name = PyUnicode_FromString(MODULE_NAME ".errors");
 | 
						|
    PyObject *errors_module;
 | 
						|
    PyObject *modelmod_name;
 | 
						|
    PyObject *model_module;
 | 
						|
    PyObject *sys_modules;
 | 
						|
    PyObject *tmpnum, *tmpstr;
 | 
						|
    PyObject *codes_dict;
 | 
						|
    PyObject *rev_codes_dict;
 | 
						|
    int res;
 | 
						|
    static struct PyExpat_CAPI capi;
 | 
						|
    PyObject *capi_object;
 | 
						|
 | 
						|
    if (errmod_name == NULL)
 | 
						|
        return NULL;
 | 
						|
    modelmod_name = PyUnicode_FromString(MODULE_NAME ".model");
 | 
						|
    if (modelmod_name == NULL)
 | 
						|
        return NULL;
 | 
						|
 | 
						|
    if (PyType_Ready(&Xmlparsetype) < 0)
 | 
						|
        return NULL;
 | 
						|
 | 
						|
    /* Create the module and add the functions */
 | 
						|
    m = PyModule_Create(&pyexpatmodule);
 | 
						|
    if (m == NULL)
 | 
						|
        return NULL;
 | 
						|
 | 
						|
    /* Add some symbolic constants to the module */
 | 
						|
    if (ErrorObject == NULL) {
 | 
						|
        ErrorObject = PyErr_NewException("xml.parsers.expat.ExpatError",
 | 
						|
                                         NULL, NULL);
 | 
						|
        if (ErrorObject == NULL)
 | 
						|
            return NULL;
 | 
						|
    }
 | 
						|
    Py_INCREF(ErrorObject);
 | 
						|
    PyModule_AddObject(m, "error", ErrorObject);
 | 
						|
    Py_INCREF(ErrorObject);
 | 
						|
    PyModule_AddObject(m, "ExpatError", ErrorObject);
 | 
						|
    Py_INCREF(&Xmlparsetype);
 | 
						|
    PyModule_AddObject(m, "XMLParserType", (PyObject *) &Xmlparsetype);
 | 
						|
 | 
						|
    PyModule_AddStringConstant(m, "EXPAT_VERSION",
 | 
						|
                               XML_ExpatVersion());
 | 
						|
    {
 | 
						|
        XML_Expat_Version info = XML_ExpatVersionInfo();
 | 
						|
        PyModule_AddObject(m, "version_info",
 | 
						|
                           Py_BuildValue("(iii)", info.major,
 | 
						|
                                         info.minor, info.micro));
 | 
						|
    }
 | 
						|
    /* XXX When Expat supports some way of figuring out how it was
 | 
						|
       compiled, this should check and set native_encoding
 | 
						|
       appropriately.
 | 
						|
    */
 | 
						|
    PyModule_AddStringConstant(m, "native_encoding", "UTF-8");
 | 
						|
 | 
						|
    sys_modules = PySys_GetObject("modules");
 | 
						|
    d = PyModule_GetDict(m);
 | 
						|
    errors_module = PyDict_GetItem(d, errmod_name);
 | 
						|
    if (errors_module == NULL) {
 | 
						|
        errors_module = PyModule_New(MODULE_NAME ".errors");
 | 
						|
        if (errors_module != NULL) {
 | 
						|
            PyDict_SetItem(sys_modules, errmod_name, errors_module);
 | 
						|
            /* gives away the reference to errors_module */
 | 
						|
            PyModule_AddObject(m, "errors", errors_module);
 | 
						|
        }
 | 
						|
    }
 | 
						|
    Py_DECREF(errmod_name);
 | 
						|
    model_module = PyDict_GetItem(d, modelmod_name);
 | 
						|
    if (model_module == NULL) {
 | 
						|
        model_module = PyModule_New(MODULE_NAME ".model");
 | 
						|
        if (model_module != NULL) {
 | 
						|
            PyDict_SetItem(sys_modules, modelmod_name, model_module);
 | 
						|
            /* gives away the reference to model_module */
 | 
						|
            PyModule_AddObject(m, "model", model_module);
 | 
						|
        }
 | 
						|
    }
 | 
						|
    Py_DECREF(modelmod_name);
 | 
						|
    if (errors_module == NULL || model_module == NULL)
 | 
						|
        /* Don't core dump later! */
 | 
						|
        return NULL;
 | 
						|
 | 
						|
#if XML_COMBINED_VERSION > 19505
 | 
						|
    {
 | 
						|
        const XML_Feature *features = XML_GetFeatureList();
 | 
						|
        PyObject *list = PyList_New(0);
 | 
						|
        if (list == NULL)
 | 
						|
            /* just ignore it */
 | 
						|
            PyErr_Clear();
 | 
						|
        else {
 | 
						|
            int i = 0;
 | 
						|
            for (; features[i].feature != XML_FEATURE_END; ++i) {
 | 
						|
                int ok;
 | 
						|
                PyObject *item = Py_BuildValue("si", features[i].name,
 | 
						|
                                               features[i].value);
 | 
						|
                if (item == NULL) {
 | 
						|
                    Py_DECREF(list);
 | 
						|
                    list = NULL;
 | 
						|
                    break;
 | 
						|
                }
 | 
						|
                ok = PyList_Append(list, item);
 | 
						|
                Py_DECREF(item);
 | 
						|
                if (ok < 0) {
 | 
						|
                    PyErr_Clear();
 | 
						|
                    break;
 | 
						|
                }
 | 
						|
            }
 | 
						|
            if (list != NULL)
 | 
						|
                PyModule_AddObject(m, "features", list);
 | 
						|
        }
 | 
						|
    }
 | 
						|
#endif
 | 
						|
 | 
						|
    codes_dict = PyDict_New();
 | 
						|
    rev_codes_dict = PyDict_New();
 | 
						|
    if (codes_dict == NULL || rev_codes_dict == NULL) {
 | 
						|
        Py_XDECREF(codes_dict);
 | 
						|
        Py_XDECREF(rev_codes_dict);
 | 
						|
        return NULL;
 | 
						|
    }
 | 
						|
 | 
						|
#define MYCONST(name) \
 | 
						|
    if (PyModule_AddStringConstant(errors_module, #name,               \
 | 
						|
                                   XML_ErrorString(name)) < 0)         \
 | 
						|
        return NULL;                                                   \
 | 
						|
    tmpnum = PyLong_FromLong(name);                                    \
 | 
						|
    if (tmpnum == NULL) return NULL;                                   \
 | 
						|
    res = PyDict_SetItemString(codes_dict,                             \
 | 
						|
                               XML_ErrorString(name), tmpnum);         \
 | 
						|
    if (res < 0) return NULL;                                          \
 | 
						|
    tmpstr = PyUnicode_FromString(XML_ErrorString(name));              \
 | 
						|
    if (tmpstr == NULL) return NULL;                                   \
 | 
						|
    res = PyDict_SetItem(rev_codes_dict, tmpnum, tmpstr);              \
 | 
						|
    Py_DECREF(tmpstr);                                                 \
 | 
						|
    Py_DECREF(tmpnum);                                                 \
 | 
						|
    if (res < 0) return NULL;                                          \
 | 
						|
 | 
						|
    MYCONST(XML_ERROR_NO_MEMORY);
 | 
						|
    MYCONST(XML_ERROR_SYNTAX);
 | 
						|
    MYCONST(XML_ERROR_NO_ELEMENTS);
 | 
						|
    MYCONST(XML_ERROR_INVALID_TOKEN);
 | 
						|
    MYCONST(XML_ERROR_UNCLOSED_TOKEN);
 | 
						|
    MYCONST(XML_ERROR_PARTIAL_CHAR);
 | 
						|
    MYCONST(XML_ERROR_TAG_MISMATCH);
 | 
						|
    MYCONST(XML_ERROR_DUPLICATE_ATTRIBUTE);
 | 
						|
    MYCONST(XML_ERROR_JUNK_AFTER_DOC_ELEMENT);
 | 
						|
    MYCONST(XML_ERROR_PARAM_ENTITY_REF);
 | 
						|
    MYCONST(XML_ERROR_UNDEFINED_ENTITY);
 | 
						|
    MYCONST(XML_ERROR_RECURSIVE_ENTITY_REF);
 | 
						|
    MYCONST(XML_ERROR_ASYNC_ENTITY);
 | 
						|
    MYCONST(XML_ERROR_BAD_CHAR_REF);
 | 
						|
    MYCONST(XML_ERROR_BINARY_ENTITY_REF);
 | 
						|
    MYCONST(XML_ERROR_ATTRIBUTE_EXTERNAL_ENTITY_REF);
 | 
						|
    MYCONST(XML_ERROR_MISPLACED_XML_PI);
 | 
						|
    MYCONST(XML_ERROR_UNKNOWN_ENCODING);
 | 
						|
    MYCONST(XML_ERROR_INCORRECT_ENCODING);
 | 
						|
    MYCONST(XML_ERROR_UNCLOSED_CDATA_SECTION);
 | 
						|
    MYCONST(XML_ERROR_EXTERNAL_ENTITY_HANDLING);
 | 
						|
    MYCONST(XML_ERROR_NOT_STANDALONE);
 | 
						|
    MYCONST(XML_ERROR_UNEXPECTED_STATE);
 | 
						|
    MYCONST(XML_ERROR_ENTITY_DECLARED_IN_PE);
 | 
						|
    MYCONST(XML_ERROR_FEATURE_REQUIRES_XML_DTD);
 | 
						|
    MYCONST(XML_ERROR_CANT_CHANGE_FEATURE_ONCE_PARSING);
 | 
						|
    /* Added in Expat 1.95.7. */
 | 
						|
    MYCONST(XML_ERROR_UNBOUND_PREFIX);
 | 
						|
    /* Added in Expat 1.95.8. */
 | 
						|
    MYCONST(XML_ERROR_UNDECLARING_PREFIX);
 | 
						|
    MYCONST(XML_ERROR_INCOMPLETE_PE);
 | 
						|
    MYCONST(XML_ERROR_XML_DECL);
 | 
						|
    MYCONST(XML_ERROR_TEXT_DECL);
 | 
						|
    MYCONST(XML_ERROR_PUBLICID);
 | 
						|
    MYCONST(XML_ERROR_SUSPENDED);
 | 
						|
    MYCONST(XML_ERROR_NOT_SUSPENDED);
 | 
						|
    MYCONST(XML_ERROR_ABORTED);
 | 
						|
    MYCONST(XML_ERROR_FINISHED);
 | 
						|
    MYCONST(XML_ERROR_SUSPEND_PE);
 | 
						|
 | 
						|
    if (PyModule_AddStringConstant(errors_module, "__doc__",
 | 
						|
                                   "Constants used to describe "
 | 
						|
                                   "error conditions.") < 0)
 | 
						|
        return NULL;
 | 
						|
 | 
						|
    if (PyModule_AddObject(errors_module, "codes", codes_dict) < 0)
 | 
						|
        return NULL;
 | 
						|
    if (PyModule_AddObject(errors_module, "messages", rev_codes_dict) < 0)
 | 
						|
        return NULL;
 | 
						|
 | 
						|
#undef MYCONST
 | 
						|
 | 
						|
#define MYCONST(c) PyModule_AddIntConstant(m, #c, c)
 | 
						|
    MYCONST(XML_PARAM_ENTITY_PARSING_NEVER);
 | 
						|
    MYCONST(XML_PARAM_ENTITY_PARSING_UNLESS_STANDALONE);
 | 
						|
    MYCONST(XML_PARAM_ENTITY_PARSING_ALWAYS);
 | 
						|
#undef MYCONST
 | 
						|
 | 
						|
#define MYCONST(c) PyModule_AddIntConstant(model_module, #c, c)
 | 
						|
    PyModule_AddStringConstant(model_module, "__doc__",
 | 
						|
                     "Constants used to interpret content model information.");
 | 
						|
 | 
						|
    MYCONST(XML_CTYPE_EMPTY);
 | 
						|
    MYCONST(XML_CTYPE_ANY);
 | 
						|
    MYCONST(XML_CTYPE_MIXED);
 | 
						|
    MYCONST(XML_CTYPE_NAME);
 | 
						|
    MYCONST(XML_CTYPE_CHOICE);
 | 
						|
    MYCONST(XML_CTYPE_SEQ);
 | 
						|
 | 
						|
    MYCONST(XML_CQUANT_NONE);
 | 
						|
    MYCONST(XML_CQUANT_OPT);
 | 
						|
    MYCONST(XML_CQUANT_REP);
 | 
						|
    MYCONST(XML_CQUANT_PLUS);
 | 
						|
#undef MYCONST
 | 
						|
 | 
						|
    /* initialize pyexpat dispatch table */
 | 
						|
    capi.size = sizeof(capi);
 | 
						|
    capi.magic = PyExpat_CAPI_MAGIC;
 | 
						|
    capi.MAJOR_VERSION = XML_MAJOR_VERSION;
 | 
						|
    capi.MINOR_VERSION = XML_MINOR_VERSION;
 | 
						|
    capi.MICRO_VERSION = XML_MICRO_VERSION;
 | 
						|
    capi.ErrorString = XML_ErrorString;
 | 
						|
    capi.GetErrorCode = XML_GetErrorCode;
 | 
						|
    capi.GetErrorColumnNumber = XML_GetErrorColumnNumber;
 | 
						|
    capi.GetErrorLineNumber = XML_GetErrorLineNumber;
 | 
						|
    capi.Parse = XML_Parse;
 | 
						|
    capi.ParserCreate_MM = XML_ParserCreate_MM;
 | 
						|
    capi.ParserFree = XML_ParserFree;
 | 
						|
    capi.SetCharacterDataHandler = XML_SetCharacterDataHandler;
 | 
						|
    capi.SetCommentHandler = XML_SetCommentHandler;
 | 
						|
    capi.SetDefaultHandlerExpand = XML_SetDefaultHandlerExpand;
 | 
						|
    capi.SetElementHandler = XML_SetElementHandler;
 | 
						|
    capi.SetNamespaceDeclHandler = XML_SetNamespaceDeclHandler;
 | 
						|
    capi.SetProcessingInstructionHandler = XML_SetProcessingInstructionHandler;
 | 
						|
    capi.SetUnknownEncodingHandler = XML_SetUnknownEncodingHandler;
 | 
						|
    capi.SetUserData = XML_SetUserData;
 | 
						|
    capi.SetStartDoctypeDeclHandler = XML_SetStartDoctypeDeclHandler;
 | 
						|
    capi.SetEncoding = XML_SetEncoding;
 | 
						|
    capi.DefaultUnknownEncodingHandler = PyUnknownEncodingHandler;
 | 
						|
 | 
						|
    /* export using capsule */
 | 
						|
    capi_object = PyCapsule_New(&capi, PyExpat_CAPSULE_NAME, NULL);
 | 
						|
    if (capi_object)
 | 
						|
        PyModule_AddObject(m, "expat_CAPI", capi_object);
 | 
						|
    return m;
 | 
						|
}
 | 
						|
 | 
						|
static void
 | 
						|
clear_handlers(xmlparseobject *self, int initial)
 | 
						|
{
 | 
						|
    int i = 0;
 | 
						|
    PyObject *temp;
 | 
						|
 | 
						|
    for (; handler_info[i].name != NULL; i++) {
 | 
						|
        if (initial)
 | 
						|
            self->handlers[i] = NULL;
 | 
						|
        else {
 | 
						|
            temp = self->handlers[i];
 | 
						|
            self->handlers[i] = NULL;
 | 
						|
            Py_XDECREF(temp);
 | 
						|
            handler_info[i].setter(self->itself, NULL);
 | 
						|
        }
 | 
						|
    }
 | 
						|
}
 | 
						|
 | 
						|
static struct HandlerInfo handler_info[] = {
 | 
						|
    {"StartElementHandler",
 | 
						|
     (xmlhandlersetter)XML_SetStartElementHandler,
 | 
						|
     (xmlhandler)my_StartElementHandler},
 | 
						|
    {"EndElementHandler",
 | 
						|
     (xmlhandlersetter)XML_SetEndElementHandler,
 | 
						|
     (xmlhandler)my_EndElementHandler},
 | 
						|
    {"ProcessingInstructionHandler",
 | 
						|
     (xmlhandlersetter)XML_SetProcessingInstructionHandler,
 | 
						|
     (xmlhandler)my_ProcessingInstructionHandler},
 | 
						|
    {"CharacterDataHandler",
 | 
						|
     (xmlhandlersetter)XML_SetCharacterDataHandler,
 | 
						|
     (xmlhandler)my_CharacterDataHandler},
 | 
						|
    {"UnparsedEntityDeclHandler",
 | 
						|
     (xmlhandlersetter)XML_SetUnparsedEntityDeclHandler,
 | 
						|
     (xmlhandler)my_UnparsedEntityDeclHandler},
 | 
						|
    {"NotationDeclHandler",
 | 
						|
     (xmlhandlersetter)XML_SetNotationDeclHandler,
 | 
						|
     (xmlhandler)my_NotationDeclHandler},
 | 
						|
    {"StartNamespaceDeclHandler",
 | 
						|
     (xmlhandlersetter)XML_SetStartNamespaceDeclHandler,
 | 
						|
     (xmlhandler)my_StartNamespaceDeclHandler},
 | 
						|
    {"EndNamespaceDeclHandler",
 | 
						|
     (xmlhandlersetter)XML_SetEndNamespaceDeclHandler,
 | 
						|
     (xmlhandler)my_EndNamespaceDeclHandler},
 | 
						|
    {"CommentHandler",
 | 
						|
     (xmlhandlersetter)XML_SetCommentHandler,
 | 
						|
     (xmlhandler)my_CommentHandler},
 | 
						|
    {"StartCdataSectionHandler",
 | 
						|
     (xmlhandlersetter)XML_SetStartCdataSectionHandler,
 | 
						|
     (xmlhandler)my_StartCdataSectionHandler},
 | 
						|
    {"EndCdataSectionHandler",
 | 
						|
     (xmlhandlersetter)XML_SetEndCdataSectionHandler,
 | 
						|
     (xmlhandler)my_EndCdataSectionHandler},
 | 
						|
    {"DefaultHandler",
 | 
						|
     (xmlhandlersetter)XML_SetDefaultHandler,
 | 
						|
     (xmlhandler)my_DefaultHandler},
 | 
						|
    {"DefaultHandlerExpand",
 | 
						|
     (xmlhandlersetter)XML_SetDefaultHandlerExpand,
 | 
						|
     (xmlhandler)my_DefaultHandlerExpandHandler},
 | 
						|
    {"NotStandaloneHandler",
 | 
						|
     (xmlhandlersetter)XML_SetNotStandaloneHandler,
 | 
						|
     (xmlhandler)my_NotStandaloneHandler},
 | 
						|
    {"ExternalEntityRefHandler",
 | 
						|
     (xmlhandlersetter)XML_SetExternalEntityRefHandler,
 | 
						|
     (xmlhandler)my_ExternalEntityRefHandler},
 | 
						|
    {"StartDoctypeDeclHandler",
 | 
						|
     (xmlhandlersetter)XML_SetStartDoctypeDeclHandler,
 | 
						|
     (xmlhandler)my_StartDoctypeDeclHandler},
 | 
						|
    {"EndDoctypeDeclHandler",
 | 
						|
     (xmlhandlersetter)XML_SetEndDoctypeDeclHandler,
 | 
						|
     (xmlhandler)my_EndDoctypeDeclHandler},
 | 
						|
    {"EntityDeclHandler",
 | 
						|
     (xmlhandlersetter)XML_SetEntityDeclHandler,
 | 
						|
     (xmlhandler)my_EntityDeclHandler},
 | 
						|
    {"XmlDeclHandler",
 | 
						|
     (xmlhandlersetter)XML_SetXmlDeclHandler,
 | 
						|
     (xmlhandler)my_XmlDeclHandler},
 | 
						|
    {"ElementDeclHandler",
 | 
						|
     (xmlhandlersetter)XML_SetElementDeclHandler,
 | 
						|
     (xmlhandler)my_ElementDeclHandler},
 | 
						|
    {"AttlistDeclHandler",
 | 
						|
     (xmlhandlersetter)XML_SetAttlistDeclHandler,
 | 
						|
     (xmlhandler)my_AttlistDeclHandler},
 | 
						|
#if XML_COMBINED_VERSION >= 19504
 | 
						|
    {"SkippedEntityHandler",
 | 
						|
     (xmlhandlersetter)XML_SetSkippedEntityHandler,
 | 
						|
     (xmlhandler)my_SkippedEntityHandler},
 | 
						|
#endif
 | 
						|
 | 
						|
    {NULL, NULL, NULL} /* sentinel */
 | 
						|
};
 | 
						|
 | 
						|
/*[clinic input]
 | 
						|
dump buffer
 | 
						|
[clinic start generated code]*/
 | 
						|
/*[clinic end generated code: output=da39a3ee5e6b4b0d input=524ce2e021e4eba6]*/
 |