summaryrefslogtreecommitdiffstats
blob: 158958bab789a8c06cdeb42a7352c41ebfb40071 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
/*
 * Copyright (c) 2010-2019 Isode Limited.
 * All rights reserved.
 * See the COPYING file for more information.
 */

#include <Swiften/Parser/LibXMLParser.h>

#include <cassert>
#include <cstring>
#include <limits>
#include <memory>
#include <string>

#include <libxml/parser.h>

#include <Swiften/Base/Log.h>
#include <Swiften/Parser/XMLParserClient.h>

namespace {
/**
 * Copies a NUL-terminated byte string (such as the xmlChar strings handed
 * to the SAX callbacks in this file) into a std::string.
 *
 * @param s Pointer to the first byte, or nullptr.
 * @return The copied text; an empty string when s is nullptr.
 */
std::string asString(const unsigned char* s) {
    if (s == nullptr) {
        return std::string();
    }
    const char* text = reinterpret_cast<const char*>(s);
    return std::string(text);
}
}

namespace Swift {

/**
 * Implementation state hidden from the header: the SAX callback table and
 * the push-parser context that is created from it.
 */
struct LibXMLParser::Private {
    // Callback table; the constructor zeroes it and fills in the handlers.
    xmlSAXHandler handler_{};
    // Push-parser context; released in the destructor when non-null.
    xmlParserCtxtPtr context_{nullptr};
};

static void handleStartElement(void* parser, const xmlChar* name, const xmlChar* prefix, const xmlChar* xmlns, int nbNamespaces, const xmlChar** namespaces, int nbAttributes, int nbDefaulted, const xmlChar ** attributes) {
    AttributeMap attributeValues;
    if (nbDefaulted != 0) {
        // Just because i don't understand what this means yet :-)
        SWIFT_LOG(error) << "Unexpected nbDefaulted on XML element" << std::endl;
    }
    for (int i = 0; i < nbAttributes*5; i += 5) {
        std::string attributeName = asString(attributes[i]);
        std::string attributePrefix = asString(attributes[i+1]);
        std::string attributeNS = asString(attributes[i+2]);
        assert(attributes[i+4] >= attributes[i+3]);
        attributeValues.addAttribute(
                attributeName,
                attributeNS,
                attributePrefix,
                std::string(reinterpret_cast<const char*>(attributes[i+3]),
                    static_cast<size_t>(attributes[i+4]-attributes[i+3])));
    }
    auto* client = static_cast<XMLParser*>(parser)->getClient();
    for (auto i = 0; i < nbNamespaces * 2; i += 2) {
        const auto prefix = asString(namespaces[i]);
        const auto uri = asString(namespaces[i + 1]);
        client->handleNamespaceDeclaration(prefix, uri);
    }
    auto nameStr = asString(name);
    auto xmlsnsStr = asString(xmlns);
    auto prefixStr = asString(prefix);
    client->handleStartElementPrefix(prefixStr, xmlsnsStr, nameStr, attributeValues);
    client->handleStartElement(nameStr, xmlsnsStr, attributeValues);
}

static void handleEndElement(void *parser, const xmlChar* name, const xmlChar*, const xmlChar* xmlns) {
    static_cast<XMLParser*>(parser)->getClient()->handleEndElement(asString(name), asString(xmlns));
}

static void handleCharacterData(void* parser, const xmlChar* data, int len) {
    assert(len >= 0);
    static_cast<XMLParser*>(parser)->getClient()->handleCharacterData(std::string(reinterpret_cast<const char*>(data), static_cast<size_t>(len)));
}

static void handleComment(void* parser, const xmlChar* /*data*/) {
    if (!static_cast<LibXMLParser*>(parser)->allowsComments()) {
        static_cast<LibXMLParser*>(parser)->stopParser();
    }
}

/**
 * SAX entity-declaration callback: any entity declaration stops the parser.
 * All details of the declaration are ignored.
 */
static void handleEntityDeclaration(void * parser, const xmlChar* /*name*/, int /*type*/, const xmlChar* /*publicId*/, const xmlChar* /*systemId*/, xmlChar* /*content*/) {
    auto* self = static_cast<LibXMLParser*>(parser);
    self->stopParser();
}

/**
 * SAX processing-instruction callback: any processing instruction stops the
 * parser. Its target and data are ignored.
 */
static void handleProcessingInstruction(void* parser, const xmlChar* /*target*/, const xmlChar* /*data*/) {
    auto* self = static_cast<LibXMLParser*>(parser);
    self->stopParser();
}

/**
 * SAX external-subset callback: a document that declares an external subset
 * stops the parser. The identifiers of the subset are ignored.
 */
static void handleExternalSubset(void* parser, const xmlChar * /*name*/, const xmlChar * /*ExternalID*/, const xmlChar * /*SystemID*/) {
    auto* self = static_cast<LibXMLParser*>(parser);
    self->stopParser();
}

/**
 * SAX error callback installed on the handler table. It deliberately does
 * nothing, so error messages are not printed.
 */
static void handleError(void* /*parser*/, const char* /*m*/, ... ) {
    // Debugging aid, disabled on purpose. To print the messages, name the
    // format parameter `m` and enable:
    //     va_list args;
    //     va_start(args, m);
    //     vfprintf(stdout, m, args);
    //     va_end(args);
}

/**
 * SAX warning callback installed on the handler table. It deliberately does
 * nothing, so warning messages are discarded.
 */
static void handleWarning(void* /*parser*/, const char* /*message*/, ... ) {
    // Intentionally empty.
}

/**
 * Generic error function registered globally via xmlSetGenericErrorFunc in
 * the constructor. It deliberately does nothing.
 */
static void handleGenericError(void* /*context*/, const char* /*message*/, ... ) {
    // Intentionally empty.
}

static void handleStructuredError(void*, xmlErrorPtr) {
}

// Set once the process-wide libxml2 setup in the constructor has run.
bool LibXMLParser::initialized = false;

/**
 * Creates a push parser that reports parse events to the given client.
 *
 * The first construction also performs the global libxml2 setup and installs
 * silent global error handlers. Each instance then fills in its own SAX
 * callback table and creates a push-parser context with this object as the
 * callbacks' user data.
 *
 * @param client        Receiver of the parse events; forwarded to XMLParser.
 * @param allowComments Whether comments are tolerated; forwarded to XMLParser.
 */
LibXMLParser::LibXMLParser(XMLParserClient* client, bool allowComments) : XMLParser(client, allowComments), p(new Private()) {
    // Initialize libXML for multithreaded applications
    // NOTE(review): the flag is a plain bool with no synchronization, so this
    // presumably relies on the first parser being constructed before any
    // other thread creates one -- confirm.
    if (!initialized) {
        xmlInitParser();
        xmlSetGenericErrorFunc(nullptr, handleGenericError);
        xmlSetStructuredErrorFunc(nullptr, handleStructuredError);
        initialized = true;
    }

    // Start from an all-zero table so every callback not set below stays null.
    memset(&p->handler_, 0, sizeof(p->handler_) );
    p->handler_.initialized = XML_SAX2_MAGIC;
    p->handler_.startElementNs = &handleStartElement;
    p->handler_.endElementNs = &handleEndElement;
    p->handler_.characters = &handleCharacterData;
    p->handler_.warning = &handleWarning;
    p->handler_.error = &handleError;
    p->handler_.comment = &handleComment;
    p->handler_.entityDecl = &handleEntityDeclaration;
    p->handler_.processingInstruction = &handleProcessingInstruction;
    p->handler_.externalSubset = &handleExternalSubset;

    p->context_ = xmlCreatePushParserCtxt(&p->handler_, this, nullptr, 0, nullptr);
    // Check that creation succeeded before the context is used; the guard
    // keeps release builds (where assert is compiled out) from passing a null
    // context on.
    assert(p->context_);
    if (p->context_) {
        xmlCtxtUseOptions(p->context_, XML_PARSE_NOENT);
    }
}

/**
 * Releases the push-parser context, if one was created.
 */
LibXMLParser::~LibXMLParser() {
    if (p->context_ == nullptr) {
        return;
    }
    xmlFreeParserCtxt(p->context_);
}

/**
 * Feeds one chunk of XML to the push parser.
 *
 * @param data      The bytes to parse; rejected when longer than INT_MAX,
 *                  because the chunk length is passed to libxml2 as an int.
 * @param finalData Passed to xmlParseChunk as its "terminate" argument.
 * @return true when the chunk parsed without error, or when the only problem
 *         was a namespace-URI warning (which is cleared); false when the
 *         chunk is too large, the parser was stopped via stopParser(), or any
 *         other error occurred.
 */
bool LibXMLParser::parse(const std::string& data, bool finalData) {
    const auto maxChunkSize = static_cast<std::string::size_type>(std::numeric_limits<int>::max());
    if (data.size() > maxChunkSize) {
        return false;
    }

    const auto result = xmlParseChunk(p->context_, data.c_str(), static_cast<int>(data.size()), finalData);
    if (result == XML_ERR_OK) {
        return true;
    }
    // A deliberate stop is always a failure, whatever code was reported.
    if (stopped_) {
        return false;
    }

    const bool namespaceUriWarning = (result == XML_WAR_NS_URI) || (result == XML_WAR_NS_URI_RELATIVE);
    if (!namespaceUriWarning) {
        return false;
    }
    // Namespace-URI warnings are tolerated: clear them so that later chunks
    // are not affected by the recorded error state.
    xmlCtxtResetLastError(p->context_);
    p->context_->errNo = XML_ERR_OK;
    return true;
}

void LibXMLParser::stopParser() {
    stopped_ = true;
    xmlStopParser(p->context_);
}

}