| [d2596b] | 1 | /**
 | 
|---|
 | 2 |  * pugixml parser - version 1.0
 | 
|---|
 | 3 |  * --------------------------------------------------------
 | 
|---|
 | 4 |  * Copyright (C) 2006-2010, by Arseny Kapoulkine (arseny.kapoulkine@gmail.com)
 | 
|---|
 | 5 |  * Report bugs and download new versions at http://pugixml.org/
 | 
|---|
 | 6 |  *
 | 
|---|
 | 7 |  * This library is distributed under the MIT License. See notice at the end
 | 
|---|
 | 8 |  * of this file.
 | 
|---|
 | 9 |  *
 | 
|---|
 | 10 |  * This work is based on the pugxml parser, which is:
 | 
|---|
 | 11 |  * Copyright (C) 2003, by Kristen Wegner (kristen@tima.net)
 | 
|---|
 | 12 |  */
 | 
|---|
 | 13 | 
 | 
|---|
 | 14 | #include "pugixml.hpp"
 | 
|---|
 | 15 | 
 | 
|---|
 | 16 | #include <stdlib.h>
 | 
|---|
 | 17 | #include <stdio.h>
 | 
|---|
 | 18 | #include <string.h>
 | 
|---|
 | 19 | #include <assert.h>
 | 
|---|
 | 20 | #include <setjmp.h>
 | 
|---|
 | 21 | #include <wchar.h>
 | 
|---|
 | 22 | 
 | 
|---|
 | 23 | #ifndef PUGIXML_NO_XPATH
 | 
|---|
 | 24 | #       include <math.h>
 | 
|---|
 | 25 | #       include <float.h>
 | 
|---|
 | 26 | #endif
 | 
|---|
 | 27 | 
 | 
|---|
 | 28 | #ifndef PUGIXML_NO_STL
 | 
|---|
 | 29 | #       include <istream>
 | 
|---|
 | 30 | #       include <ostream>
 | 
|---|
 | 31 | #       include <string>
 | 
|---|
 | 32 | #endif
 | 
|---|
 | 33 | 
 | 
|---|
 | 34 | // For placement new
 | 
|---|
 | 35 | #include <new>
 | 
|---|
 | 36 | 
 | 
|---|
 | 37 | #ifdef _MSC_VER
 | 
|---|
 | 38 | #       pragma warning(disable: 4127) // conditional expression is constant
 | 
|---|
 | 39 | #       pragma warning(disable: 4324) // structure was padded due to __declspec(align())
 | 
|---|
 | 40 | #       pragma warning(disable: 4611) // interaction between '_setjmp' and C++ object destruction is non-portable
 | 
|---|
 | 41 | #       pragma warning(disable: 4702) // unreachable code
 | 
|---|
 | 42 | #       pragma warning(disable: 4996) // this function or variable may be unsafe
 | 
|---|
 | 43 | #endif
 | 
|---|
 | 44 | 
 | 
|---|
 | 45 | #ifdef __INTEL_COMPILER
 | 
|---|
 | 46 | #       pragma warning(disable: 177) // function was declared but never referenced 
 | 
|---|
 | 47 | #       pragma warning(disable: 279) // controlling expression is constant
 | 
|---|
 | 48 | #       pragma warning(disable: 1478 1786) // function was declared "deprecated"
 | 
|---|
 | 49 | #endif
 | 
|---|
 | 50 | 
 | 
|---|
 | 51 | #ifdef __BORLANDC__
 | 
|---|
 | 52 | #       pragma warn -8008 // condition is always false
 | 
|---|
 | 53 | #       pragma warn -8066 // unreachable code
 | 
|---|
 | 54 | #endif
 | 
|---|
 | 55 | 
 | 
|---|
 | 56 | #ifdef __SNC__
 | 
|---|
 | 57 | #       pragma diag_suppress=178 // function was declared but never referenced
 | 
|---|
 | 58 | #       pragma diag_suppress=237 // controlling expression is constant
 | 
|---|
 | 59 | #endif
 | 
|---|
 | 60 | 
 | 
|---|
 | 61 | // uintptr_t
 | 
|---|
 | 62 | #if !defined(_MSC_VER) || _MSC_VER >= 1600
 | 
|---|
 | 63 | #       include <stdint.h>
 | 
|---|
 | 64 | #else
 | 
|---|
 | 65 | #       if _MSC_VER < 1300
 | 
|---|
 | 66 | // No native uintptr_t in MSVC6
 | 
|---|
 | 67 | typedef size_t uintptr_t;
 | 
|---|
 | 68 | #       endif
 | 
|---|
 | 69 | typedef unsigned __int8 uint8_t;
 | 
|---|
 | 70 | typedef unsigned __int16 uint16_t;
 | 
|---|
 | 71 | typedef unsigned __int32 uint32_t;
 | 
|---|
 | 72 | typedef __int32 int32_t;
 | 
|---|
 | 73 | #endif
 | 
|---|
 | 74 | 
 | 
|---|
 | 75 | // Inlining controls
 | 
|---|
 | 76 | #if defined(_MSC_VER) && _MSC_VER >= 1300
 | 
|---|
 | 77 | #       define PUGIXML_NO_INLINE __declspec(noinline)
 | 
|---|
 | 78 | #elif defined(__GNUC__)
 | 
|---|
 | 79 | #       define PUGIXML_NO_INLINE __attribute__((noinline))
 | 
|---|
 | 80 | #else
 | 
|---|
 | 81 | #       define PUGIXML_NO_INLINE 
 | 
|---|
 | 82 | #endif
 | 
|---|
 | 83 | 
 | 
|---|
 | 84 | // Simple static assertion
 | 
|---|
 | 85 | #define STATIC_ASSERT(cond) { static const char condition_failed[(cond) ? 1 : -1] = {0}; (void)condition_failed[0]; }
 | 
|---|
 | 86 | 
 | 
|---|
 | 87 | // Digital Mars C++ bug workaround for passing char loaded from memory via stack
 | 
|---|
 | 88 | #ifdef __DMC__
 | 
|---|
 | 89 | #       define DMC_VOLATILE volatile
 | 
|---|
 | 90 | #else
 | 
|---|
 | 91 | #       define DMC_VOLATILE
 | 
|---|
 | 92 | #endif
 | 
|---|
 | 93 | 
 | 
|---|
 | 94 | using namespace pugi;
 | 
|---|
 | 95 | 
 | 
|---|
 | 96 | // Memory allocation
 | 
|---|
 | 97 | namespace
 | 
|---|
 | 98 | {
 | 
|---|
 | 99 |         void* default_allocate(size_t size)
 | 
|---|
 | 100 |         {
 | 
|---|
 | 101 |                 return malloc(size);
 | 
|---|
 | 102 |         }
 | 
|---|
 | 103 | 
 | 
|---|
 | 104 |         void default_deallocate(void* ptr)
 | 
|---|
 | 105 |         {
 | 
|---|
 | 106 |                 free(ptr);
 | 
|---|
 | 107 |         }
 | 
|---|
 | 108 | 
 | 
|---|
 | 109 |         allocation_function global_allocate = default_allocate;
 | 
|---|
 | 110 |         deallocation_function global_deallocate = default_deallocate;
 | 
|---|
 | 111 | }
 | 
|---|
 | 112 | 
 | 
|---|
 | 113 | // String utilities
 | 
|---|
 | 114 | namespace
 | 
|---|
 | 115 | {
 | 
|---|
 | 116 |         // Get string length
 | 
|---|
 | 117 |         size_t strlength(const char_t* s)
 | 
|---|
 | 118 |         {
 | 
|---|
 | 119 |                 assert(s);
 | 
|---|
 | 120 | 
 | 
|---|
 | 121 |         #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 122 |                 return wcslen(s);
 | 
|---|
 | 123 |         #else
 | 
|---|
 | 124 |                 return strlen(s);
 | 
|---|
 | 125 |         #endif
 | 
|---|
 | 126 |         }
 | 
|---|
 | 127 | 
 | 
|---|
 | 128 |         // Compare two strings
 | 
|---|
 | 129 |         bool strequal(const char_t* src, const char_t* dst)
 | 
|---|
 | 130 |         {
 | 
|---|
 | 131 |                 assert(src && dst);
 | 
|---|
 | 132 | 
 | 
|---|
 | 133 |         #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 134 |                 return wcscmp(src, dst) == 0;
 | 
|---|
 | 135 |         #else
 | 
|---|
 | 136 |                 return strcmp(src, dst) == 0;
 | 
|---|
 | 137 |         #endif
 | 
|---|
 | 138 |         }
 | 
|---|
 | 139 | 
 | 
|---|
 | 140 |         // Compare lhs with [rhs_begin, rhs_end)
 | 
|---|
 | 141 |         bool strequalrange(const char_t* lhs, const char_t* rhs, size_t count)
 | 
|---|
 | 142 |         {
 | 
|---|
 | 143 |                 for (size_t i = 0; i < count; ++i)
 | 
|---|
 | 144 |                         if (lhs[i] != rhs[i])
 | 
|---|
 | 145 |                                 return false;
 | 
|---|
 | 146 |         
 | 
|---|
 | 147 |                 return lhs[count] == 0;
 | 
|---|
 | 148 |         }
 | 
|---|
 | 149 |         
 | 
|---|
 | 150 | #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 151 |         // Convert string to wide string, assuming all symbols are ASCII
 | 
|---|
 | 152 |         void widen_ascii(wchar_t* dest, const char* source)
 | 
|---|
 | 153 |         {
 | 
|---|
 | 154 |                 for (const char* i = source; *i; ++i) *dest++ = *i;
 | 
|---|
 | 155 |                 *dest = 0;
 | 
|---|
 | 156 |         }
 | 
|---|
 | 157 | #endif
 | 
|---|
 | 158 | }
 | 
|---|
 | 159 | 
 | 
|---|
 | 160 | #if !defined(PUGIXML_NO_STL) || !defined(PUGIXML_NO_XPATH)
 | 
|---|
 | 161 | // auto_ptr-like buffer holder for exception recovery
 | 
|---|
 | 162 | namespace
 | 
|---|
 | 163 | {
 | 
|---|
 | 164 |         struct buffer_holder
 | 
|---|
 | 165 |         {
 | 
|---|
 | 166 |                 void* data;
 | 
|---|
 | 167 |                 void (*deleter)(void*);
 | 
|---|
 | 168 | 
 | 
|---|
 | 169 |                 buffer_holder(void* data, void (*deleter)(void*)): data(data), deleter(deleter)
 | 
|---|
 | 170 |                 {
 | 
|---|
 | 171 |                 }
 | 
|---|
 | 172 | 
 | 
|---|
 | 173 |                 ~buffer_holder()
 | 
|---|
 | 174 |                 {
 | 
|---|
 | 175 |                         if (data) deleter(data);
 | 
|---|
 | 176 |                 }
 | 
|---|
 | 177 | 
 | 
|---|
 | 178 |                 void* release()
 | 
|---|
 | 179 |                 {
 | 
|---|
 | 180 |                         void* result = data;
 | 
|---|
 | 181 |                         data = 0;
 | 
|---|
 | 182 |                         return result;
 | 
|---|
 | 183 |                 }
 | 
|---|
 | 184 |         };
 | 
|---|
 | 185 | }
 | 
|---|
 | 186 | #endif
 | 
|---|
 | 187 | 
 | 
|---|
 | 188 | namespace
 | 
|---|
 | 189 | {
 | 
|---|
 | 190 |         static const size_t xml_memory_page_size = 32768;
 | 
|---|
 | 191 | 
 | 
|---|
 | 192 |         static const uintptr_t xml_memory_page_alignment = 32;
 | 
|---|
 | 193 |         static const uintptr_t xml_memory_page_pointer_mask = ~(xml_memory_page_alignment - 1);
 | 
|---|
 | 194 |         static const uintptr_t xml_memory_page_name_allocated_mask = 16;
 | 
|---|
 | 195 |         static const uintptr_t xml_memory_page_value_allocated_mask = 8;
 | 
|---|
 | 196 |         static const uintptr_t xml_memory_page_type_mask = 7;
 | 
|---|
 | 197 | 
 | 
|---|
 | 198 |         struct xml_allocator;
 | 
|---|
 | 199 | 
 | 
|---|
 | 200 |         struct xml_memory_page
 | 
|---|
 | 201 |         {
 | 
|---|
 | 202 |                 static xml_memory_page* construct(void* memory)
 | 
|---|
 | 203 |                 {
 | 
|---|
 | 204 |                         if (!memory) return 0; //$ redundant, left for performance
 | 
|---|
 | 205 | 
 | 
|---|
 | 206 |                         xml_memory_page* result = static_cast<xml_memory_page*>(memory);
 | 
|---|
 | 207 | 
 | 
|---|
 | 208 |                         result->allocator = 0;
 | 
|---|
 | 209 |                         result->memory = 0;
 | 
|---|
 | 210 |                         result->prev = 0;
 | 
|---|
 | 211 |                         result->next = 0;
 | 
|---|
 | 212 |                         result->busy_size = 0;
 | 
|---|
 | 213 |                         result->freed_size = 0;
 | 
|---|
 | 214 | 
 | 
|---|
 | 215 |                         return result;
 | 
|---|
 | 216 |                 }
 | 
|---|
 | 217 | 
 | 
|---|
 | 218 |                 xml_allocator* allocator;
 | 
|---|
 | 219 | 
 | 
|---|
 | 220 |                 void* memory;
 | 
|---|
 | 221 | 
 | 
|---|
 | 222 |                 xml_memory_page* prev;
 | 
|---|
 | 223 |                 xml_memory_page* next;
 | 
|---|
 | 224 | 
 | 
|---|
 | 225 |                 size_t busy_size;
 | 
|---|
 | 226 |                 size_t freed_size;
 | 
|---|
 | 227 | 
 | 
|---|
 | 228 |                 char data[1];
 | 
|---|
 | 229 |         };
 | 
|---|
 | 230 | 
 | 
|---|
 | 231 |         struct xml_memory_string_header
 | 
|---|
 | 232 |         {
 | 
|---|
 | 233 |                 uint16_t page_offset; // offset from page->data
 | 
|---|
 | 234 |                 uint16_t full_size; // 0 if string occupies whole page
 | 
|---|
 | 235 |         };
 | 
|---|
 | 236 | 
 | 
|---|
 | 237 |         struct xml_allocator
 | 
|---|
 | 238 |         {
 | 
|---|
 | 239 |                 xml_allocator(xml_memory_page* root): _root(root), _busy_size(root->busy_size)
 | 
|---|
 | 240 |                 {
 | 
|---|
 | 241 |                 }
 | 
|---|
 | 242 | 
 | 
|---|
 | 243 |                 xml_memory_page* allocate_page(size_t data_size)
 | 
|---|
 | 244 |                 {
 | 
|---|
 | 245 |                         size_t size = offsetof(xml_memory_page, data) + data_size;
 | 
|---|
 | 246 | 
 | 
|---|
 | 247 |                         // allocate block with some alignment, leaving memory for worst-case padding
 | 
|---|
 | 248 |                         void* memory = global_allocate(size + xml_memory_page_alignment);
 | 
|---|
 | 249 |                         if (!memory) return 0;
 | 
|---|
 | 250 | 
 | 
|---|
 | 251 |                         // align upwards to page boundary
 | 
|---|
 | 252 |                         void* page_memory = reinterpret_cast<void*>((reinterpret_cast<uintptr_t>(memory) + (xml_memory_page_alignment - 1)) & ~(xml_memory_page_alignment - 1));
 | 
|---|
 | 253 | 
 | 
|---|
 | 254 |                         // prepare page structure
 | 
|---|
 | 255 |                         xml_memory_page* page = xml_memory_page::construct(page_memory);
 | 
|---|
 | 256 | 
 | 
|---|
 | 257 |                         page->memory = memory;
 | 
|---|
 | 258 |                         page->allocator = _root->allocator;
 | 
|---|
 | 259 | 
 | 
|---|
 | 260 |                         return page;
 | 
|---|
 | 261 |                 }
 | 
|---|
 | 262 | 
 | 
|---|
 | 263 |                 static void deallocate_page(xml_memory_page* page)
 | 
|---|
 | 264 |                 {
 | 
|---|
 | 265 |                         global_deallocate(page->memory);
 | 
|---|
 | 266 |                 }
 | 
|---|
 | 267 | 
 | 
|---|
 | 268 |                 void* allocate_memory_oob(size_t size, xml_memory_page*& out_page);
 | 
|---|
 | 269 | 
 | 
|---|
 | 270 |                 void* allocate_memory(size_t size, xml_memory_page*& out_page)
 | 
|---|
 | 271 |                 {
 | 
|---|
 | 272 |                         if (_busy_size + size > xml_memory_page_size) return allocate_memory_oob(size, out_page);
 | 
|---|
 | 273 | 
 | 
|---|
 | 274 |                         void* buf = _root->data + _busy_size;
 | 
|---|
 | 275 | 
 | 
|---|
 | 276 |                         _busy_size += size;
 | 
|---|
 | 277 | 
 | 
|---|
 | 278 |                         out_page = _root;
 | 
|---|
 | 279 | 
 | 
|---|
 | 280 |                         return buf;
 | 
|---|
 | 281 |                 }
 | 
|---|
 | 282 | 
 | 
|---|
 | 283 |                 void deallocate_memory(void* ptr, size_t size, xml_memory_page* page)
 | 
|---|
 | 284 |                 {
 | 
|---|
 | 285 |                         if (page == _root) page->busy_size = _busy_size;
 | 
|---|
 | 286 | 
 | 
|---|
 | 287 |                         assert(ptr >= page->data && ptr < page->data + page->busy_size);
 | 
|---|
 | 288 |                         (void)!ptr;
 | 
|---|
 | 289 | 
 | 
|---|
 | 290 |                         page->freed_size += size;
 | 
|---|
 | 291 |                         assert(page->freed_size <= page->busy_size);
 | 
|---|
 | 292 | 
 | 
|---|
 | 293 |                         if (page->freed_size == page->busy_size)
 | 
|---|
 | 294 |                         {
 | 
|---|
 | 295 |                                 if (page->next == 0)
 | 
|---|
 | 296 |                                 {
 | 
|---|
 | 297 |                                         assert(_root == page);
 | 
|---|
 | 298 | 
 | 
|---|
 | 299 |                                         // top page freed, just reset sizes
 | 
|---|
 | 300 |                                         page->busy_size = page->freed_size = 0;
 | 
|---|
 | 301 |                                         _busy_size = 0;
 | 
|---|
 | 302 |                                 }
 | 
|---|
 | 303 |                                 else
 | 
|---|
 | 304 |                                 {
 | 
|---|
 | 305 |                                         assert(_root != page);
 | 
|---|
 | 306 |                                         assert(page->prev);
 | 
|---|
 | 307 | 
 | 
|---|
 | 308 |                                         // remove from the list
 | 
|---|
 | 309 |                                         page->prev->next = page->next;
 | 
|---|
 | 310 |                                         page->next->prev = page->prev;
 | 
|---|
 | 311 | 
 | 
|---|
 | 312 |                                         // deallocate
 | 
|---|
 | 313 |                                         deallocate_page(page);
 | 
|---|
 | 314 |                                 }
 | 
|---|
 | 315 |                         }
 | 
|---|
 | 316 |                 }
 | 
|---|
 | 317 | 
 | 
|---|
 | 318 |                 char_t* allocate_string(size_t length)
 | 
|---|
 | 319 |                 {
 | 
|---|
 | 320 |                         // allocate memory for string and header block
 | 
|---|
 | 321 |                         size_t size = sizeof(xml_memory_string_header) + length * sizeof(char_t);
 | 
|---|
 | 322 |                         
 | 
|---|
 | 323 |                         // round size up to pointer alignment boundary
 | 
|---|
 | 324 |                         size_t full_size = (size + (sizeof(void*) - 1)) & ~(sizeof(void*) - 1);
 | 
|---|
 | 325 | 
 | 
|---|
 | 326 |                         xml_memory_page* page;
 | 
|---|
 | 327 |                         xml_memory_string_header* header = static_cast<xml_memory_string_header*>(allocate_memory(full_size, page));
 | 
|---|
 | 328 | 
 | 
|---|
 | 329 |                         if (!header) return 0;
 | 
|---|
 | 330 | 
 | 
|---|
 | 331 |                         // setup header
 | 
|---|
 | 332 |                         ptrdiff_t page_offset = reinterpret_cast<char*>(header) - page->data;
 | 
|---|
 | 333 | 
 | 
|---|
 | 334 |                         assert(page_offset >= 0 && page_offset < (1 << 16));
 | 
|---|
 | 335 |                         header->page_offset = static_cast<uint16_t>(page_offset);
 | 
|---|
 | 336 | 
 | 
|---|
 | 337 |                         // full_size == 0 for large strings that occupy the whole page
 | 
|---|
 | 338 |                         assert(full_size < (1 << 16) || (page->busy_size == full_size && page_offset == 0));
 | 
|---|
 | 339 |                         header->full_size = static_cast<uint16_t>(full_size < (1 << 16) ? full_size : 0);
 | 
|---|
 | 340 | 
 | 
|---|
 | 341 |                         return reinterpret_cast<char_t*>(header + 1);
 | 
|---|
 | 342 |                 }
 | 
|---|
 | 343 | 
 | 
|---|
 | 344 |                 void deallocate_string(char_t* string)
 | 
|---|
 | 345 |                 {
 | 
|---|
 | 346 |                         // get header
 | 
|---|
 | 347 |                         xml_memory_string_header* header = reinterpret_cast<xml_memory_string_header*>(string) - 1;
 | 
|---|
 | 348 | 
 | 
|---|
 | 349 |                         // deallocate
 | 
|---|
 | 350 |                         size_t page_offset = offsetof(xml_memory_page, data) + header->page_offset;
 | 
|---|
 | 351 |                         xml_memory_page* page = reinterpret_cast<xml_memory_page*>(reinterpret_cast<char*>(header) - page_offset);
 | 
|---|
 | 352 | 
 | 
|---|
 | 353 |                         // if full_size == 0 then this string occupies the whole page
 | 
|---|
 | 354 |                         size_t full_size = header->full_size == 0 ? page->busy_size : header->full_size;
 | 
|---|
 | 355 | 
 | 
|---|
 | 356 |                         deallocate_memory(header, full_size, page);
 | 
|---|
 | 357 |                 }
 | 
|---|
 | 358 | 
 | 
|---|
 | 359 |                 xml_memory_page* _root;
 | 
|---|
 | 360 |                 size_t _busy_size;
 | 
|---|
 | 361 |         };
 | 
|---|
 | 362 | 
 | 
|---|
 | 363 |         PUGIXML_NO_INLINE void* xml_allocator::allocate_memory_oob(size_t size, xml_memory_page*& out_page)
 | 
|---|
 | 364 |         {
 | 
|---|
 | 365 |                 const size_t large_allocation_threshold = xml_memory_page_size / 4;
 | 
|---|
 | 366 | 
 | 
|---|
 | 367 |                 xml_memory_page* page = allocate_page(size <= large_allocation_threshold ? xml_memory_page_size : size);
 | 
|---|
 | 368 |                 if (!page) return 0;
 | 
|---|
 | 369 | 
 | 
|---|
 | 370 |                 if (size <= large_allocation_threshold)
 | 
|---|
 | 371 |                 {
 | 
|---|
 | 372 |                         _root->busy_size = _busy_size;
 | 
|---|
 | 373 | 
 | 
|---|
 | 374 |                         // insert page at the end of linked list
 | 
|---|
 | 375 |                         page->prev = _root;
 | 
|---|
 | 376 |                         _root->next = page;
 | 
|---|
 | 377 |                         _root = page;
 | 
|---|
 | 378 | 
 | 
|---|
 | 379 |                         _busy_size = size;
 | 
|---|
 | 380 |                 }
 | 
|---|
 | 381 |                 else
 | 
|---|
 | 382 |                 {
 | 
|---|
 | 383 |                         // insert page before the end of linked list, so that it is deleted as soon as possible
 | 
|---|
 | 384 |                         // the last page is not deleted even if it's empty (see deallocate_memory)
 | 
|---|
 | 385 |                         assert(_root->prev);
 | 
|---|
 | 386 | 
 | 
|---|
 | 387 |                         page->prev = _root->prev;
 | 
|---|
 | 388 |                         page->next = _root;
 | 
|---|
 | 389 | 
 | 
|---|
 | 390 |                         _root->prev->next = page;
 | 
|---|
 | 391 |                         _root->prev = page;
 | 
|---|
 | 392 |                 }
 | 
|---|
 | 393 | 
 | 
|---|
 | 394 |                 // allocate inside page
 | 
|---|
 | 395 |                 page->busy_size = size;
 | 
|---|
 | 396 | 
 | 
|---|
 | 397 |                 out_page = page;
 | 
|---|
 | 398 |                 return page->data;
 | 
|---|
 | 399 |         }
 | 
|---|
 | 400 | }
 | 
|---|
 | 401 | 
 | 
|---|
 | 402 | namespace pugi
 | 
|---|
 | 403 | {
 | 
|---|
 | 404 |         /// A 'name=value' XML attribute structure.
 | 
|---|
 | 405 |         struct xml_attribute_struct
 | 
|---|
 | 406 |         {
 | 
|---|
 | 407 |                 /// Default ctor
 | 
|---|
 | 408 |                 xml_attribute_struct(xml_memory_page* page): header(reinterpret_cast<uintptr_t>(page)), name(0), value(0), prev_attribute_c(0), next_attribute(0)
 | 
|---|
 | 409 |                 {
 | 
|---|
 | 410 |                 }
 | 
|---|
 | 411 | 
 | 
|---|
 | 412 |                 uintptr_t header;
 | 
|---|
 | 413 | 
 | 
|---|
 | 414 |                 char_t* name;   ///< Pointer to attribute name.
 | 
|---|
 | 415 |                 char_t* value;  ///< Pointer to attribute value.
 | 
|---|
 | 416 | 
 | 
|---|
 | 417 |                 xml_attribute_struct* prev_attribute_c; ///< Previous attribute (cyclic list)
 | 
|---|
 | 418 |                 xml_attribute_struct* next_attribute;   ///< Next attribute
 | 
|---|
 | 419 |         };
 | 
|---|
 | 420 | 
 | 
|---|
 | 421 |         /// An XML document tree node.
 | 
|---|
 | 422 |         struct xml_node_struct
 | 
|---|
 | 423 |         {
 | 
|---|
 | 424 |                 /// Default ctor
 | 
|---|
 | 425 |                 /// \param type - node type
 | 
|---|
 | 426 |                 xml_node_struct(xml_memory_page* page, xml_node_type type): header(reinterpret_cast<uintptr_t>(page) | (type - 1)), parent(0), name(0), value(0), first_child(0), prev_sibling_c(0), next_sibling(0), first_attribute(0)
 | 
|---|
 | 427 |                 {
 | 
|---|
 | 428 |                 }
 | 
|---|
 | 429 | 
 | 
|---|
 | 430 |                 uintptr_t header;
 | 
|---|
 | 431 | 
 | 
|---|
 | 432 |                 xml_node_struct*                parent;                                 ///< Pointer to parent
 | 
|---|
 | 433 | 
 | 
|---|
 | 434 |                 char_t*                                 name;                                   ///< Pointer to element name.
 | 
|---|
 | 435 |                 char_t*                                 value;                                  ///< Pointer to any associated string data.
 | 
|---|
 | 436 | 
 | 
|---|
 | 437 |                 xml_node_struct*                first_child;                    ///< First child
 | 
|---|
 | 438 |                 
 | 
|---|
 | 439 |                 xml_node_struct*                prev_sibling_c;                 ///< Left brother (cyclic list)
 | 
|---|
 | 440 |                 xml_node_struct*                next_sibling;                   ///< Right brother
 | 
|---|
 | 441 |                 
 | 
|---|
 | 442 |                 xml_attribute_struct*   first_attribute;                ///< First attribute
 | 
|---|
 | 443 |         };
 | 
|---|
 | 444 | }
 | 
|---|
 | 445 | 
 | 
|---|
 | 446 | namespace
 | 
|---|
 | 447 | {
 | 
|---|
 | 448 |         struct xml_document_struct: public xml_node_struct, public xml_allocator
 | 
|---|
 | 449 |         {
 | 
|---|
 | 450 |                 xml_document_struct(xml_memory_page* page): xml_node_struct(page, node_document), xml_allocator(page), buffer(0)
 | 
|---|
 | 451 |                 {
 | 
|---|
 | 452 |                 }
 | 
|---|
 | 453 | 
 | 
|---|
 | 454 |                 const char_t* buffer;
 | 
|---|
 | 455 |         };
 | 
|---|
 | 456 | 
 | 
|---|
 | 457 |         static inline xml_allocator& get_allocator(const xml_node_struct* node)
 | 
|---|
 | 458 |         {
 | 
|---|
 | 459 |                 assert(node);
 | 
|---|
 | 460 | 
 | 
|---|
 | 461 |                 return *reinterpret_cast<xml_memory_page*>(node->header & xml_memory_page_pointer_mask)->allocator;
 | 
|---|
 | 462 |         }
 | 
|---|
 | 463 | }
 | 
|---|
 | 464 | 
 | 
|---|
 | 465 | // Low-level DOM operations
 | 
|---|
 | 466 | namespace
 | 
|---|
 | 467 | {
 | 
|---|
 | 468 |         inline xml_attribute_struct* allocate_attribute(xml_allocator& alloc)
 | 
|---|
 | 469 |         {
 | 
|---|
 | 470 |                 xml_memory_page* page;
 | 
|---|
 | 471 |                 void* memory = alloc.allocate_memory(sizeof(xml_attribute_struct), page);
 | 
|---|
 | 472 | 
 | 
|---|
 | 473 |                 return new (memory) xml_attribute_struct(page);
 | 
|---|
 | 474 |         }
 | 
|---|
 | 475 | 
 | 
|---|
 | 476 |         inline xml_node_struct* allocate_node(xml_allocator& alloc, xml_node_type type)
 | 
|---|
 | 477 |         {
 | 
|---|
 | 478 |                 xml_memory_page* page;
 | 
|---|
 | 479 |                 void* memory = alloc.allocate_memory(sizeof(xml_node_struct), page);
 | 
|---|
 | 480 | 
 | 
|---|
 | 481 |                 return new (memory) xml_node_struct(page, type);
 | 
|---|
 | 482 |         }
 | 
|---|
 | 483 | 
 | 
|---|
 | 484 |         inline void destroy_attribute(xml_attribute_struct* a, xml_allocator& alloc)
 | 
|---|
 | 485 |         {
 | 
|---|
 | 486 |                 uintptr_t header = a->header;
 | 
|---|
 | 487 | 
 | 
|---|
 | 488 |                 if (header & xml_memory_page_name_allocated_mask) alloc.deallocate_string(a->name);
 | 
|---|
 | 489 |                 if (header & xml_memory_page_value_allocated_mask) alloc.deallocate_string(a->value);
 | 
|---|
 | 490 | 
 | 
|---|
 | 491 |                 alloc.deallocate_memory(a, sizeof(xml_attribute_struct), reinterpret_cast<xml_memory_page*>(header & xml_memory_page_pointer_mask));
 | 
|---|
 | 492 |         }
 | 
|---|
 | 493 | 
 | 
|---|
 | 494 |         inline void destroy_node(xml_node_struct* n, xml_allocator& alloc)
 | 
|---|
 | 495 |         {
 | 
|---|
 | 496 |                 uintptr_t header = n->header;
 | 
|---|
 | 497 | 
 | 
|---|
 | 498 |                 if (header & xml_memory_page_name_allocated_mask) alloc.deallocate_string(n->name);
 | 
|---|
 | 499 |                 if (header & xml_memory_page_value_allocated_mask) alloc.deallocate_string(n->value);
 | 
|---|
 | 500 | 
 | 
|---|
 | 501 |                 for (xml_attribute_struct* attr = n->first_attribute; attr; )
 | 
|---|
 | 502 |                 {
 | 
|---|
 | 503 |                         xml_attribute_struct* next = attr->next_attribute;
 | 
|---|
 | 504 | 
 | 
|---|
 | 505 |                         destroy_attribute(attr, alloc);
 | 
|---|
 | 506 | 
 | 
|---|
 | 507 |                         attr = next;
 | 
|---|
 | 508 |                 }
 | 
|---|
 | 509 | 
 | 
|---|
 | 510 |                 for (xml_node_struct* child = n->first_child; child; )
 | 
|---|
 | 511 |                 {
 | 
|---|
 | 512 |                         xml_node_struct* next = child->next_sibling;
 | 
|---|
 | 513 | 
 | 
|---|
 | 514 |                         destroy_node(child, alloc);
 | 
|---|
 | 515 | 
 | 
|---|
 | 516 |                         child = next;
 | 
|---|
 | 517 |                 }
 | 
|---|
 | 518 | 
 | 
|---|
 | 519 |                 alloc.deallocate_memory(n, sizeof(xml_node_struct), reinterpret_cast<xml_memory_page*>(header & xml_memory_page_pointer_mask));
 | 
|---|
 | 520 |         }
 | 
|---|
 | 521 | 
 | 
|---|
 | 522 |         PUGIXML_NO_INLINE xml_node_struct* append_node(xml_node_struct* node, xml_allocator& alloc, xml_node_type type = node_element)
 | 
|---|
 | 523 |         {
 | 
|---|
 | 524 |                 xml_node_struct* child = allocate_node(alloc, type);
 | 
|---|
 | 525 |                 if (!child) return 0;
 | 
|---|
 | 526 | 
 | 
|---|
 | 527 |                 child->parent = node;
 | 
|---|
 | 528 | 
 | 
|---|
 | 529 |                 xml_node_struct* first_child = node->first_child;
 | 
|---|
 | 530 |                         
 | 
|---|
 | 531 |                 if (first_child)
 | 
|---|
 | 532 |                 {
 | 
|---|
 | 533 |                         xml_node_struct* last_child = first_child->prev_sibling_c;
 | 
|---|
 | 534 | 
 | 
|---|
 | 535 |                         last_child->next_sibling = child;
 | 
|---|
 | 536 |                         child->prev_sibling_c = last_child;
 | 
|---|
 | 537 |                         first_child->prev_sibling_c = child;
 | 
|---|
 | 538 |                 }
 | 
|---|
 | 539 |                 else
 | 
|---|
 | 540 |                 {
 | 
|---|
 | 541 |                         node->first_child = child;
 | 
|---|
 | 542 |                         child->prev_sibling_c = child;
 | 
|---|
 | 543 |                 }
 | 
|---|
 | 544 |                         
 | 
|---|
 | 545 |                 return child;
 | 
|---|
 | 546 |         }
 | 
|---|
 | 547 | 
 | 
|---|
 | 548 |         PUGIXML_NO_INLINE xml_attribute_struct* append_attribute_ll(xml_node_struct* node, xml_allocator& alloc)
 | 
|---|
 | 549 |         {
 | 
|---|
 | 550 |                 xml_attribute_struct* a = allocate_attribute(alloc);
 | 
|---|
 | 551 |                 if (!a) return 0;
 | 
|---|
 | 552 | 
 | 
|---|
 | 553 |                 xml_attribute_struct* first_attribute = node->first_attribute;
 | 
|---|
 | 554 | 
 | 
|---|
 | 555 |                 if (first_attribute)
 | 
|---|
 | 556 |                 {
 | 
|---|
 | 557 |                         xml_attribute_struct* last_attribute = first_attribute->prev_attribute_c;
 | 
|---|
 | 558 | 
 | 
|---|
 | 559 |                         last_attribute->next_attribute = a;
 | 
|---|
 | 560 |                         a->prev_attribute_c = last_attribute;
 | 
|---|
 | 561 |                         first_attribute->prev_attribute_c = a;
 | 
|---|
 | 562 |                 }
 | 
|---|
 | 563 |                 else
 | 
|---|
 | 564 |                 {
 | 
|---|
 | 565 |                         node->first_attribute = a;
 | 
|---|
 | 566 |                         a->prev_attribute_c = a;
 | 
|---|
 | 567 |                 }
 | 
|---|
 | 568 |                         
 | 
|---|
 | 569 |                 return a;
 | 
|---|
 | 570 |         }
 | 
|---|
 | 571 | }
 | 
|---|
 | 572 | 
 | 
|---|
 | 573 | // Helper classes for code generation
 | 
|---|
 | 574 | namespace
 | 
|---|
 | 575 | {
 | 
|---|
 | 576 |         struct opt_false
 | 
|---|
 | 577 |         {
 | 
|---|
 | 578 |                 enum { value = 0 };
 | 
|---|
 | 579 |         };
 | 
|---|
 | 580 | 
 | 
|---|
 | 581 |         struct opt_true
 | 
|---|
 | 582 |         {
 | 
|---|
 | 583 |                 enum { value = 1 };
 | 
|---|
 | 584 |         };
 | 
|---|
 | 585 | }
 | 
|---|
 | 586 | 
 | 
|---|
 | 587 | // Unicode utilities
 | 
|---|
 | 588 | namespace
 | 
|---|
 | 589 | {
 | 
|---|
 | 590 |         inline uint16_t endian_swap(uint16_t value)
 | 
|---|
 | 591 |         {
 | 
|---|
 | 592 |                 return static_cast<uint16_t>(((value & 0xff) << 8) | (value >> 8));
 | 
|---|
 | 593 |         }
 | 
|---|
 | 594 | 
 | 
|---|
 | 595 |         inline uint32_t endian_swap(uint32_t value)
 | 
|---|
 | 596 |         {
 | 
|---|
 | 597 |                 return ((value & 0xff) << 24) | ((value & 0xff00) << 8) | ((value & 0xff0000) >> 8) | (value >> 24);
 | 
|---|
 | 598 |         }
 | 
|---|
 | 599 | 
 | 
|---|
	// Output traits that only count how many UTF-8 bytes a stream of code points would occupy.
	// 'result' is the running byte total; each call returns the updated total.
	struct utf8_counter
	{
		typedef size_t value_type;

		// Accounts for a code point below U+10000 (1, 2 or 3 bytes).
		static value_type low(value_type result, uint32_t ch)
		{
			// U+0800..U+FFFF unless one of the shorter ranges matches
			size_t bytes = 3;

			// U+0000..U+007F
			if (ch < 0x80) bytes = 1;
			// U+0080..U+07FF
			else if (ch < 0x800) bytes = 2;

			return result + bytes;
		}

		// Accounts for a code point in U+10000..U+10FFFF (always 4 bytes).
		static value_type high(value_type result, uint32_t)
		{
			return result + 4;
		}
	};
 | 
|---|
 | 620 | 
 | 
|---|
	// Output traits that encode code points as UTF-8 bytes.
	// 'result' is the write cursor; each call returns the cursor advanced past the bytes written.
	struct utf8_writer
	{
		typedef uint8_t* value_type;

		// Encodes a code point below U+10000 using 1, 2 or 3 bytes.
		static value_type low(value_type result, uint32_t ch)
		{
			if (ch < 0x80)
			{
				// U+0000..U+007F
				*result++ = static_cast<uint8_t>(ch);
			}
			else if (ch < 0x800)
			{
				// U+0080..U+07FF
				*result++ = static_cast<uint8_t>(0xC0 | (ch >> 6));
				*result++ = static_cast<uint8_t>(0x80 | (ch & 0x3F));
			}
			else
			{
				// U+0800..U+FFFF
				*result++ = static_cast<uint8_t>(0xE0 | (ch >> 12));
				*result++ = static_cast<uint8_t>(0x80 | ((ch >> 6) & 0x3F));
				*result++ = static_cast<uint8_t>(0x80 | (ch & 0x3F));
			}

			return result;
		}

		// Encodes a code point in U+10000..U+10FFFF using 4 bytes.
		static value_type high(value_type result, uint32_t ch)
		{
			*result++ = static_cast<uint8_t>(0xF0 | (ch >> 18));
			*result++ = static_cast<uint8_t>(0x80 | ((ch >> 12) & 0x3F));
			*result++ = static_cast<uint8_t>(0x80 | ((ch >> 6) & 0x3F));
			*result++ = static_cast<uint8_t>(0x80 | (ch & 0x3F));

			return result;
		}

		// Encodes any code point by dispatching on the U+10000 boundary.
		static value_type any(value_type result, uint32_t ch)
		{
			if (ch < 0x10000) return low(result, ch);

			return high(result, ch);
		}
	};
 | 
|---|
 | 665 | 
 | 
|---|
	// Output traits that only count UTF-16 code units: one per code point below U+10000,
	// two (a surrogate pair) per code point at or above it.
	struct utf16_counter
	{
		typedef size_t value_type;

		static value_type low(value_type result, uint32_t) { return result + 1; }

		static value_type high(value_type result, uint32_t) { return result + 2; }
	};
 | 
|---|
 | 680 | 
 | 
|---|
	// Output traits that encode code points as UTF-16 code units in native byte order.
	// 'result' is the write cursor; each call returns the cursor advanced past the units written.
	struct utf16_writer
	{
		typedef uint16_t* value_type;

		// Stores a code point below U+10000 as a single code unit.
		static value_type low(value_type result, uint32_t ch)
		{
			result[0] = static_cast<uint16_t>(ch);

			return result + 1;
		}

		// Stores a code point at or above U+10000 as a lead/trail surrogate pair.
		static value_type high(value_type result, uint32_t ch)
		{
			// offset into the supplementary planes: top 10 bits go to the lead, low 10 bits to the trail
			const uint32_t offset = ch - 0x10000;

			*result++ = static_cast<uint16_t>(0xD800 + (offset >> 10));
			*result++ = static_cast<uint16_t>(0xDC00 + (offset & 0x3ff));

			return result;
		}

		// Stores any code point by dispatching on the U+10000 boundary.
		static value_type any(value_type result, uint32_t ch)
		{
			if (ch < 0x10000) return low(result, ch);

			return high(result, ch);
		}
	};
 | 
|---|
 | 708 | 
 | 
|---|
	// Output traits that only count UTF-32 code units: every code point takes exactly one.
	struct utf32_counter
	{
		typedef size_t value_type;

		static value_type low(value_type result, uint32_t) { return result + 1; }

		static value_type high(value_type result, uint32_t) { return result + 1; }
	};
 | 
|---|
 | 723 | 
 | 
|---|
	// Output traits that store code points as UTF-32 code units in native byte order.
	// Every entry point writes the code point unchanged and returns the cursor advanced by one unit.
	struct utf32_writer
	{
		typedef uint32_t* value_type;

		static value_type low(value_type result, uint32_t ch)
		{
			result[0] = ch;

			return result + 1;
		}

		static value_type high(value_type result, uint32_t ch)
		{
			result[0] = ch;

			return result + 1;
		}

		static value_type any(value_type result, uint32_t ch)
		{
			result[0] = ch;

			return result + 1;
		}
	};
 | 
|---|
 | 749 | 
 | 
|---|
 | 750 |         template <size_t size> struct wchar_selector;
 | 
|---|
 | 751 | 
 | 
|---|
 | 752 |         template <> struct wchar_selector<2>
 | 
|---|
 | 753 |         {
 | 
|---|
 | 754 |                 typedef uint16_t type;
 | 
|---|
 | 755 |                 typedef utf16_counter counter;
 | 
|---|
 | 756 |                 typedef utf16_writer writer;
 | 
|---|
 | 757 |         };
 | 
|---|
 | 758 | 
 | 
|---|
 | 759 |         template <> struct wchar_selector<4>
 | 
|---|
 | 760 |         {
 | 
|---|
 | 761 |                 typedef uint32_t type;
 | 
|---|
 | 762 |                 typedef utf32_counter counter;
 | 
|---|
 | 763 |                 typedef utf32_writer writer;
 | 
|---|
 | 764 |         };
 | 
|---|
 | 765 | 
 | 
|---|
 | 766 |         typedef wchar_selector<sizeof(wchar_t)>::counter wchar_counter;
 | 
|---|
 | 767 |         typedef wchar_selector<sizeof(wchar_t)>::writer wchar_writer;
 | 
|---|
 | 768 | 
 | 
|---|
 | 769 |         template <typename Traits, typename opt_swap = opt_false> struct utf_decoder
 | 
|---|
 | 770 |         {
 | 
|---|
 | 771 |                 static inline typename Traits::value_type decode_utf8_block(const uint8_t* data, size_t size, typename Traits::value_type result)
 | 
|---|
 | 772 |                 {
 | 
|---|
 | 773 |                         const uint8_t utf8_byte_mask = 0x3f;
 | 
|---|
 | 774 | 
 | 
|---|
 | 775 |                         while (size)
 | 
|---|
 | 776 |                         {
 | 
|---|
 | 777 |                                 uint8_t lead = *data;
 | 
|---|
 | 778 | 
 | 
|---|
 | 779 |                                 // 0xxxxxxx -> U+0000..U+007F
 | 
|---|
 | 780 |                                 if (lead < 0x80)
 | 
|---|
 | 781 |                                 {
 | 
|---|
 | 782 |                                         result = Traits::low(result, lead);
 | 
|---|
 | 783 |                                         data += 1;
 | 
|---|
 | 784 |                                         size -= 1;
 | 
|---|
 | 785 | 
 | 
|---|
 | 786 |                                         // process aligned single-byte (ascii) blocks
 | 
|---|
 | 787 |                                         if ((reinterpret_cast<uintptr_t>(data) & 3) == 0)
 | 
|---|
 | 788 |                                         {
 | 
|---|
 | 789 |                                                 while (size >= 4 && (*reinterpret_cast<const uint32_t*>(data) & 0x80808080) == 0)
 | 
|---|
 | 790 |                                                 {
 | 
|---|
 | 791 |                                                         result = Traits::low(result, data[0]);
 | 
|---|
 | 792 |                                                         result = Traits::low(result, data[1]);
 | 
|---|
 | 793 |                                                         result = Traits::low(result, data[2]);
 | 
|---|
 | 794 |                                                         result = Traits::low(result, data[3]);
 | 
|---|
 | 795 |                                                         data += 4;
 | 
|---|
 | 796 |                                                         size -= 4;
 | 
|---|
 | 797 |                                                 }
 | 
|---|
 | 798 |                                         }
 | 
|---|
 | 799 |                                 }
 | 
|---|
 | 800 |                                 // 110xxxxx -> U+0080..U+07FF
 | 
|---|
 | 801 |                                 else if ((unsigned)(lead - 0xC0) < 0x20 && size >= 2 && (data[1] & 0xc0) == 0x80)
 | 
|---|
 | 802 |                                 {
 | 
|---|
 | 803 |                                         result = Traits::low(result, ((lead & ~0xC0) << 6) | (data[1] & utf8_byte_mask));
 | 
|---|
 | 804 |                                         data += 2;
 | 
|---|
 | 805 |                                         size -= 2;
 | 
|---|
 | 806 |                                 }
 | 
|---|
 | 807 |                                 // 1110xxxx -> U+0800-U+FFFF
 | 
|---|
 | 808 |                                 else if ((unsigned)(lead - 0xE0) < 0x10 && size >= 3 && (data[1] & 0xc0) == 0x80 && (data[2] & 0xc0) == 0x80)
 | 
|---|
 | 809 |                                 {
 | 
|---|
 | 810 |                                         result = Traits::low(result, ((lead & ~0xE0) << 12) | ((data[1] & utf8_byte_mask) << 6) | (data[2] & utf8_byte_mask));
 | 
|---|
 | 811 |                                         data += 3;
 | 
|---|
 | 812 |                                         size -= 3;
 | 
|---|
 | 813 |                                 }
 | 
|---|
 | 814 |                                 // 11110xxx -> U+10000..U+10FFFF
 | 
|---|
 | 815 |                                 else if ((unsigned)(lead - 0xF0) < 0x08 && size >= 4 && (data[1] & 0xc0) == 0x80 && (data[2] & 0xc0) == 0x80 && (data[3] & 0xc0) == 0x80)
 | 
|---|
 | 816 |                                 {
 | 
|---|
 | 817 |                                         result = Traits::high(result, ((lead & ~0xF0) << 18) | ((data[1] & utf8_byte_mask) << 12) | ((data[2] & utf8_byte_mask) << 6) | (data[3] & utf8_byte_mask));
 | 
|---|
 | 818 |                                         data += 4;
 | 
|---|
 | 819 |                                         size -= 4;
 | 
|---|
 | 820 |                                 }
 | 
|---|
 | 821 |                                 // 10xxxxxx or 11111xxx -> invalid
 | 
|---|
 | 822 |                                 else
 | 
|---|
 | 823 |                                 {
 | 
|---|
 | 824 |                                         data += 1;
 | 
|---|
 | 825 |                                         size -= 1;
 | 
|---|
 | 826 |                                 }
 | 
|---|
 | 827 |                         }
 | 
|---|
 | 828 | 
 | 
|---|
 | 829 |                         return result;
 | 
|---|
 | 830 |                 }
 | 
|---|
 | 831 | 
 | 
|---|
 | 832 |                 static inline typename Traits::value_type decode_utf16_block(const uint16_t* data, size_t size, typename Traits::value_type result)
 | 
|---|
 | 833 |                 {
 | 
|---|
 | 834 |                         const uint16_t* end = data + size;
 | 
|---|
 | 835 | 
 | 
|---|
 | 836 |                         while (data < end)
 | 
|---|
 | 837 |                         {
 | 
|---|
 | 838 |                                 uint16_t lead = opt_swap::value ? endian_swap(*data) : *data;
 | 
|---|
 | 839 | 
 | 
|---|
 | 840 |                                 // U+0000..U+D7FF
 | 
|---|
 | 841 |                                 if (lead < 0xD800)
 | 
|---|
 | 842 |                                 {
 | 
|---|
 | 843 |                                         result = Traits::low(result, lead);
 | 
|---|
 | 844 |                                         data += 1;
 | 
|---|
 | 845 |                                 }
 | 
|---|
 | 846 |                                 // U+E000..U+FFFF
 | 
|---|
 | 847 |                                 else if ((unsigned)(lead - 0xE000) < 0x2000)
 | 
|---|
 | 848 |                                 {
 | 
|---|
 | 849 |                                         result = Traits::low(result, lead);
 | 
|---|
 | 850 |                                         data += 1;
 | 
|---|
 | 851 |                                 }
 | 
|---|
 | 852 |                                 // surrogate pair lead
 | 
|---|
 | 853 |                                 else if ((unsigned)(lead - 0xD800) < 0x400 && data + 1 < end)
 | 
|---|
 | 854 |                                 {
 | 
|---|
 | 855 |                                         uint16_t next = opt_swap::value ? endian_swap(data[1]) : data[1];
 | 
|---|
 | 856 | 
 | 
|---|
 | 857 |                                         if ((unsigned)(next - 0xDC00) < 0x400)
 | 
|---|
 | 858 |                                         {
 | 
|---|
 | 859 |                                                 result = Traits::high(result, 0x10000 + ((lead & 0x3ff) << 10) + (next & 0x3ff));
 | 
|---|
 | 860 |                                                 data += 2;
 | 
|---|
 | 861 |                                         }
 | 
|---|
 | 862 |                                         else
 | 
|---|
 | 863 |                                         {
 | 
|---|
 | 864 |                                                 data += 1;
 | 
|---|
 | 865 |                                         }
 | 
|---|
 | 866 |                                 }
 | 
|---|
 | 867 |                                 else
 | 
|---|
 | 868 |                                 {
 | 
|---|
 | 869 |                                         data += 1;
 | 
|---|
 | 870 |                                 }
 | 
|---|
 | 871 |                         }
 | 
|---|
 | 872 | 
 | 
|---|
 | 873 |                         return result;
 | 
|---|
 | 874 |                 }
 | 
|---|
 | 875 | 
 | 
|---|
 | 876 |                 static inline typename Traits::value_type decode_utf32_block(const uint32_t* data, size_t size, typename Traits::value_type result)
 | 
|---|
 | 877 |                 {
 | 
|---|
 | 878 |                         const uint32_t* end = data + size;
 | 
|---|
 | 879 | 
 | 
|---|
 | 880 |                         while (data < end)
 | 
|---|
 | 881 |                         {
 | 
|---|
 | 882 |                                 uint32_t lead = opt_swap::value ? endian_swap(*data) : *data;
 | 
|---|
 | 883 | 
 | 
|---|
 | 884 |                                 // U+0000..U+FFFF
 | 
|---|
 | 885 |                                 if (lead < 0x10000)
 | 
|---|
 | 886 |                                 {
 | 
|---|
 | 887 |                                         result = Traits::low(result, lead);
 | 
|---|
 | 888 |                                         data += 1;
 | 
|---|
 | 889 |                                 }
 | 
|---|
 | 890 |                                 // U+10000..U+10FFFF
 | 
|---|
 | 891 |                                 else
 | 
|---|
 | 892 |                                 {
 | 
|---|
 | 893 |                                         result = Traits::high(result, lead);
 | 
|---|
 | 894 |                                         data += 1;
 | 
|---|
 | 895 |                                 }
 | 
|---|
 | 896 |                         }
 | 
|---|
 | 897 | 
 | 
|---|
 | 898 |                         return result;
 | 
|---|
 | 899 |                 }
 | 
|---|
 | 900 |         };
 | 
|---|
 | 901 | 
 | 
|---|
	// Writes the byte-swapped form of each of the 'length' elements of 'data' to 'result', in order.
	template <typename T> inline void convert_utf_endian_swap(T* result, const T* data, size_t length)
	{
		for (const T* end = data + length; data != end; ++data, ++result)
		{
			*result = endian_swap(*data);
		}
	}
 | 
|---|
 | 906 | 
 | 
|---|
 | 907 |         inline void convert_wchar_endian_swap(wchar_t* result, const wchar_t* data, size_t length)
 | 
|---|
 | 908 |         {
 | 
|---|
 | 909 |                 for (size_t i = 0; i < length; ++i) result[i] = static_cast<wchar_t>(endian_swap(static_cast<wchar_selector<sizeof(wchar_t)>::type>(data[i])));
 | 
|---|
 | 910 |         }
 | 
|---|
 | 911 | }
 | 
|---|
 | 912 | 
 | 
|---|
 | 913 | namespace
 | 
|---|
 | 914 | {       
 | 
|---|
	// Bit flags stored in chartype_table; each flag marks the characters listed next to it.
	enum chartype_t
	{
		ct_parse_pcdata  = 1 << 0, // \0, &, \r, <
		ct_parse_attr    = 1 << 1, // \0, &, \r, ', "
		ct_parse_attr_ws = 1 << 2, // \0, &, \r, ', ", \n, tab
		ct_space         = 1 << 3, // \r, \n, space, tab
		ct_parse_cdata   = 1 << 4, // \0, ], >, \r
		ct_parse_comment = 1 << 5, // \0, -, >, \r
		ct_symbol        = 1 << 6, // Any symbol > 127, a-z, A-Z, 0-9, _, :, -, .
		ct_start_symbol  = 1 << 7  // Any symbol > 127, a-z, A-Z, _, :
	};
 | 
|---|
 | 926 | 
 | 
|---|
	// Per-character combination of chartype_t flags, indexed by character code (0..255).
	const unsigned char chartype_table[256] =
	{
		// 0-15 (\0 at 0, tab at 9, \n at 10, \r at 13)
		55, 0, 0, 0, 0, 0, 0, 0, 0, 12, 12, 0, 0, 63, 0, 0,
		// 16-31
		0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
		// 32-47 (space, ", &, ', -, .)
		8, 0, 6, 0, 0, 0, 7, 6, 0, 0, 0, 0, 0, 96, 64, 0,
		// 48-63 (0-9, :, <, >)
		64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 192, 0, 1, 0, 48, 0,
		// 64-79 (A-O)
		0, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192,
		// 80-95 (P-Z, ], _)
		192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 0, 0, 16, 0, 192,
		// 96-111 (a-o)
		0, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192,
		// 112-127 (p-z)
		192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 0, 0, 0, 0, 0,

		// 128-255: every entry is ct_symbol | ct_start_symbol
		192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192,
		192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192,
		192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192,
		192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192,
		192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192,
		192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192,
		192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192,
		192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192, 192
	};
 | 
|---|
 | 947 | 
 | 
|---|
	// Bit flags stored in chartypex_table; each flag marks the characters listed next to it.
	enum chartypex_t
	{
		ctx_special_pcdata = 1 << 0, // Any symbol >= 0 and < 32 (except \t, \r, \n), &, <, >
		ctx_special_attr   = 1 << 1, // Any symbol >= 0 and < 32 (except \t), &, <, >, "
		ctx_start_symbol   = 1 << 2, // Any symbol > 127, a-z, A-Z, _
		ctx_digit          = 1 << 3, // 0-9
		ctx_symbol         = 1 << 4  // Any symbol > 127, a-z, A-Z, 0-9, _, -, .
	};
 | 
|---|
 | 956 |         
 | 
|---|
	// Per-character combination of chartypex_t flags, indexed by character code (0..255).
	const unsigned char chartypex_table[256] =
	{
		// 0-15 (tab at 9, \n at 10, \r at 13)
		3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 2, 3, 3, 2, 3, 3,
		// 16-31
		3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
		// 32-47 (", &, -, .)
		0, 0, 2, 0, 0, 0, 3, 0, 0, 0, 0, 0, 0, 16, 16, 0,
		// 48-63 (0-9, <, >)
		24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 0, 0, 3, 0, 3, 0,

		// 64-79 (A-O)
		0, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20,
		// 80-95 (P-Z, _)
		20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 0, 0, 0, 0, 20,
		// 96-111 (a-o)
		0, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20,
		// 112-127 (p-z)
		20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 0, 0, 0, 0, 0,

		// 128-255: every entry is ctx_start_symbol | ctx_symbol
		20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20,
		20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20,
		20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20,
		20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20,
		20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20,
		20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20,
		20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20,
		20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20
	};
 | 
|---|
 | 978 |         
 | 
|---|
 | 979 | #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 980 |         #define IS_CHARTYPE_IMPL(c, ct, table) ((static_cast<unsigned int>(c) < 128 ? table[static_cast<unsigned int>(c)] : table[128]) & (ct))
 | 
|---|
 | 981 | #else
 | 
|---|
 | 982 |         #define IS_CHARTYPE_IMPL(c, ct, table) (table[static_cast<unsigned char>(c)] & (ct))
 | 
|---|
 | 983 | #endif
 | 
|---|
 | 984 | 
 | 
|---|
 | 985 |         #define IS_CHARTYPE(c, ct) IS_CHARTYPE_IMPL(c, ct, chartype_table)
 | 
|---|
 | 986 |         #define IS_CHARTYPEX(c, ct) IS_CHARTYPE_IMPL(c, ct, chartypex_table)
 | 
|---|
 | 987 | 
 | 
|---|
	// Returns true when the lowest-addressed byte of an unsigned int holding 1 is itself 1,
	// i.e. when the least significant byte is stored first.
	bool is_little_endian()
	{
		const unsigned int probe = 1;
		const unsigned char* first_byte = reinterpret_cast<const unsigned char*>(&probe);

		return first_byte[0] == 1;
	}
 | 
|---|
 | 994 | 
 | 
|---|
 | 995 |         xml_encoding get_wchar_encoding()
 | 
|---|
 | 996 |         {
 | 
|---|
 | 997 |                 STATIC_ASSERT(sizeof(wchar_t) == 2 || sizeof(wchar_t) == 4);
 | 
|---|
 | 998 | 
 | 
|---|
 | 999 |                 if (sizeof(wchar_t) == 2)
 | 
|---|
 | 1000 |                         return is_little_endian() ? encoding_utf16_le : encoding_utf16_be;
 | 
|---|
 | 1001 |                 else 
 | 
|---|
 | 1002 |                         return is_little_endian() ? encoding_utf32_le : encoding_utf32_be;
 | 
|---|
 | 1003 |         }
 | 
|---|
 | 1004 | 
 | 
|---|
 | 1005 |         xml_encoding guess_buffer_encoding(uint8_t d0, uint8_t d1, uint8_t d2, uint8_t d3)
 | 
|---|
 | 1006 |         {
 | 
|---|
 | 1007 |                 // look for BOM in first few bytes
 | 
|---|
 | 1008 |                 if (d0 == 0 && d1 == 0 && d2 == 0xfe && d3 == 0xff) return encoding_utf32_be;
 | 
|---|
 | 1009 |                 if (d0 == 0xff && d1 == 0xfe && d2 == 0 && d3 == 0) return encoding_utf32_le;
 | 
|---|
 | 1010 |                 if (d0 == 0xfe && d1 == 0xff) return encoding_utf16_be;
 | 
|---|
 | 1011 |                 if (d0 == 0xff && d1 == 0xfe) return encoding_utf16_le;
 | 
|---|
 | 1012 |                 if (d0 == 0xef && d1 == 0xbb && d2 == 0xbf) return encoding_utf8;
 | 
|---|
 | 1013 | 
 | 
|---|
 | 1014 |                 // look for <, <? or <?xm in various encodings
 | 
|---|
 | 1015 |                 if (d0 == 0 && d1 == 0 && d2 == 0 && d3 == 0x3c) return encoding_utf32_be;
 | 
|---|
 | 1016 |                 if (d0 == 0x3c && d1 == 0 && d2 == 0 && d3 == 0) return encoding_utf32_le;
 | 
|---|
 | 1017 |                 if (d0 == 0 && d1 == 0x3c && d2 == 0 && d3 == 0x3f) return encoding_utf16_be;
 | 
|---|
 | 1018 |                 if (d0 == 0x3c && d1 == 0 && d2 == 0x3f && d3 == 0) return encoding_utf16_le;
 | 
|---|
 | 1019 |                 if (d0 == 0x3c && d1 == 0x3f && d2 == 0x78 && d3 == 0x6d) return encoding_utf8;
 | 
|---|
 | 1020 | 
 | 
|---|
 | 1021 |                 // look for utf16 < followed by node name (this may fail, but is better than utf8 since it's zero terminated so early)
 | 
|---|
 | 1022 |                 if (d0 == 0 && d1 == 0x3c) return encoding_utf16_be;
 | 
|---|
 | 1023 |                 if (d0 == 0x3c && d1 == 0) return encoding_utf16_le;
 | 
|---|
 | 1024 | 
 | 
|---|
 | 1025 |                 // no known BOM detected, assume utf8
 | 
|---|
 | 1026 |                 return encoding_utf8;
 | 
|---|
 | 1027 |         }
 | 
|---|
 | 1028 | 
 | 
|---|
 | 1029 |         xml_encoding get_buffer_encoding(xml_encoding encoding, const void* contents, size_t size)
 | 
|---|
 | 1030 |         {
 | 
|---|
 | 1031 |                 // replace wchar encoding with utf implementation
 | 
|---|
 | 1032 |                 if (encoding == encoding_wchar) return get_wchar_encoding();
 | 
|---|
 | 1033 | 
 | 
|---|
 | 1034 |                 // replace utf16 encoding with utf16 with specific endianness
 | 
|---|
 | 1035 |                 if (encoding == encoding_utf16) return is_little_endian() ? encoding_utf16_le : encoding_utf16_be;
 | 
|---|
 | 1036 | 
 | 
|---|
 | 1037 |                 // replace utf32 encoding with utf32 with specific endianness
 | 
|---|
 | 1038 |                 if (encoding == encoding_utf32) return is_little_endian() ? encoding_utf32_le : encoding_utf32_be;
 | 
|---|
 | 1039 | 
 | 
|---|
 | 1040 |                 // only do autodetection if no explicit encoding is requested
 | 
|---|
 | 1041 |                 if (encoding != encoding_auto) return encoding;
 | 
|---|
 | 1042 | 
 | 
|---|
 | 1043 |                 // skip encoding autodetection if input buffer is too small
 | 
|---|
 | 1044 |                 if (size < 4) return encoding_utf8;
 | 
|---|
 | 1045 | 
 | 
|---|
 | 1046 |                 // try to guess encoding (based on XML specification, Appendix F.1)
 | 
|---|
 | 1047 |                 const uint8_t* data = static_cast<const uint8_t*>(contents);
 | 
|---|
 | 1048 | 
 | 
|---|
 | 1049 |                 DMC_VOLATILE uint8_t d0 = data[0], d1 = data[1], d2 = data[2], d3 = data[3];
 | 
|---|
 | 1050 | 
 | 
|---|
 | 1051 |                 return guess_buffer_encoding(d0, d1, d2, d3);
 | 
|---|
 | 1052 |         }
 | 
|---|
 | 1053 | 
 | 
|---|
 | 1054 |         bool get_mutable_buffer(char_t*& out_buffer, size_t& out_length, const void* contents, size_t size, bool is_mutable)
 | 
|---|
 | 1055 |         {
 | 
|---|
 | 1056 |                 if (is_mutable)
 | 
|---|
 | 1057 |                 {
 | 
|---|
 | 1058 |                         out_buffer = static_cast<char_t*>(const_cast<void*>(contents));
 | 
|---|
 | 1059 |                 }
 | 
|---|
 | 1060 |                 else
 | 
|---|
 | 1061 |                 {
 | 
|---|
 | 1062 |                         void* buffer = global_allocate(size > 0 ? size : 1);
 | 
|---|
 | 1063 |                         if (!buffer) return false;
 | 
|---|
 | 1064 | 
 | 
|---|
 | 1065 |                         memcpy(buffer, contents, size);
 | 
|---|
 | 1066 | 
 | 
|---|
 | 1067 |                         out_buffer = static_cast<char_t*>(buffer);
 | 
|---|
 | 1068 |                 }
 | 
|---|
 | 1069 | 
 | 
|---|
 | 1070 |                 out_length = size / sizeof(char_t);
 | 
|---|
 | 1071 | 
 | 
|---|
 | 1072 |                 return true;
 | 
|---|
 | 1073 |         }
 | 
|---|
 | 1074 | 
 | 
|---|
 | 1075 | #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 1076 |         inline bool need_endian_swap_utf(xml_encoding le, xml_encoding re)
 | 
|---|
 | 1077 |         {
 | 
|---|
 | 1078 |                 return (le == encoding_utf16_be && re == encoding_utf16_le) || (le == encoding_utf16_le && re == encoding_utf16_be) ||
 | 
|---|
 | 1079 |                        (le == encoding_utf32_be && re == encoding_utf32_le) || (le == encoding_utf32_le && re == encoding_utf32_be);
 | 
|---|
 | 1080 |         }
 | 
|---|
 | 1081 | 
 | 
|---|
 | 1082 |         bool convert_buffer_endian_swap(char_t*& out_buffer, size_t& out_length, const void* contents, size_t size, bool is_mutable)
 | 
|---|
 | 1083 |         {
 | 
|---|
 | 1084 |                 const char_t* data = static_cast<const char_t*>(contents);
 | 
|---|
 | 1085 |         
 | 
|---|
 | 1086 |                 if (is_mutable)
 | 
|---|
 | 1087 |                 {
 | 
|---|
 | 1088 |                         out_buffer = const_cast<char_t*>(data);
 | 
|---|
 | 1089 |                 }
 | 
|---|
 | 1090 |                 else
 | 
|---|
 | 1091 |                 {
 | 
|---|
 | 1092 |                         out_buffer = static_cast<char_t*>(global_allocate(size > 0 ? size : 1));
 | 
|---|
 | 1093 |                         if (!out_buffer) return false;
 | 
|---|
 | 1094 |                 }
 | 
|---|
 | 1095 | 
 | 
|---|
 | 1096 |                 out_length = size / sizeof(char_t);
 | 
|---|
 | 1097 | 
 | 
|---|
 | 1098 |                 convert_wchar_endian_swap(out_buffer, data, out_length);
 | 
|---|
 | 1099 | 
 | 
|---|
 | 1100 |                 return true;
 | 
|---|
 | 1101 |         }
 | 
|---|
 | 1102 | 
 | 
|---|
 | 1103 |         bool convert_buffer_utf8(char_t*& out_buffer, size_t& out_length, const void* contents, size_t size)
 | 
|---|
 | 1104 |         {
 | 
|---|
 | 1105 |                 const uint8_t* data = static_cast<const uint8_t*>(contents);
 | 
|---|
 | 1106 | 
 | 
|---|
 | 1107 |                 // first pass: get length in wchar_t units
 | 
|---|
 | 1108 |                 out_length = utf_decoder<wchar_counter>::decode_utf8_block(data, size, 0);
 | 
|---|
 | 1109 | 
 | 
|---|
 | 1110 |                 // allocate buffer of suitable length
 | 
|---|
 | 1111 |                 out_buffer = static_cast<char_t*>(global_allocate((out_length > 0 ? out_length : 1) * sizeof(char_t)));
 | 
|---|
 | 1112 |                 if (!out_buffer) return false;
 | 
|---|
 | 1113 | 
 | 
|---|
 | 1114 |                 // second pass: convert utf8 input to wchar_t
 | 
|---|
 | 1115 |                 wchar_writer::value_type out_begin = reinterpret_cast<wchar_writer::value_type>(out_buffer);
 | 
|---|
 | 1116 |                 wchar_writer::value_type out_end = utf_decoder<wchar_writer>::decode_utf8_block(data, size, out_begin);
 | 
|---|
 | 1117 | 
 | 
|---|
 | 1118 |                 assert(out_end == out_begin + out_length);
 | 
|---|
 | 1119 |                 (void)!out_end;
 | 
|---|
 | 1120 | 
 | 
|---|
 | 1121 |                 return true;
 | 
|---|
 | 1122 |         }
 | 
|---|
 | 1123 | 
 | 
|---|
 | 1124 |         template <typename opt_swap> bool convert_buffer_utf16(char_t*& out_buffer, size_t& out_length, const void* contents, size_t size, opt_swap)
 | 
|---|
 | 1125 |         {
 | 
|---|
 | 1126 |                 const uint16_t* data = static_cast<const uint16_t*>(contents);
 | 
|---|
 | 1127 |                 size_t length = size / sizeof(uint16_t);
 | 
|---|
 | 1128 | 
 | 
|---|
 | 1129 |                 // first pass: get length in wchar_t units
 | 
|---|
 | 1130 |                 out_length = utf_decoder<wchar_counter, opt_swap>::decode_utf16_block(data, length, 0);
 | 
|---|
 | 1131 | 
 | 
|---|
 | 1132 |                 // allocate buffer of suitable length
 | 
|---|
 | 1133 |                 out_buffer = static_cast<char_t*>(global_allocate((out_length > 0 ? out_length : 1) * sizeof(char_t)));
 | 
|---|
 | 1134 |                 if (!out_buffer) return false;
 | 
|---|
 | 1135 | 
 | 
|---|
 | 1136 |                 // second pass: convert utf16 input to wchar_t
 | 
|---|
 | 1137 |                 wchar_writer::value_type out_begin = reinterpret_cast<wchar_writer::value_type>(out_buffer);
 | 
|---|
 | 1138 |                 wchar_writer::value_type out_end = utf_decoder<wchar_writer, opt_swap>::decode_utf16_block(data, length, out_begin);
 | 
|---|
 | 1139 | 
 | 
|---|
 | 1140 |                 assert(out_end == out_begin + out_length);
 | 
|---|
 | 1141 |                 (void)!out_end;
 | 
|---|
 | 1142 | 
 | 
|---|
 | 1143 |                 return true;
 | 
|---|
 | 1144 |         }
 | 
|---|
 | 1145 | 
 | 
|---|
 | 1146 |         template <typename opt_swap> bool convert_buffer_utf32(char_t*& out_buffer, size_t& out_length, const void* contents, size_t size, opt_swap)
 | 
|---|
 | 1147 |         {
 | 
|---|
 | 1148 |                 const uint32_t* data = static_cast<const uint32_t*>(contents);
 | 
|---|
 | 1149 |                 size_t length = size / sizeof(uint32_t);
 | 
|---|
 | 1150 | 
 | 
|---|
 | 1151 |                 // first pass: get length in wchar_t units
 | 
|---|
 | 1152 |                 out_length = utf_decoder<wchar_counter, opt_swap>::decode_utf32_block(data, length, 0);
 | 
|---|
 | 1153 | 
 | 
|---|
 | 1154 |                 // allocate buffer of suitable length
 | 
|---|
 | 1155 |                 out_buffer = static_cast<char_t*>(global_allocate((out_length > 0 ? out_length : 1) * sizeof(char_t)));
 | 
|---|
 | 1156 |                 if (!out_buffer) return false;
 | 
|---|
 | 1157 | 
 | 
|---|
 | 1158 |                 // second pass: convert utf32 input to wchar_t
 | 
|---|
 | 1159 |                 wchar_writer::value_type out_begin = reinterpret_cast<wchar_writer::value_type>(out_buffer);
 | 
|---|
 | 1160 |                 wchar_writer::value_type out_end = utf_decoder<wchar_writer, opt_swap>::decode_utf32_block(data, length, out_begin);
 | 
|---|
 | 1161 | 
 | 
|---|
 | 1162 |                 assert(out_end == out_begin + out_length);
 | 
|---|
 | 1163 |                 (void)!out_end;
 | 
|---|
 | 1164 | 
 | 
|---|
 | 1165 |                 return true;
 | 
|---|
 | 1166 |         }
 | 
|---|
 | 1167 | 
 | 
|---|
 | 1168 |         bool convert_buffer(char_t*& out_buffer, size_t& out_length, xml_encoding encoding, const void* contents, size_t size, bool is_mutable)
 | 
|---|
 | 1169 |         {
 | 
|---|
 | 1170 |                 // get native encoding
 | 
|---|
 | 1171 |                 xml_encoding wchar_encoding = get_wchar_encoding();
 | 
|---|
 | 1172 | 
 | 
|---|
 | 1173 |                 // fast path: no conversion required
 | 
|---|
 | 1174 |                 if (encoding == wchar_encoding) return get_mutable_buffer(out_buffer, out_length, contents, size, is_mutable);
 | 
|---|
 | 1175 | 
 | 
|---|
 | 1176 |                 // only endian-swapping is required
 | 
|---|
 | 1177 |                 if (need_endian_swap_utf(encoding, wchar_encoding)) return convert_buffer_endian_swap(out_buffer, out_length, contents, size, is_mutable);
 | 
|---|
 | 1178 | 
 | 
|---|
 | 1179 |                 // source encoding is utf8
 | 
|---|
 | 1180 |                 if (encoding == encoding_utf8) return convert_buffer_utf8(out_buffer, out_length, contents, size);
 | 
|---|
 | 1181 | 
 | 
|---|
 | 1182 |                 // source encoding is utf16
 | 
|---|
 | 1183 |                 if (encoding == encoding_utf16_be || encoding == encoding_utf16_le)
 | 
|---|
 | 1184 |                 {
 | 
|---|
 | 1185 |                         xml_encoding native_encoding = is_little_endian() ? encoding_utf16_le : encoding_utf16_be;
 | 
|---|
 | 1186 | 
 | 
|---|
 | 1187 |                         return (native_encoding == encoding) ?
 | 
|---|
 | 1188 |                                 convert_buffer_utf16(out_buffer, out_length, contents, size, opt_false()) :
 | 
|---|
 | 1189 |                                 convert_buffer_utf16(out_buffer, out_length, contents, size, opt_true());
 | 
|---|
 | 1190 |                 }
 | 
|---|
 | 1191 | 
 | 
|---|
 | 1192 |                 // source encoding is utf32
 | 
|---|
 | 1193 |                 if (encoding == encoding_utf32_be || encoding == encoding_utf32_le)
 | 
|---|
 | 1194 |                 {
 | 
|---|
 | 1195 |                         xml_encoding native_encoding = is_little_endian() ? encoding_utf32_le : encoding_utf32_be;
 | 
|---|
 | 1196 | 
 | 
|---|
 | 1197 |                         return (native_encoding == encoding) ?
 | 
|---|
 | 1198 |                                 convert_buffer_utf32(out_buffer, out_length, contents, size, opt_false()) :
 | 
|---|
 | 1199 |                                 convert_buffer_utf32(out_buffer, out_length, contents, size, opt_true());
 | 
|---|
 | 1200 |                 }
 | 
|---|
 | 1201 | 
 | 
|---|
 | 1202 |                 assert(!"Invalid encoding");
 | 
|---|
 | 1203 |                 return false;
 | 
|---|
 | 1204 |         }
 | 
|---|
 | 1205 | #else
 | 
|---|
 | 1206 |         template <typename opt_swap> bool convert_buffer_utf16(char_t*& out_buffer, size_t& out_length, const void* contents, size_t size, opt_swap)
 | 
|---|
 | 1207 |         {
 | 
|---|
 | 1208 |                 const uint16_t* data = static_cast<const uint16_t*>(contents);
 | 
|---|
 | 1209 |                 size_t length = size / sizeof(uint16_t);
 | 
|---|
 | 1210 | 
 | 
|---|
 | 1211 |                 // first pass: get length in utf8 units
 | 
|---|
 | 1212 |                 out_length = utf_decoder<utf8_counter, opt_swap>::decode_utf16_block(data, length, 0);
 | 
|---|
 | 1213 | 
 | 
|---|
 | 1214 |                 // allocate buffer of suitable length
 | 
|---|
 | 1215 |                 out_buffer = static_cast<char_t*>(global_allocate((out_length > 0 ? out_length : 1) * sizeof(char_t)));
 | 
|---|
 | 1216 |                 if (!out_buffer) return false;
 | 
|---|
 | 1217 | 
 | 
|---|
 | 1218 |                 // second pass: convert utf16 input to utf8
 | 
|---|
 | 1219 |                 uint8_t* out_begin = reinterpret_cast<uint8_t*>(out_buffer);
 | 
|---|
 | 1220 |                 uint8_t* out_end = utf_decoder<utf8_writer, opt_swap>::decode_utf16_block(data, length, out_begin);
 | 
|---|
 | 1221 | 
 | 
|---|
 | 1222 |                 assert(out_end == out_begin + out_length);
 | 
|---|
 | 1223 |                 (void)!out_end;
 | 
|---|
 | 1224 | 
 | 
|---|
 | 1225 |                 return true;
 | 
|---|
 | 1226 |         }
 | 
|---|
 | 1227 | 
 | 
|---|
 | 1228 |         template <typename opt_swap> bool convert_buffer_utf32(char_t*& out_buffer, size_t& out_length, const void* contents, size_t size, opt_swap)
 | 
|---|
 | 1229 |         {
 | 
|---|
 | 1230 |                 const uint32_t* data = static_cast<const uint32_t*>(contents);
 | 
|---|
 | 1231 |                 size_t length = size / sizeof(uint32_t);
 | 
|---|
 | 1232 | 
 | 
|---|
 | 1233 |                 // first pass: get length in utf8 units
 | 
|---|
 | 1234 |                 out_length = utf_decoder<utf8_counter, opt_swap>::decode_utf32_block(data, length, 0);
 | 
|---|
 | 1235 | 
 | 
|---|
 | 1236 |                 // allocate buffer of suitable length
 | 
|---|
 | 1237 |                 out_buffer = static_cast<char_t*>(global_allocate((out_length > 0 ? out_length : 1) * sizeof(char_t)));
 | 
|---|
 | 1238 |                 if (!out_buffer) return false;
 | 
|---|
 | 1239 | 
 | 
|---|
 | 1240 |                 // second pass: convert utf32 input to utf8
 | 
|---|
 | 1241 |                 uint8_t* out_begin = reinterpret_cast<uint8_t*>(out_buffer);
 | 
|---|
 | 1242 |                 uint8_t* out_end = utf_decoder<utf8_writer, opt_swap>::decode_utf32_block(data, length, out_begin);
 | 
|---|
 | 1243 | 
 | 
|---|
 | 1244 |                 assert(out_end == out_begin + out_length);
 | 
|---|
 | 1245 |                 (void)!out_end;
 | 
|---|
 | 1246 | 
 | 
|---|
 | 1247 |                 return true;
 | 
|---|
 | 1248 |         }
 | 
|---|
 | 1249 | 
 | 
|---|
 | 1250 |         bool convert_buffer(char_t*& out_buffer, size_t& out_length, xml_encoding encoding, const void* contents, size_t size, bool is_mutable)
 | 
|---|
 | 1251 |         {
 | 
|---|
 | 1252 |                 // fast path: no conversion required
 | 
|---|
 | 1253 |                 if (encoding == encoding_utf8) return get_mutable_buffer(out_buffer, out_length, contents, size, is_mutable);
 | 
|---|
 | 1254 | 
 | 
|---|
 | 1255 |                 // source encoding is utf16
 | 
|---|
 | 1256 |                 if (encoding == encoding_utf16_be || encoding == encoding_utf16_le)
 | 
|---|
 | 1257 |                 {
 | 
|---|
 | 1258 |                         xml_encoding native_encoding = is_little_endian() ? encoding_utf16_le : encoding_utf16_be;
 | 
|---|
 | 1259 | 
 | 
|---|
 | 1260 |                         return (native_encoding == encoding) ?
 | 
|---|
 | 1261 |                                 convert_buffer_utf16(out_buffer, out_length, contents, size, opt_false()) :
 | 
|---|
 | 1262 |                                 convert_buffer_utf16(out_buffer, out_length, contents, size, opt_true());
 | 
|---|
 | 1263 |                 }
 | 
|---|
 | 1264 | 
 | 
|---|
 | 1265 |                 // source encoding is utf32
 | 
|---|
 | 1266 |                 if (encoding == encoding_utf32_be || encoding == encoding_utf32_le)
 | 
|---|
 | 1267 |                 {
 | 
|---|
 | 1268 |                         xml_encoding native_encoding = is_little_endian() ? encoding_utf32_le : encoding_utf32_be;
 | 
|---|
 | 1269 | 
 | 
|---|
 | 1270 |                         return (native_encoding == encoding) ?
 | 
|---|
 | 1271 |                                 convert_buffer_utf32(out_buffer, out_length, contents, size, opt_false()) :
 | 
|---|
 | 1272 |                                 convert_buffer_utf32(out_buffer, out_length, contents, size, opt_true());
 | 
|---|
 | 1273 |                 }
 | 
|---|
 | 1274 | 
 | 
|---|
 | 1275 |                 assert(!"Invalid encoding");
 | 
|---|
 | 1276 |                 return false;
 | 
|---|
 | 1277 |         }
 | 
|---|
 | 1278 | #endif
 | 
|---|
 | 1279 | 
 | 
|---|
 | 1280 |         size_t as_utf8_begin(const wchar_t* str, size_t length)
 | 
|---|
 | 1281 |         {
 | 
|---|
 | 1282 |                 STATIC_ASSERT(sizeof(wchar_t) == 2 || sizeof(wchar_t) == 4);
 | 
|---|
 | 1283 | 
 | 
|---|
 | 1284 |                 // get length in utf8 characters
 | 
|---|
 | 1285 |                 return sizeof(wchar_t) == 2 ?
 | 
|---|
 | 1286 |                         utf_decoder<utf8_counter>::decode_utf16_block(reinterpret_cast<const uint16_t*>(str), length, 0) :
 | 
|---|
 | 1287 |                         utf_decoder<utf8_counter>::decode_utf32_block(reinterpret_cast<const uint32_t*>(str), length, 0);
 | 
|---|
 | 1288 |     }
 | 
|---|
 | 1289 | 
 | 
|---|
 | 1290 |     void as_utf8_end(char* buffer, size_t size, const wchar_t* str, size_t length)
 | 
|---|
 | 1291 |     {
 | 
|---|
 | 1292 |                 STATIC_ASSERT(sizeof(wchar_t) == 2 || sizeof(wchar_t) == 4);
 | 
|---|
 | 1293 | 
 | 
|---|
 | 1294 |         // convert to utf8
 | 
|---|
 | 1295 |         uint8_t* begin = reinterpret_cast<uint8_t*>(buffer);
 | 
|---|
 | 1296 |         uint8_t* end = sizeof(wchar_t) == 2 ?
 | 
|---|
 | 1297 |             utf_decoder<utf8_writer>::decode_utf16_block(reinterpret_cast<const uint16_t*>(str), length, begin) :
 | 
|---|
 | 1298 |             utf_decoder<utf8_writer>::decode_utf32_block(reinterpret_cast<const uint32_t*>(str), length, begin);
 | 
|---|
 | 1299 |     
 | 
|---|
 | 1300 |         assert(begin + size == end);
 | 
|---|
 | 1301 |         (void)!end;
 | 
|---|
 | 1302 | 
 | 
|---|
 | 1303 |                 // zero-terminate
 | 
|---|
 | 1304 |                 buffer[size] = 0;
 | 
|---|
 | 1305 |         }
 | 
|---|
 | 1306 |     
 | 
|---|
 | 1307 | #ifndef PUGIXML_NO_STL
 | 
|---|
 | 1308 |     std::string as_utf8_impl(const wchar_t* str, size_t length)
 | 
|---|
 | 1309 |     {
 | 
|---|
 | 1310 |                 // first pass: get length in utf8 characters
 | 
|---|
 | 1311 |         size_t size = as_utf8_begin(str, length);
 | 
|---|
 | 1312 | 
 | 
|---|
 | 1313 |                 // allocate resulting string
 | 
|---|
 | 1314 |                 std::string result;
 | 
|---|
 | 1315 |                 result.resize(size);
 | 
|---|
 | 1316 | 
 | 
|---|
 | 1317 |                 // second pass: convert to utf8
 | 
|---|
 | 1318 |                 if (size > 0) as_utf8_end(&result[0], size, str, length);
 | 
|---|
 | 1319 | 
 | 
|---|
 | 1320 |                 return result;
 | 
|---|
 | 1321 |     }
 | 
|---|
 | 1322 | 
 | 
|---|
 | 1323 |         std::wstring as_wide_impl(const char* str, size_t size)
 | 
|---|
 | 1324 |         {
 | 
|---|
 | 1325 |                 const uint8_t* data = reinterpret_cast<const uint8_t*>(str);
 | 
|---|
 | 1326 | 
 | 
|---|
 | 1327 |                 // first pass: get length in wchar_t units
 | 
|---|
 | 1328 |                 size_t length = utf_decoder<wchar_counter>::decode_utf8_block(data, size, 0);
 | 
|---|
 | 1329 | 
 | 
|---|
 | 1330 |                 // allocate resulting string
 | 
|---|
 | 1331 |                 std::wstring result;
 | 
|---|
 | 1332 |                 result.resize(length);
 | 
|---|
 | 1333 | 
 | 
|---|
 | 1334 |                 // second pass: convert to wchar_t
 | 
|---|
 | 1335 |                 if (length > 0)
 | 
|---|
 | 1336 |                 {
 | 
|---|
 | 1337 |                         wchar_writer::value_type begin = reinterpret_cast<wchar_writer::value_type>(&result[0]);
 | 
|---|
 | 1338 |                         wchar_writer::value_type end = utf_decoder<wchar_writer>::decode_utf8_block(data, size, begin);
 | 
|---|
 | 1339 | 
 | 
|---|
 | 1340 |                         assert(begin + length == end);
 | 
|---|
 | 1341 |                         (void)!end;
 | 
|---|
 | 1342 |                 }
 | 
|---|
 | 1343 | 
 | 
|---|
 | 1344 |                 return result;
 | 
|---|
 | 1345 |         }
 | 
|---|
 | 1346 | #endif
 | 
|---|
 | 1347 | 
 | 
|---|
 | 1348 |         inline bool strcpy_insitu_allow(size_t length, uintptr_t allocated, char_t* target)
 | 
|---|
 | 1349 |         {
 | 
|---|
 | 1350 |                 assert(target);
 | 
|---|
 | 1351 |                 size_t target_length = strlength(target);
 | 
|---|
 | 1352 | 
 | 
|---|
 | 1353 |                 // always reuse document buffer memory if possible
 | 
|---|
 | 1354 |                 if (!allocated) return target_length >= length;
 | 
|---|
 | 1355 | 
 | 
|---|
 | 1356 |                 // reuse heap memory if waste is not too great
 | 
|---|
 | 1357 |                 const size_t reuse_threshold = 32;
 | 
|---|
 | 1358 | 
 | 
|---|
 | 1359 |                 return target_length >= length && (target_length < reuse_threshold || target_length - length < target_length / 2);
 | 
|---|
 | 1360 |         }
 | 
|---|
 | 1361 | 
 | 
|---|
 | 1362 |         bool strcpy_insitu(char_t*& dest, uintptr_t& header, uintptr_t header_mask, const char_t* source)
 | 
|---|
 | 1363 |         {
 | 
|---|
 | 1364 |                 size_t source_length = strlength(source);
 | 
|---|
 | 1365 | 
 | 
|---|
 | 1366 |                 if (source_length == 0)
 | 
|---|
 | 1367 |                 {
 | 
|---|
 | 1368 |                         // empty string and null pointer are equivalent, so just deallocate old memory
 | 
|---|
 | 1369 |                         xml_allocator* alloc = reinterpret_cast<xml_memory_page*>(header & xml_memory_page_pointer_mask)->allocator;
 | 
|---|
 | 1370 | 
 | 
|---|
 | 1371 |                         if (header & header_mask) alloc->deallocate_string(dest);
 | 
|---|
 | 1372 |                         
 | 
|---|
 | 1373 |                         // mark the string as not allocated
 | 
|---|
 | 1374 |                         dest = 0;
 | 
|---|
 | 1375 |                         header &= ~header_mask;
 | 
|---|
 | 1376 | 
 | 
|---|
 | 1377 |                         return true;
 | 
|---|
 | 1378 |                 }
 | 
|---|
 | 1379 |                 else if (dest && strcpy_insitu_allow(source_length, header & header_mask, dest))
 | 
|---|
 | 1380 |                 {
 | 
|---|
 | 1381 |                         // we can reuse old buffer, so just copy the new data (including zero terminator)
 | 
|---|
 | 1382 |                         memcpy(dest, source, (source_length + 1) * sizeof(char_t));
 | 
|---|
 | 1383 |                         
 | 
|---|
 | 1384 |                         return true;
 | 
|---|
 | 1385 |                 }
 | 
|---|
 | 1386 |                 else
 | 
|---|
 | 1387 |                 {
 | 
|---|
 | 1388 |                         xml_allocator* alloc = reinterpret_cast<xml_memory_page*>(header & xml_memory_page_pointer_mask)->allocator;
 | 
|---|
 | 1389 | 
 | 
|---|
 | 1390 |                         // allocate new buffer
 | 
|---|
 | 1391 |                         char_t* buf = alloc->allocate_string(source_length + 1);
 | 
|---|
 | 1392 |                         if (!buf) return false;
 | 
|---|
 | 1393 | 
 | 
|---|
 | 1394 |                         // copy the string (including zero terminator)
 | 
|---|
 | 1395 |                         memcpy(buf, source, (source_length + 1) * sizeof(char_t));
 | 
|---|
 | 1396 | 
 | 
|---|
 | 1397 |                         // deallocate old buffer (*after* the above to protect against overlapping memory and/or allocation failures)
 | 
|---|
 | 1398 |                         if (header & header_mask) alloc->deallocate_string(dest);
 | 
|---|
 | 1399 |                         
 | 
|---|
 | 1400 |                         // the string is now allocated, so set the flag
 | 
|---|
 | 1401 |                         dest = buf;
 | 
|---|
 | 1402 |                         header |= header_mask;
 | 
|---|
 | 1403 | 
 | 
|---|
 | 1404 |                         return true;
 | 
|---|
 | 1405 |                 }
 | 
|---|
 | 1406 |         }
 | 
|---|
 | 1407 | 
 | 
|---|
 | 1408 |         struct gap
 | 
|---|
 | 1409 |         {
 | 
|---|
 | 1410 |                 char_t* end;
 | 
|---|
 | 1411 |                 size_t size;
 | 
|---|
 | 1412 |                         
 | 
|---|
 | 1413 |                 gap(): end(0), size(0)
 | 
|---|
 | 1414 |                 {
 | 
|---|
 | 1415 |                 }
 | 
|---|
 | 1416 |                         
 | 
|---|
 | 1417 |                 // Push new gap, move s count bytes further (skipping the gap).
 | 
|---|
 | 1418 |                 // Collapse previous gap.
 | 
|---|
 | 1419 |                 void push(char_t*& s, size_t count)
 | 
|---|
 | 1420 |                 {
 | 
|---|
 | 1421 |                         if (end) // there was a gap already; collapse it
 | 
|---|
 | 1422 |                         {
 | 
|---|
 | 1423 |                                 // Move [old_gap_end, new_gap_start) to [old_gap_start, ...)
 | 
|---|
 | 1424 |                                 assert(s >= end);
 | 
|---|
 | 1425 |                                 memmove(end - size, end, reinterpret_cast<char*>(s) - reinterpret_cast<char*>(end));
 | 
|---|
 | 1426 |                         }
 | 
|---|
 | 1427 |                                 
 | 
|---|
 | 1428 |                         s += count; // end of current gap
 | 
|---|
 | 1429 |                                 
 | 
|---|
 | 1430 |                         // "merge" two gaps
 | 
|---|
 | 1431 |                         end = s;
 | 
|---|
 | 1432 |                         size += count;
 | 
|---|
 | 1433 |                 }
 | 
|---|
 | 1434 |                         
 | 
|---|
 | 1435 |                 // Collapse all gaps, return past-the-end pointer
 | 
|---|
 | 1436 |                 char_t* flush(char_t* s)
 | 
|---|
 | 1437 |                 {
 | 
|---|
 | 1438 |                         if (end)
 | 
|---|
 | 1439 |                         {
 | 
|---|
 | 1440 |                                 // Move [old_gap_end, current_pos) to [old_gap_start, ...)
 | 
|---|
 | 1441 |                                 assert(s >= end);
 | 
|---|
 | 1442 |                                 memmove(end - size, end, reinterpret_cast<char*>(s) - reinterpret_cast<char*>(end));
 | 
|---|
 | 1443 | 
 | 
|---|
 | 1444 |                                 return s - size;
 | 
|---|
 | 1445 |                         }
 | 
|---|
 | 1446 |                         else return s;
 | 
|---|
 | 1447 |                 }
 | 
|---|
 | 1448 |         };
 | 
|---|
 | 1449 |         
 | 
|---|
 | 1450 |         char_t* strconv_escape(char_t* s, gap& g)
 | 
|---|
 | 1451 |         {
 | 
|---|
 | 1452 |                 char_t* stre = s + 1;
 | 
|---|
 | 1453 | 
 | 
|---|
 | 1454 |                 switch (*stre)
 | 
|---|
 | 1455 |                 {
 | 
|---|
 | 1456 |                         case '#':       // &#...
 | 
|---|
 | 1457 |                         {
 | 
|---|
 | 1458 |                                 unsigned int ucsc = 0;
 | 
|---|
 | 1459 | 
 | 
|---|
 | 1460 |                                 if (stre[1] == 'x') // &#x... (hex code)
 | 
|---|
 | 1461 |                                 {
 | 
|---|
 | 1462 |                                         stre += 2;
 | 
|---|
 | 1463 | 
 | 
|---|
 | 1464 |                                         char_t ch = *stre;
 | 
|---|
 | 1465 | 
 | 
|---|
 | 1466 |                                         if (ch == ';') return stre;
 | 
|---|
 | 1467 | 
 | 
|---|
 | 1468 |                                         for (;;)
 | 
|---|
 | 1469 |                                         {
 | 
|---|
 | 1470 |                                                 if (static_cast<unsigned int>(ch - '0') <= 9)
 | 
|---|
 | 1471 |                                                         ucsc = 16 * ucsc + (ch - '0');
 | 
|---|
 | 1472 |                                                 else if (static_cast<unsigned int>((ch | ' ') - 'a') <= 5)
 | 
|---|
 | 1473 |                                                         ucsc = 16 * ucsc + ((ch | ' ') - 'a' + 10);
 | 
|---|
 | 1474 |                                                 else if (ch == ';')
 | 
|---|
 | 1475 |                                                         break;
 | 
|---|
 | 1476 |                                                 else // cancel
 | 
|---|
 | 1477 |                                                         return stre;
 | 
|---|
 | 1478 | 
 | 
|---|
 | 1479 |                                                 ch = *++stre;
 | 
|---|
 | 1480 |                                         }
 | 
|---|
 | 1481 |                                         
 | 
|---|
 | 1482 |                                         ++stre;
 | 
|---|
 | 1483 |                                 }
 | 
|---|
 | 1484 |                                 else    // &#... (dec code)
 | 
|---|
 | 1485 |                                 {
 | 
|---|
 | 1486 |                                         char_t ch = *++stre;
 | 
|---|
 | 1487 | 
 | 
|---|
 | 1488 |                                         if (ch == ';') return stre;
 | 
|---|
 | 1489 | 
 | 
|---|
 | 1490 |                                         for (;;)
 | 
|---|
 | 1491 |                                         {
 | 
|---|
 | 1492 |                                                 if (static_cast<unsigned int>(ch - '0') <= 9)
 | 
|---|
 | 1493 |                                                         ucsc = 10 * ucsc + (ch - '0');
 | 
|---|
 | 1494 |                                                 else if (ch == ';')
 | 
|---|
 | 1495 |                                                         break;
 | 
|---|
 | 1496 |                                                 else // cancel
 | 
|---|
 | 1497 |                                                         return stre;
 | 
|---|
 | 1498 | 
 | 
|---|
 | 1499 |                                                 ch = *++stre;
 | 
|---|
 | 1500 |                                         }
 | 
|---|
 | 1501 |                                         
 | 
|---|
 | 1502 |                                         ++stre;
 | 
|---|
 | 1503 |                                 }
 | 
|---|
 | 1504 | 
 | 
|---|
 | 1505 |                         #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 1506 |                                 s = reinterpret_cast<char_t*>(wchar_writer::any(reinterpret_cast<wchar_writer::value_type>(s), ucsc));
 | 
|---|
 | 1507 |                         #else
 | 
|---|
 | 1508 |                                 s = reinterpret_cast<char_t*>(utf8_writer::any(reinterpret_cast<uint8_t*>(s), ucsc));
 | 
|---|
 | 1509 |                         #endif
 | 
|---|
 | 1510 |                                         
 | 
|---|
 | 1511 |                                 g.push(s, stre - s);
 | 
|---|
 | 1512 |                                 return stre;
 | 
|---|
 | 1513 |                         }
 | 
|---|
 | 1514 |                         case 'a':       // &a
 | 
|---|
 | 1515 |                         {
 | 
|---|
 | 1516 |                                 ++stre;
 | 
|---|
 | 1517 | 
 | 
|---|
 | 1518 |                                 if (*stre == 'm') // &am
 | 
|---|
 | 1519 |                                 {
 | 
|---|
 | 1520 |                                         if (*++stre == 'p' && *++stre == ';') // &
 | 
|---|
 | 1521 |                                         {
 | 
|---|
 | 1522 |                                                 *s++ = '&';
 | 
|---|
 | 1523 |                                                 ++stre;
 | 
|---|
 | 1524 |                                                         
 | 
|---|
 | 1525 |                                                 g.push(s, stre - s);
 | 
|---|
 | 1526 |                                                 return stre;
 | 
|---|
 | 1527 |                                         }
 | 
|---|
 | 1528 |                                 }
 | 
|---|
 | 1529 |                                 else if (*stre == 'p') // &ap
 | 
|---|
 | 1530 |                                 {
 | 
|---|
 | 1531 |                                         if (*++stre == 'o' && *++stre == 's' && *++stre == ';') // '
 | 
|---|
 | 1532 |                                         {
 | 
|---|
 | 1533 |                                                 *s++ = '\'';
 | 
|---|
 | 1534 |                                                 ++stre;
 | 
|---|
 | 1535 | 
 | 
|---|
 | 1536 |                                                 g.push(s, stre - s);
 | 
|---|
 | 1537 |                                                 return stre;
 | 
|---|
 | 1538 |                                         }
 | 
|---|
 | 1539 |                                 }
 | 
|---|
 | 1540 |                                 break;
 | 
|---|
 | 1541 |                         }
 | 
|---|
 | 1542 |                         case 'g': // &g
 | 
|---|
 | 1543 |                         {
 | 
|---|
 | 1544 |                                 if (*++stre == 't' && *++stre == ';') // >
 | 
|---|
 | 1545 |                                 {
 | 
|---|
 | 1546 |                                         *s++ = '>';
 | 
|---|
 | 1547 |                                         ++stre;
 | 
|---|
 | 1548 |                                         
 | 
|---|
 | 1549 |                                         g.push(s, stre - s);
 | 
|---|
 | 1550 |                                         return stre;
 | 
|---|
 | 1551 |                                 }
 | 
|---|
 | 1552 |                                 break;
 | 
|---|
 | 1553 |                         }
 | 
|---|
 | 1554 |                         case 'l': // &l
 | 
|---|
 | 1555 |                         {
 | 
|---|
 | 1556 |                                 if (*++stre == 't' && *++stre == ';') // <
 | 
|---|
 | 1557 |                                 {
 | 
|---|
 | 1558 |                                         *s++ = '<';
 | 
|---|
 | 1559 |                                         ++stre;
 | 
|---|
 | 1560 |                                                 
 | 
|---|
 | 1561 |                                         g.push(s, stre - s);
 | 
|---|
 | 1562 |                                         return stre;
 | 
|---|
 | 1563 |                                 }
 | 
|---|
 | 1564 |                                 break;
 | 
|---|
 | 1565 |                         }
 | 
|---|
 | 1566 |                         case 'q': // &q
 | 
|---|
 | 1567 |                         {
 | 
|---|
 | 1568 |                                 if (*++stre == 'u' && *++stre == 'o' && *++stre == 't' && *++stre == ';') // "
 | 
|---|
 | 1569 |                                 {
 | 
|---|
 | 1570 |                                         *s++ = '"';
 | 
|---|
 | 1571 |                                         ++stre;
 | 
|---|
 | 1572 |                                         
 | 
|---|
 | 1573 |                                         g.push(s, stre - s);
 | 
|---|
 | 1574 |                                         return stre;
 | 
|---|
 | 1575 |                                 }
 | 
|---|
 | 1576 |                                 break;
 | 
|---|
 | 1577 |                         }
 | 
|---|
 | 1578 |                 }
 | 
|---|
 | 1579 |                 
 | 
|---|
 | 1580 |                 return stre;
 | 
|---|
 | 1581 |         }
 | 
|---|
 | 1582 | 
 | 
|---|
        // Utility macro for last character handling.
        // Evaluates to true when c equals e, or when c is the zero terminator and
        // endch equals e. The macro reads a variable named endch that must be in
        // scope at the point of use.
        // NOTE(review): presumably endch holds the character that originally occupied
        // the terminator's position in the buffer - confirm against the callers.
        #define ENDSWITH(c, e) ((c) == (e) || ((c) == 0 && endch == (e)))
 | 
|---|
 | 1585 | 
 | 
|---|
 | 1586 |         char_t* strconv_comment(char_t* s, char_t endch)
 | 
|---|
 | 1587 |         {
 | 
|---|
 | 1588 |                 gap g;
 | 
|---|
 | 1589 |                 
 | 
|---|
 | 1590 |                 while (true)
 | 
|---|
 | 1591 |                 {
 | 
|---|
 | 1592 |                         while (!IS_CHARTYPE(*s, ct_parse_comment)) ++s;
 | 
|---|
 | 1593 |                 
 | 
|---|
 | 1594 |                         if (*s == '\r') // Either a single 0x0d or 0x0d 0x0a pair
 | 
|---|
 | 1595 |                         {
 | 
|---|
 | 1596 |                                 *s++ = '\n'; // replace first one with 0x0a
 | 
|---|
 | 1597 |                                 
 | 
|---|
 | 1598 |                                 if (*s == '\n') g.push(s, 1);
 | 
|---|
 | 1599 |                         }
 | 
|---|
 | 1600 |                         else if (s[0] == '-' && s[1] == '-' && ENDSWITH(s[2], '>')) // comment ends here
 | 
|---|
 | 1601 |                         {
 | 
|---|
 | 1602 |                                 *g.flush(s) = 0;
 | 
|---|
 | 1603 |                                 
 | 
|---|
 | 1604 |                                 return s + (s[2] == '>' ? 3 : 2);
 | 
|---|
 | 1605 |                         }
 | 
|---|
 | 1606 |                         else if (*s == 0)
 | 
|---|
 | 1607 |                         {
 | 
|---|
 | 1608 |                                 return 0;
 | 
|---|
 | 1609 |                         }
 | 
|---|
 | 1610 |                         else ++s;
 | 
|---|
 | 1611 |                 }
 | 
|---|
 | 1612 |         }
 | 
|---|
 | 1613 | 
 | 
|---|
 | 1614 |         char_t* strconv_cdata(char_t* s, char_t endch)
 | 
|---|
 | 1615 |         {
 | 
|---|
 | 1616 |                 gap g;
 | 
|---|
 | 1617 |                         
 | 
|---|
 | 1618 |                 while (true)
 | 
|---|
 | 1619 |                 {
 | 
|---|
 | 1620 |                         while (!IS_CHARTYPE(*s, ct_parse_cdata)) ++s;
 | 
|---|
 | 1621 |                         
 | 
|---|
 | 1622 |                         if (*s == '\r') // Either a single 0x0d or 0x0d 0x0a pair
 | 
|---|
 | 1623 |                         {
 | 
|---|
 | 1624 |                                 *s++ = '\n'; // replace first one with 0x0a
 | 
|---|
 | 1625 |                                 
 | 
|---|
 | 1626 |                                 if (*s == '\n') g.push(s, 1);
 | 
|---|
 | 1627 |                         }
 | 
|---|
 | 1628 |                         else if (s[0] == ']' && s[1] == ']' && ENDSWITH(s[2], '>')) // CDATA ends here
 | 
|---|
 | 1629 |                         {
 | 
|---|
 | 1630 |                                 *g.flush(s) = 0;
 | 
|---|
 | 1631 |                                 
 | 
|---|
 | 1632 |                                 return s + 1;
 | 
|---|
 | 1633 |                         }
 | 
|---|
 | 1634 |                         else if (*s == 0)
 | 
|---|
 | 1635 |                         {
 | 
|---|
 | 1636 |                                 return 0;
 | 
|---|
 | 1637 |                         }
 | 
|---|
 | 1638 |                         else ++s;
 | 
|---|
 | 1639 |                 }
 | 
|---|
 | 1640 |         }
 | 
|---|
 | 1641 |         
 | 
|---|
 | 1642 |         typedef char_t* (*strconv_pcdata_t)(char_t*);
 | 
|---|
 | 1643 |                 
 | 
|---|
 | 1644 |         template <typename opt_eol, typename opt_escape> struct strconv_pcdata_impl
 | 
|---|
 | 1645 |         {
 | 
|---|
 | 1646 |                 static char_t* parse(char_t* s)
 | 
|---|
 | 1647 |                 {
 | 
|---|
 | 1648 |                         gap g;
 | 
|---|
 | 1649 |                         
 | 
|---|
 | 1650 |                         while (true)
 | 
|---|
 | 1651 |                         {
 | 
|---|
 | 1652 |                                 while (!IS_CHARTYPE(*s, ct_parse_pcdata)) ++s;
 | 
|---|
 | 1653 |                                         
 | 
|---|
 | 1654 |                                 if (*s == '<') // PCDATA ends here
 | 
|---|
 | 1655 |                                 {
 | 
|---|
 | 1656 |                                         *g.flush(s) = 0;
 | 
|---|
 | 1657 |                                         
 | 
|---|
 | 1658 |                                         return s + 1;
 | 
|---|
 | 1659 |                                 }
 | 
|---|
 | 1660 |                                 else if (opt_eol::value && *s == '\r') // Either a single 0x0d or 0x0d 0x0a pair
 | 
|---|
 | 1661 |                                 {
 | 
|---|
 | 1662 |                                         *s++ = '\n'; // replace first one with 0x0a
 | 
|---|
 | 1663 |                                         
 | 
|---|
 | 1664 |                                         if (*s == '\n') g.push(s, 1);
 | 
|---|
 | 1665 |                                 }
 | 
|---|
 | 1666 |                                 else if (opt_escape::value && *s == '&')
 | 
|---|
 | 1667 |                                 {
 | 
|---|
 | 1668 |                                         s = strconv_escape(s, g);
 | 
|---|
 | 1669 |                                 }
 | 
|---|
 | 1670 |                                 else if (*s == 0)
 | 
|---|
 | 1671 |                                 {
 | 
|---|
 | 1672 |                                         return s;
 | 
|---|
 | 1673 |                                 }
 | 
|---|
 | 1674 |                                 else ++s;
 | 
|---|
 | 1675 |                         }
 | 
|---|
 | 1676 |                 }
 | 
|---|
 | 1677 |         };
 | 
|---|
 | 1678 |         
 | 
|---|
 | 1679 |         strconv_pcdata_t get_strconv_pcdata(unsigned int optmask)
 | 
|---|
 | 1680 |         {
 | 
|---|
 | 1681 |                 STATIC_ASSERT(parse_escapes == 0x10 && parse_eol == 0x20);
 | 
|---|
 | 1682 | 
 | 
|---|
 | 1683 |                 switch ((optmask >> 4) & 3) // get bitmask for flags (eol escapes)
 | 
|---|
 | 1684 |                 {
 | 
|---|
 | 1685 |                 case 0: return strconv_pcdata_impl<opt_false, opt_false>::parse;
 | 
|---|
 | 1686 |                 case 1: return strconv_pcdata_impl<opt_false, opt_true>::parse;
 | 
|---|
 | 1687 |                 case 2: return strconv_pcdata_impl<opt_true, opt_false>::parse;
 | 
|---|
 | 1688 |                 case 3: return strconv_pcdata_impl<opt_true, opt_true>::parse;
 | 
|---|
 | 1689 |                 default: return 0; // should not get here
 | 
|---|
 | 1690 |                 }
 | 
|---|
 | 1691 |         }
 | 
|---|
 | 1692 | 
 | 
|---|
 | 1693 |         typedef char_t* (*strconv_attribute_t)(char_t*, char_t);
 | 
|---|
 | 1694 |         
 | 
|---|
 | 1695 |         template <typename opt_escape> struct strconv_attribute_impl
 | 
|---|
 | 1696 |         {
 | 
|---|
 | 1697 |                 static char_t* parse_wnorm(char_t* s, char_t end_quote)
 | 
|---|
 | 1698 |                 {
 | 
|---|
 | 1699 |                         gap g;
 | 
|---|
 | 1700 | 
 | 
|---|
 | 1701 |                         // trim leading whitespaces
 | 
|---|
 | 1702 |                         if (IS_CHARTYPE(*s, ct_space))
 | 
|---|
 | 1703 |                         {
 | 
|---|
 | 1704 |                                 char_t* str = s;
 | 
|---|
 | 1705 |                                 
 | 
|---|
 | 1706 |                                 do ++str;
 | 
|---|
 | 1707 |                                 while (IS_CHARTYPE(*str, ct_space));
 | 
|---|
 | 1708 |                                 
 | 
|---|
 | 1709 |                                 g.push(s, str - s);
 | 
|---|
 | 1710 |                         }
 | 
|---|
 | 1711 | 
 | 
|---|
 | 1712 |                         while (true)
 | 
|---|
 | 1713 |                         {
 | 
|---|
 | 1714 |                                 while (!IS_CHARTYPE(*s, ct_parse_attr_ws | ct_space)) ++s;
 | 
|---|
 | 1715 |                                 
 | 
|---|
 | 1716 |                                 if (*s == end_quote)
 | 
|---|
 | 1717 |                                 {
 | 
|---|
 | 1718 |                                         char_t* str = g.flush(s);
 | 
|---|
 | 1719 |                                         
 | 
|---|
 | 1720 |                                         do *str-- = 0;
 | 
|---|
 | 1721 |                                         while (IS_CHARTYPE(*str, ct_space));
 | 
|---|
 | 1722 |                                 
 | 
|---|
 | 1723 |                                         return s + 1;
 | 
|---|
 | 1724 |                                 }
 | 
|---|
 | 1725 |                                 else if (IS_CHARTYPE(*s, ct_space))
 | 
|---|
 | 1726 |                                 {
 | 
|---|
 | 1727 |                                         *s++ = ' ';
 | 
|---|
 | 1728 |                 
 | 
|---|
 | 1729 |                                         if (IS_CHARTYPE(*s, ct_space))
 | 
|---|
 | 1730 |                                         {
 | 
|---|
 | 1731 |                                                 char_t* str = s + 1;
 | 
|---|
 | 1732 |                                                 while (IS_CHARTYPE(*str, ct_space)) ++str;
 | 
|---|
 | 1733 |                                                 
 | 
|---|
 | 1734 |                                                 g.push(s, str - s);
 | 
|---|
 | 1735 |                                         }
 | 
|---|
 | 1736 |                                 }
 | 
|---|
 | 1737 |                                 else if (opt_escape::value && *s == '&')
 | 
|---|
 | 1738 |                                 {
 | 
|---|
 | 1739 |                                         s = strconv_escape(s, g);
 | 
|---|
 | 1740 |                                 }
 | 
|---|
 | 1741 |                                 else if (!*s)
 | 
|---|
 | 1742 |                                 {
 | 
|---|
 | 1743 |                                         return 0;
 | 
|---|
 | 1744 |                                 }
 | 
|---|
 | 1745 |                                 else ++s;
 | 
|---|
 | 1746 |                         }
 | 
|---|
 | 1747 |                 }
 | 
|---|
 | 1748 | 
 | 
|---|
 | 1749 |                 static char_t* parse_wconv(char_t* s, char_t end_quote)
 | 
|---|
 | 1750 |                 {
 | 
|---|
 | 1751 |                         gap g;
 | 
|---|
 | 1752 | 
 | 
|---|
 | 1753 |                         while (true)
 | 
|---|
 | 1754 |                         {
 | 
|---|
 | 1755 |                                 while (!IS_CHARTYPE(*s, ct_parse_attr_ws)) ++s;
 | 
|---|
 | 1756 |                                 
 | 
|---|
 | 1757 |                                 if (*s == end_quote)
 | 
|---|
 | 1758 |                                 {
 | 
|---|
 | 1759 |                                         *g.flush(s) = 0;
 | 
|---|
 | 1760 |                                 
 | 
|---|
 | 1761 |                                         return s + 1;
 | 
|---|
 | 1762 |                                 }
 | 
|---|
 | 1763 |                                 else if (IS_CHARTYPE(*s, ct_space))
 | 
|---|
 | 1764 |                                 {
 | 
|---|
 | 1765 |                                         if (*s == '\r')
 | 
|---|
 | 1766 |                                         {
 | 
|---|
 | 1767 |                                                 *s++ = ' ';
 | 
|---|
 | 1768 |                                 
 | 
|---|
 | 1769 |                                                 if (*s == '\n') g.push(s, 1);
 | 
|---|
 | 1770 |                                         }
 | 
|---|
 | 1771 |                                         else *s++ = ' ';
 | 
|---|
 | 1772 |                                 }
 | 
|---|
 | 1773 |                                 else if (opt_escape::value && *s == '&')
 | 
|---|
 | 1774 |                                 {
 | 
|---|
 | 1775 |                                         s = strconv_escape(s, g);
 | 
|---|
 | 1776 |                                 }
 | 
|---|
 | 1777 |                                 else if (!*s)
 | 
|---|
 | 1778 |                                 {
 | 
|---|
 | 1779 |                                         return 0;
 | 
|---|
 | 1780 |                                 }
 | 
|---|
 | 1781 |                                 else ++s;
 | 
|---|
 | 1782 |                         }
 | 
|---|
 | 1783 |                 }
 | 
|---|
 | 1784 | 
 | 
|---|
 | 1785 |                 static char_t* parse_eol(char_t* s, char_t end_quote)
 | 
|---|
 | 1786 |                 {
 | 
|---|
 | 1787 |                         gap g;
 | 
|---|
 | 1788 | 
 | 
|---|
 | 1789 |                         while (true)
 | 
|---|
 | 1790 |                         {
 | 
|---|
 | 1791 |                                 while (!IS_CHARTYPE(*s, ct_parse_attr)) ++s;
 | 
|---|
 | 1792 |                                 
 | 
|---|
 | 1793 |                                 if (*s == end_quote)
 | 
|---|
 | 1794 |                                 {
 | 
|---|
 | 1795 |                                         *g.flush(s) = 0;
 | 
|---|
 | 1796 |                                 
 | 
|---|
 | 1797 |                                         return s + 1;
 | 
|---|
 | 1798 |                                 }
 | 
|---|
 | 1799 |                                 else if (*s == '\r')
 | 
|---|
 | 1800 |                                 {
 | 
|---|
 | 1801 |                                         *s++ = '\n';
 | 
|---|
 | 1802 |                                         
 | 
|---|
 | 1803 |                                         if (*s == '\n') g.push(s, 1);
 | 
|---|
 | 1804 |                                 }
 | 
|---|
 | 1805 |                                 else if (opt_escape::value && *s == '&')
 | 
|---|
 | 1806 |                                 {
 | 
|---|
 | 1807 |                                         s = strconv_escape(s, g);
 | 
|---|
 | 1808 |                                 }
 | 
|---|
 | 1809 |                                 else if (!*s)
 | 
|---|
 | 1810 |                                 {
 | 
|---|
 | 1811 |                                         return 0;
 | 
|---|
 | 1812 |                                 }
 | 
|---|
 | 1813 |                                 else ++s;
 | 
|---|
 | 1814 |                         }
 | 
|---|
 | 1815 |                 }
 | 
|---|
 | 1816 | 
 | 
|---|
 | 1817 |                 static char_t* parse_simple(char_t* s, char_t end_quote)
 | 
|---|
 | 1818 |                 {
 | 
|---|
 | 1819 |                         gap g;
 | 
|---|
 | 1820 | 
 | 
|---|
 | 1821 |                         while (true)
 | 
|---|
 | 1822 |                         {
 | 
|---|
 | 1823 |                                 while (!IS_CHARTYPE(*s, ct_parse_attr)) ++s;
 | 
|---|
 | 1824 |                                 
 | 
|---|
 | 1825 |                                 if (*s == end_quote)
 | 
|---|
 | 1826 |                                 {
 | 
|---|
 | 1827 |                                         *g.flush(s) = 0;
 | 
|---|
 | 1828 |                                 
 | 
|---|
 | 1829 |                                         return s + 1;
 | 
|---|
 | 1830 |                                 }
 | 
|---|
 | 1831 |                                 else if (opt_escape::value && *s == '&')
 | 
|---|
 | 1832 |                                 {
 | 
|---|
 | 1833 |                                         s = strconv_escape(s, g);
 | 
|---|
 | 1834 |                                 }
 | 
|---|
 | 1835 |                                 else if (!*s)
 | 
|---|
 | 1836 |                                 {
 | 
|---|
 | 1837 |                                         return 0;
 | 
|---|
 | 1838 |                                 }
 | 
|---|
 | 1839 |                                 else ++s;
 | 
|---|
 | 1840 |                         }
 | 
|---|
 | 1841 |                 }
 | 
|---|
 | 1842 |         };
 | 
|---|
 | 1843 | 
 | 
|---|
 | 1844 |         strconv_attribute_t get_strconv_attribute(unsigned int optmask)
 | 
|---|
 | 1845 |         {
 | 
|---|
 | 1846 |                 STATIC_ASSERT(parse_escapes == 0x10 && parse_eol == 0x20 && parse_wconv_attribute == 0x40 && parse_wnorm_attribute == 0x80);
 | 
|---|
 | 1847 |                 
 | 
|---|
 | 1848 |                 switch ((optmask >> 4) & 15) // get bitmask for flags (wconv wnorm eol escapes)
 | 
|---|
 | 1849 |                 {
 | 
|---|
 | 1850 |                 case 0:  return strconv_attribute_impl<opt_false>::parse_simple;
 | 
|---|
 | 1851 |                 case 1:  return strconv_attribute_impl<opt_true>::parse_simple;
 | 
|---|
 | 1852 |                 case 2:  return strconv_attribute_impl<opt_false>::parse_eol;
 | 
|---|
 | 1853 |                 case 3:  return strconv_attribute_impl<opt_true>::parse_eol;
 | 
|---|
 | 1854 |                 case 4:  return strconv_attribute_impl<opt_false>::parse_wconv;
 | 
|---|
 | 1855 |                 case 5:  return strconv_attribute_impl<opt_true>::parse_wconv;
 | 
|---|
 | 1856 |                 case 6:  return strconv_attribute_impl<opt_false>::parse_wconv;
 | 
|---|
 | 1857 |                 case 7:  return strconv_attribute_impl<opt_true>::parse_wconv;
 | 
|---|
 | 1858 |                 case 8:  return strconv_attribute_impl<opt_false>::parse_wnorm;
 | 
|---|
 | 1859 |                 case 9:  return strconv_attribute_impl<opt_true>::parse_wnorm;
 | 
|---|
 | 1860 |                 case 10: return strconv_attribute_impl<opt_false>::parse_wnorm;
 | 
|---|
 | 1861 |                 case 11: return strconv_attribute_impl<opt_true>::parse_wnorm;
 | 
|---|
 | 1862 |                 case 12: return strconv_attribute_impl<opt_false>::parse_wnorm;
 | 
|---|
 | 1863 |                 case 13: return strconv_attribute_impl<opt_true>::parse_wnorm;
 | 
|---|
 | 1864 |                 case 14: return strconv_attribute_impl<opt_false>::parse_wnorm;
 | 
|---|
 | 1865 |                 case 15: return strconv_attribute_impl<opt_true>::parse_wnorm;
 | 
|---|
 | 1866 |                 default: return 0; // should not get here
 | 
|---|
 | 1867 |                 }
 | 
|---|
 | 1868 |         }
 | 
|---|
 | 1869 | 
 | 
|---|
 | 1870 |         inline xml_parse_result make_parse_result(xml_parse_status status, ptrdiff_t offset = 0)
 | 
|---|
 | 1871 |         {
 | 
|---|
 | 1872 |                 xml_parse_result result;
 | 
|---|
 | 1873 |                 result.status = status;
 | 
|---|
 | 1874 |                 result.offset = offset;
 | 
|---|
 | 1875 | 
 | 
|---|
 | 1876 |                 return result;
 | 
|---|
 | 1877 |         }
 | 
|---|
 | 1878 | 
 | 
|---|
 | 1879 |         struct xml_parser
 | 
|---|
 | 1880 |         {
 | 
|---|
 | 1881 |                 xml_allocator alloc;
 | 
|---|
 | 1882 |                 char_t* error_offset;
 | 
|---|
 | 1883 |                 jmp_buf error_handler;
 | 
|---|
 | 1884 |                 
 | 
|---|
                // Parser utilities.
                // These macros expand in place and rely on names being in scope at the point
                // of use: s (current position), cursor, optmsk, ch, alloc, error_offset and
                // error_handler.
                //
                // SKIPWS()            - advance s while it points at a ct_space character
                // OPTSET(OPT)         - non-zero when optmsk has any of the OPT bits set
                // PUSHNODE(TYPE)      - append a node of TYPE via append_node and make it the
                //                       cursor; a null result raises status_out_of_memory at s
                // POPNODE()           - move cursor to its parent
                // SCANFOR(X)          - advance s until X holds or the zero terminator is reached
                // SCANWHILE(X)        - advance s while X holds (no terminator check of its own)
                // ENDSEG()            - save *s in ch, overwrite it with zero, step past it
                // THROW_ERROR(err, m) - store m in error_offset and longjmp to error_handler
                //                       with err; control does not return to the expansion site
                // CHECK_ERROR(err, m) - THROW_ERROR(err, m) when s is at the zero terminator
                #define SKIPWS()                        { while (IS_CHARTYPE(*s, ct_space)) ++s; }
                #define OPTSET(OPT)                     ( optmsk & OPT )
                #define PUSHNODE(TYPE)          { cursor = append_node(cursor, alloc, TYPE); if (!cursor) THROW_ERROR(status_out_of_memory, s); }
                #define POPNODE()                       { cursor = cursor->parent; }
                #define SCANFOR(X)                      { while (*s != 0 && !(X)) ++s; }
                #define SCANWHILE(X)            { while ((X)) ++s; }
                #define ENDSEG()                        { ch = *s; *s = 0; ++s; }
                #define THROW_ERROR(err, m)     error_offset = m, longjmp(error_handler, err)
                #define CHECK_ERROR(err, m)     { if (*s == 0) THROW_ERROR(err, m); }
 | 
|---|
 | 1895 |                 
 | 
|---|
 | 1896 |                 xml_parser(const xml_allocator& alloc): alloc(alloc), error_offset(0)
 | 
|---|
 | 1897 |                 {
 | 
|---|
 | 1898 |                 }
 | 
|---|
 | 1899 | 
 | 
|---|
 | 1900 |                 // DOCTYPE consists of nested sections of the following possible types:
 | 
|---|
 | 1901 |                 // <!-- ... -->, <? ... ?>, "...", '...'
 | 
|---|
 | 1902 |                 // <![...]]>
 | 
|---|
 | 1903 |                 // <!...>
 | 
|---|
 | 1904 |                 // First group can not contain nested groups
 | 
|---|
 | 1905 |                 // Second group can contain nested groups of the same type
 | 
|---|
 | 1906 |                 // Third group can contain all other groups
 | 
|---|
 | 1907 |                 char_t* parse_doctype_primitive(char_t* s)
 | 
|---|
 | 1908 |                 {
 | 
|---|
 | 1909 |                         if (*s == '"' || *s == '\'')
 | 
|---|
 | 1910 |                         {
 | 
|---|
 | 1911 |                                 // quoted string
 | 
|---|
 | 1912 |                                 char_t ch = *s++;
 | 
|---|
 | 1913 |                                 SCANFOR(*s == ch);
 | 
|---|
 | 1914 |                                 if (!*s) THROW_ERROR(status_bad_doctype, s);
 | 
|---|
 | 1915 | 
 | 
|---|
 | 1916 |                                 s++;
 | 
|---|
 | 1917 |                         }
 | 
|---|
 | 1918 |                         else if (s[0] == '<' && s[1] == '?')
 | 
|---|
 | 1919 |                         {
 | 
|---|
 | 1920 |                                 // <? ... ?>
 | 
|---|
 | 1921 |                                 s += 2;
 | 
|---|
 | 1922 |                                 SCANFOR(s[0] == '?' && s[1] == '>'); // no need for ENDSWITH because ?> can't terminate proper doctype
 | 
|---|
 | 1923 |                                 if (!*s) THROW_ERROR(status_bad_doctype, s);
 | 
|---|
 | 1924 | 
 | 
|---|
 | 1925 |                                 s += 2;
 | 
|---|
 | 1926 |                         }
 | 
|---|
 | 1927 |                         else if (s[0] == '<' && s[1] == '!' && s[2] == '-' && s[3] == '-')
 | 
|---|
 | 1928 |                         {
 | 
|---|
 | 1929 |                                 s += 4;
 | 
|---|
 | 1930 |                                 SCANFOR(s[0] == '-' && s[1] == '-' && s[2] == '>'); // no need for ENDSWITH because --> can't terminate proper doctype
 | 
|---|
 | 1931 |                                 if (!*s) THROW_ERROR(status_bad_doctype, s);
 | 
|---|
 | 1932 | 
 | 
|---|
 | 1933 |                                 s += 4;
 | 
|---|
 | 1934 |                         }
 | 
|---|
 | 1935 |                         else THROW_ERROR(status_bad_doctype, s);
 | 
|---|
 | 1936 | 
 | 
|---|
 | 1937 |                         return s;
 | 
|---|
 | 1938 |                 }
 | 
|---|
 | 1939 | 
 | 
|---|
 | 1940 |                 char_t* parse_doctype_ignore(char_t* s)
 | 
|---|
 | 1941 |                 {
 | 
|---|
 | 1942 |                         assert(s[0] == '<' && s[1] == '!' && s[2] == '[');
 | 
|---|
 | 1943 |                         s++;
 | 
|---|
 | 1944 | 
 | 
|---|
 | 1945 |                         while (*s)
 | 
|---|
 | 1946 |                         {
 | 
|---|
 | 1947 |                                 if (s[0] == '<' && s[1] == '!' && s[2] == '[')
 | 
|---|
 | 1948 |                                 {
 | 
|---|
 | 1949 |                                         // nested ignore section
 | 
|---|
 | 1950 |                                         s = parse_doctype_ignore(s);
 | 
|---|
 | 1951 |                                 }
 | 
|---|
 | 1952 |                                 else if (s[0] == ']' && s[1] == ']' && s[2] == '>')
 | 
|---|
 | 1953 |                                 {
 | 
|---|
 | 1954 |                                         // ignore section end
 | 
|---|
 | 1955 |                                         s += 3;
 | 
|---|
 | 1956 | 
 | 
|---|
 | 1957 |                                         return s;
 | 
|---|
 | 1958 |                                 }
 | 
|---|
 | 1959 |                                 else s++;
 | 
|---|
 | 1960 |                         }
 | 
|---|
 | 1961 | 
 | 
|---|
 | 1962 |                         THROW_ERROR(status_bad_doctype, s);
 | 
|---|
 | 1963 | 
 | 
|---|
 | 1964 |                         return s;
 | 
|---|
 | 1965 |                 }
 | 
|---|
 | 1966 | 
 | 
|---|
 | 1967 |                 char_t* parse_doctype_group(char_t* s, char_t endch, bool toplevel)
 | 
|---|
 | 1968 |                 {
 | 
|---|
 | 1969 |                         assert(s[0] == '<' && s[1] == '!');
 | 
|---|
 | 1970 |                         s++;
 | 
|---|
 | 1971 | 
 | 
|---|
 | 1972 |                         while (*s)
 | 
|---|
 | 1973 |                         {
 | 
|---|
 | 1974 |                                 if (s[0] == '<' && s[1] == '!' && s[2] != '-')
 | 
|---|
 | 1975 |                                 {
 | 
|---|
 | 1976 |                                         if (s[2] == '[')
 | 
|---|
 | 1977 |                                         {
 | 
|---|
 | 1978 |                                                 // ignore
 | 
|---|
 | 1979 |                                                 s = parse_doctype_ignore(s);
 | 
|---|
 | 1980 |                                         }
 | 
|---|
 | 1981 |                                         else
 | 
|---|
 | 1982 |                                         {
 | 
|---|
 | 1983 |                                                 // some control group
 | 
|---|
 | 1984 |                                                 s = parse_doctype_group(s, endch, false);
 | 
|---|
 | 1985 |                                         }
 | 
|---|
 | 1986 |                                 }
 | 
|---|
 | 1987 |                                 else if (s[0] == '<' || s[0] == '"' || s[0] == '\'')
 | 
|---|
 | 1988 |                                 {
 | 
|---|
 | 1989 |                                         // unknown tag (forbidden), or some primitive group
 | 
|---|
 | 1990 |                                         s = parse_doctype_primitive(s);
 | 
|---|
 | 1991 |                                 }
 | 
|---|
 | 1992 |                                 else if (*s == '>')
 | 
|---|
 | 1993 |                                 {
 | 
|---|
 | 1994 |                                         s++;
 | 
|---|
 | 1995 | 
 | 
|---|
 | 1996 |                                         return s;
 | 
|---|
 | 1997 |                                 }
 | 
|---|
 | 1998 |                                 else s++;
 | 
|---|
 | 1999 |                         }
 | 
|---|
 | 2000 | 
 | 
|---|
 | 2001 |                         if (!toplevel || endch != '>') THROW_ERROR(status_bad_doctype, s);
 | 
|---|
 | 2002 | 
 | 
|---|
 | 2003 |                         return s;
 | 
|---|
 | 2004 |                 }
 | 
|---|
 | 2005 | 
 | 
|---|
 | 2006 |                 char_t* parse_exclamation(char_t* s, xml_node_struct* cursor, unsigned int optmsk, char_t endch)
 | 
|---|
 | 2007 |                 {
 | 
|---|
 | 2008 |                         // parse node contents, starting with exclamation mark
 | 
|---|
 | 2009 |                         ++s;
 | 
|---|
 | 2010 | 
 | 
|---|
 | 2011 |                         if (*s == '-') // '<!-...'
 | 
|---|
 | 2012 |                         {
 | 
|---|
 | 2013 |                                 ++s;
 | 
|---|
 | 2014 | 
 | 
|---|
 | 2015 |                                 if (*s == '-') // '<!--...'
 | 
|---|
 | 2016 |                                 {
 | 
|---|
 | 2017 |                                         ++s;
 | 
|---|
 | 2018 | 
 | 
|---|
 | 2019 |                                         if (OPTSET(parse_comments))
 | 
|---|
 | 2020 |                                         {
 | 
|---|
 | 2021 |                                                 PUSHNODE(node_comment); // Append a new node on the tree.
 | 
|---|
 | 2022 |                                                 cursor->value = s; // Save the offset.
 | 
|---|
 | 2023 |                                         }
 | 
|---|
 | 2024 | 
 | 
|---|
 | 2025 |                                         if (OPTSET(parse_eol) && OPTSET(parse_comments))
 | 
|---|
 | 2026 |                                         {
 | 
|---|
 | 2027 |                                                 s = strconv_comment(s, endch);
 | 
|---|
 | 2028 | 
 | 
|---|
 | 2029 |                                                 if (!s) THROW_ERROR(status_bad_comment, cursor->value);
 | 
|---|
 | 2030 |                                         }
 | 
|---|
 | 2031 |                                         else
 | 
|---|
 | 2032 |                                         {
 | 
|---|
 | 2033 |                                                 // Scan for terminating '-->'.
 | 
|---|
 | 2034 |                                                 SCANFOR(s[0] == '-' && s[1] == '-' && ENDSWITH(s[2], '>'));
 | 
|---|
 | 2035 |                                                 CHECK_ERROR(status_bad_comment, s);
 | 
|---|
 | 2036 | 
 | 
|---|
 | 2037 |                                                 if (OPTSET(parse_comments))
 | 
|---|
 | 2038 |                                                         *s = 0; // Zero-terminate this segment at the first terminating '-'.
 | 
|---|
 | 2039 | 
 | 
|---|
 | 2040 |                                                 s += (s[2] == '>' ? 3 : 2); // Step over the '\0->'.
 | 
|---|
 | 2041 |                                         }
 | 
|---|
 | 2042 |                                 }
 | 
|---|
 | 2043 |                                 else THROW_ERROR(status_bad_comment, s);
 | 
|---|
 | 2044 |                         }
 | 
|---|
 | 2045 |                         else if (*s == '[')
 | 
|---|
 | 2046 |                         {
 | 
|---|
 | 2047 |                                 // '<![CDATA[...'
 | 
|---|
 | 2048 |                                 if (*++s=='C' && *++s=='D' && *++s=='A' && *++s=='T' && *++s=='A' && *++s == '[')
 | 
|---|
 | 2049 |                                 {
 | 
|---|
 | 2050 |                                         ++s;
 | 
|---|
 | 2051 | 
 | 
|---|
 | 2052 |                                         if (OPTSET(parse_cdata))
 | 
|---|
 | 2053 |                                         {
 | 
|---|
 | 2054 |                                                 PUSHNODE(node_cdata); // Append a new node on the tree.
 | 
|---|
 | 2055 |                                                 cursor->value = s; // Save the offset.
 | 
|---|
 | 2056 | 
 | 
|---|
 | 2057 |                                                 if (OPTSET(parse_eol))
 | 
|---|
 | 2058 |                                                 {
 | 
|---|
 | 2059 |                                                         s = strconv_cdata(s, endch);
 | 
|---|
 | 2060 | 
 | 
|---|
 | 2061 |                                                         if (!s) THROW_ERROR(status_bad_cdata, cursor->value);
 | 
|---|
 | 2062 |                                                 }
 | 
|---|
 | 2063 |                                                 else
 | 
|---|
 | 2064 |                                                 {
 | 
|---|
 | 2065 |                                                         // Scan for terminating ']]>'.
 | 
|---|
 | 2066 |                                                         SCANFOR(s[0] == ']' && s[1] == ']' && ENDSWITH(s[2], '>'));
 | 
|---|
 | 2067 |                                                         CHECK_ERROR(status_bad_cdata, s);
 | 
|---|
 | 2068 | 
 | 
|---|
 | 2069 |                                                         *s++ = 0; // Zero-terminate this segment.
 | 
|---|
 | 2070 |                                                 }
 | 
|---|
 | 2071 |                                         }
 | 
|---|
 | 2072 |                                         else // Flagged for discard, but we still have to scan for the terminator.
 | 
|---|
 | 2073 |                                         {
 | 
|---|
 | 2074 |                                                 // Scan for terminating ']]>'.
 | 
|---|
 | 2075 |                                                 SCANFOR(s[0] == ']' && s[1] == ']' && ENDSWITH(s[2], '>'));
 | 
|---|
 | 2076 |                                                 CHECK_ERROR(status_bad_cdata, s);
 | 
|---|
 | 2077 | 
 | 
|---|
 | 2078 |                                                 ++s;
 | 
|---|
 | 2079 |                                         }
 | 
|---|
 | 2080 | 
 | 
|---|
 | 2081 |                                         s += (s[1] == '>' ? 2 : 1); // Step over the last ']>'.
 | 
|---|
 | 2082 |                                 }
 | 
|---|
 | 2083 |                                 else THROW_ERROR(status_bad_cdata, s);
 | 
|---|
 | 2084 |                         }
 | 
|---|
 | 2085 |                         else if (s[0] == 'D' && s[1] == 'O' && s[2] == 'C' && s[3] == 'T' && s[4] == 'Y' && s[5] == 'P' && ENDSWITH(s[6], 'E'))
 | 
|---|
 | 2086 |                         {
 | 
|---|
 | 2087 |                                 s -= 2;
 | 
|---|
 | 2088 | 
 | 
|---|
 | 2089 |                 if (cursor->parent) THROW_ERROR(status_bad_doctype, s);
 | 
|---|
 | 2090 | 
 | 
|---|
 | 2091 |                 char_t* mark = s + 9;
 | 
|---|
 | 2092 | 
 | 
|---|
 | 2093 |                                 s = parse_doctype_group(s, endch, true);
 | 
|---|
 | 2094 | 
 | 
|---|
 | 2095 |                 if (OPTSET(parse_doctype))
 | 
|---|
 | 2096 |                 {
 | 
|---|
 | 2097 |                     while (IS_CHARTYPE(*mark, ct_space)) ++mark;
 | 
|---|
 | 2098 | 
 | 
|---|
 | 2099 |                     PUSHNODE(node_doctype);
 | 
|---|
 | 2100 | 
 | 
|---|
 | 2101 |                     cursor->value = mark;
 | 
|---|
 | 2102 | 
 | 
|---|
 | 2103 |                     assert((s[0] == 0 && endch == '>') || s[-1] == '>');
 | 
|---|
 | 2104 |                     s[*s == 0 ? 0 : -1] = 0;
 | 
|---|
 | 2105 | 
 | 
|---|
 | 2106 |                     POPNODE();
 | 
|---|
 | 2107 |                 }
 | 
|---|
 | 2108 |                         }
 | 
|---|
 | 2109 |                         else if (*s == 0 && endch == '-') THROW_ERROR(status_bad_comment, s);
 | 
|---|
 | 2110 |                         else if (*s == 0 && endch == '[') THROW_ERROR(status_bad_cdata, s);
 | 
|---|
 | 2111 |                         else THROW_ERROR(status_unrecognized_tag, s);
 | 
|---|
 | 2112 | 
 | 
|---|
 | 2113 |                         return s;
 | 
|---|
 | 2114 |                 }
 | 
|---|
 | 2115 | 
 | 
|---|
                // Parses a '<?target ...?>' construct: either the XML declaration (target is "xml" in any
                // letter case) or an ordinary processing instruction.
                //
                // s          - points at the '?' that follows '<'; it is stepped over first.
                // ref_cursor - current tree node. It is copied into a local on entry and written back just
                //              before returning. For a declaration that has content after the target, the
                //              cursor is left on the new node_declaration node (see comment near the end).
                // optmsk     - parse option flags, queried via OPTSET(parse_declaration) / OPTSET(parse_pi).
                // endch      - not referenced directly in this body.
                //              NOTE(review): presumably consumed by the ENDSWITH macro - confirm.
                //
                // Returns the position from which the caller should continue parsing.
                // Malformed input is reported through THROW_ERROR(status_bad_pi, position).
                // NOTE(review): THROW_ERROR is defined outside this view; presumably it does not return - confirm.
                char_t* parse_question(char_t* s, xml_node_struct*& ref_cursor, unsigned int optmsk, char_t endch)
                {
                        // load into registers
                        xml_node_struct* cursor = ref_cursor;
                        char_t ch = 0; // compared below after each ENDSEG(); ENDSEG is expected to store the overwritten character here

                        // parse node contents, starting with question mark
                        ++s;

                        // read PI target
                        char_t* target = s;

                        // the target has to begin with a valid name start character
                        if (!IS_CHARTYPE(*s, ct_start_symbol)) THROW_ERROR(status_bad_pi, s);

                        // advance s past the remaining name characters of the target
                        SCANWHILE(IS_CHARTYPE(*s, ct_symbol));
                        CHECK_ERROR(status_bad_pi, s);

                        // determine node type; stricmp / strcasecmp is not portable
                        // (c | ' ') sets bit 0x20, which folds ASCII upper-case letters to lower case;
                        // target + 3 == s requires the target to be exactly three characters long
                        bool declaration = (target[0] | ' ') == 'x' && (target[1] | ' ') == 'm' && (target[2] | ' ') == 'l' && target + 3 == s;

                        // build a node only if the option matching this construct's kind is enabled
                        if (declaration ? OPTSET(parse_declaration) : OPTSET(parse_pi))
                        {
                                if (declaration)
                                {
                                        // disallow non top-level declarations
                                        if (cursor->parent) THROW_ERROR(status_bad_pi, s);

                                        PUSHNODE(node_declaration);
                                }
                                else
                                {
                                        PUSHNODE(node_pi);
                                }

                                cursor->name = target;

                                // terminate the target name in place; the character that followed it is examined via ch
                                ENDSEG();

                                // parse value/attributes
                                if (ch == '?')
                                {
                                        // empty node
                                        if (!ENDSWITH(*s, '>')) THROW_ERROR(status_bad_pi, s);
                                        s += (*s == '>'); // step over '>' only if it is actually present

                                        POPNODE();
                                }
                                else if (IS_CHARTYPE(ch, ct_space))
                                {
                                        SKIPWS();

                                        // scan for tag end
                                        char_t* value = s;

                                        SCANFOR(s[0] == '?' && ENDSWITH(s[1], '>'));
                                        CHECK_ERROR(status_bad_pi, s);

                                        if (declaration)
                                        {
                                                // replace ending ? with / so that 'element' terminates properly
                                                *s = '/';

                                                // we exit from this function with cursor at node_declaration, which is a signal to parse() to go to LOC_ATTRIBUTES
                                                // (s is rewound to the start of the content so the attributes are parsed from there)
                                                s = value;
                                        }
                                        else
                                        {
                                                // store value and step over >
                                                cursor->value = value;
                                                POPNODE();

                                                // s is at the closing '?': terminate the value there and move past it
                                                ENDSEG();

                                                s += (*s == '>'); // step over '>' only if it is actually present
                                        }
                                }
                                else THROW_ERROR(status_bad_pi, s); // target followed by neither '?' nor whitespace
                        }
                        else
                        {
                                // no node is wanted for this construct: just skip it
                                // scan for tag end
                                SCANFOR(s[0] == '?' && ENDSWITH(s[1], '>'));
                                CHECK_ERROR(status_bad_pi, s);

                                // skip "?>", or only "?" when the '>' is not in the buffer
                                s += (s[1] == '>' ? 2 : 1);
                        }

                        // store from registers
                        ref_cursor = cursor;

                        return s;
                }
 | 
|---|
 | 2208 | 
 | 
|---|
                // Main parsing loop: walks the zero-terminated buffer starting at s and builds the node tree,
                // starting with xmldoc as the current node (cursor).
                //
                // s      - start of the buffer. The buffer is modified while parsing: names and values are
                //          referenced in place (node/attribute pointers are set to positions inside it).
                // xmldoc - initial cursor; parsing must end with the cursor back on this node, otherwise
                //          status_end_element_mismatch is raised.
                // optmsk - parse option flags; selects the attribute / PCDATA conversion routines and is
                //          queried via OPTSET.
                // endch  - the buffer's original last character. The static parse() overload in this file saves
                //          it and overwrites it with 0 before calling this function, so wherever the terminating
                //          zero is met in a place where one more character is expected, endch is checked instead
                //          (e.g. `*s == 0 && endch == '>'`).
                //
                // Errors are reported through THROW_ERROR(status, position).
                // NOTE(review): THROW_ERROR is defined outside this view; presumably it does not return - confirm.
                void parse(char_t* s, xml_node_struct* xmldoc, unsigned int optmsk, char_t endch)
                {
                        // pick the value conversion routines that match the parse options once, up front
                        strconv_attribute_t strconv_attribute = get_strconv_attribute(optmsk);
                        strconv_pcdata_t strconv_pcdata = get_strconv_pcdata(optmsk);

                        char_t ch = 0;
                        xml_node_struct* cursor = xmldoc;
                        char_t* mark = s;

                        while (*s != 0)
                        {
                                if (*s == '<')
                                {
                                        ++s;

                                // s is positioned right after a '<'; also entered via goto from the PCDATA branch below
                                LOC_TAG:
                                        if (IS_CHARTYPE(*s, ct_start_symbol)) // '<#...'
                                        {
                                                PUSHNODE(node_element); // Append a new node to the tree.

                                                cursor->name = s;

                                                SCANWHILE(IS_CHARTYPE(*s, ct_symbol)); // Scan for a terminator.
                                                ENDSEG(); // Save char in 'ch', terminate & step over.

                                                if (ch == '>')
                                                {
                                                        // end of tag
                                                }
                                                else if (IS_CHARTYPE(ch, ct_space))
                                                {
                                                // attribute list; also entered via goto after parse_question() leaves the cursor on a declaration node
                                                LOC_ATTRIBUTES:
                                                        while (true)
                                                        {
                                                                SKIPWS(); // Eat any whitespace.

                                                                if (IS_CHARTYPE(*s, ct_start_symbol)) // <... #...
                                                                {
                                                                        xml_attribute_struct* a = append_attribute_ll(cursor, alloc); // Make space for this attribute.
                                                                        if (!a) THROW_ERROR(status_out_of_memory, s);

                                                                        a->name = s; // Save the offset.

                                                                        SCANWHILE(IS_CHARTYPE(*s, ct_symbol)); // Scan for a terminator.
                                                                        CHECK_ERROR(status_bad_attribute, s); //$ redundant, left for performance

                                                                        ENDSEG(); // Save char in 'ch', terminate & step over.
                                                                        CHECK_ERROR(status_bad_attribute, s); //$ redundant, left for performance

                                                                        // whitespace is allowed between the attribute name and '='
                                                                        if (IS_CHARTYPE(ch, ct_space))
                                                                        {
                                                                                SKIPWS(); // Eat any whitespace.
                                                                                CHECK_ERROR(status_bad_attribute, s); //$ redundant, left for performance

                                                                                // fetch the first non-space character, which should be '='
                                                                                ch = *s;
                                                                                ++s;
                                                                        }

                                                                        if (ch == '=') // '<... #=...'
                                                                        {
                                                                                SKIPWS(); // Eat any whitespace.

                                                                                if (*s == '"' || *s == '\'') // '<... #="...'
                                                                                {
                                                                                        ch = *s; // Save quote char to avoid breaking on "''" -or- '""'.
                                                                                        ++s; // Step over the quote.
                                                                                        a->value = s; // Save the offset.

                                                                                        // convert the value; the quote character is passed as the terminator to look for
                                                                                        s = strconv_attribute(s, ch);

                                                                                        // a null result means the conversion failed; report the value start as the error position
                                                                                        if (!s) THROW_ERROR(status_bad_attribute, a->value);

                                                                                        // After this line the loop continues from the start;
                                                                                        // Whitespaces, / and > are ok, symbols and EOF are wrong,
                                                                                        // everything else will be detected
                                                                                        if (IS_CHARTYPE(*s, ct_start_symbol)) THROW_ERROR(status_bad_attribute, s);
                                                                                }
                                                                                else THROW_ERROR(status_bad_attribute, s); // value is not quoted
                                                                        }
                                                                        else THROW_ERROR(status_bad_attribute, s); // attribute name is not followed by '='
                                                                }
                                                                else if (*s == '/')
                                                                {
                                                                        ++s;

                                                                        if (*s == '>')
                                                                        {
                                                                                // '/>' closes the node right away
                                                                                POPNODE();
                                                                                s++;
                                                                                break;
                                                                        }
                                                                        else if (*s == 0 && endch == '>')
                                                                        {
                                                                                // same as above, but the '>' was the buffer's last character
                                                                                POPNODE();
                                                                                break;
                                                                        }
                                                                        else THROW_ERROR(status_bad_start_element, s);
                                                                }
                                                                else if (*s == '>')
                                                                {
                                                                        // end of the start tag; the node stays open
                                                                        ++s;

                                                                        break;
                                                                }
                                                                else if (*s == 0 && endch == '>')
                                                                {
                                                                        // end of the start tag where '>' was the buffer's last character
                                                                        break;
                                                                }
                                                                else THROW_ERROR(status_bad_start_element, s);
                                                        }

                                                        // !!!
                                                }
                                                else if (ch == '/') // '<#.../'
                                                {
                                                        if (!ENDSWITH(*s, '>')) THROW_ERROR(status_bad_start_element, s);

                                                        POPNODE(); // Pop.

                                                        s += (*s == '>'); // step over '>' only if it is actually present
                                                }
                                                else if (ch == 0)
                                                {
                                                        // we stepped over null terminator, backtrack & handle closing tag
                                                        --s;

                                                        // the tag is only complete if the character removed from the end of the buffer was '>'
                                                        if (endch != '>') THROW_ERROR(status_bad_start_element, s);
                                                }
                                                else THROW_ERROR(status_bad_start_element, s);
                                        }
                                        else if (*s == '/')
                                        {
                                                // closing tag: its name has to match the name of the current node
                                                ++s;

                                                char_t* name = cursor->name;
                                                if (!name) THROW_ERROR(status_end_element_mismatch, s);

                                                // compare character by character while the input still has name characters
                                                while (IS_CHARTYPE(*s, ct_symbol))
                                                {
                                                        if (*s++ != *name++) THROW_ERROR(status_end_element_mismatch, s);
                                                }

                                                // the input name ended before the current node's name did
                                                if (*name)
                                                {
                                                        // at the end of the buffer, with exactly one name character left that equals endch:
                                                        // the name is complete once endch is taken into account, so the defect is the missing '>'
                                                        if (*s == 0 && name[0] == endch && name[1] == 0) THROW_ERROR(status_bad_end_element, s);
                                                        else THROW_ERROR(status_end_element_mismatch, s);
                                                }

                                                POPNODE(); // Pop.

                                                SKIPWS();

                                                if (*s == 0)
                                                {
                                                        // end of the buffer: fine only if the removed last character was the '>'
                                                        if (endch != '>') THROW_ERROR(status_bad_end_element, s);
                                                }
                                                else
                                                {
                                                        if (*s != '>') THROW_ERROR(status_bad_end_element, s);
                                                        ++s;
                                                }
                                        }
                                        else if (*s == '?') // '<?...'
                                        {
                                                s = parse_question(s, cursor, optmsk, endch);

                                                assert(cursor);
                                                // the node type is read from the header bits (stored value + 1); a declaration node here means
                                                // parse_question() left its content for the attribute loop to parse
                                                if ((cursor->header & xml_memory_page_type_mask) + 1 == node_declaration) goto LOC_ATTRIBUTES;
                                        }
                                        else if (*s == '!') // '<!...'
                                        {
                                                s = parse_exclamation(s, cursor, optmsk, endch);
                                        }
                                        else if (*s == 0 && endch == '?') THROW_ERROR(status_bad_pi, s); // buffer ended with '<?'
                                        else THROW_ERROR(status_unrecognized_tag, s);
                                }
                                else
                                {
                                        mark = s; // Save this offset while searching for a terminator.

                                        SKIPWS(); // Eat whitespace if no genuine PCDATA here.

                                        // nothing but (possibly empty) whitespace before the next '<' or the end of the buffer:
                                        // drop it, unless whitespace-only PCDATA is requested and some whitespace was actually consumed
                                        if ((!OPTSET(parse_ws_pcdata) || mark == s) && (*s == '<' || !*s))
                                        {
                                                continue;
                                        }

                                        // rewind so that leading whitespace is part of the text
                                        s = mark;

                                        if (cursor->parent)
                                        {
                                                PUSHNODE(node_pcdata); // Append a new node on the tree.
                                                cursor->value = s; // Save the offset.

                                                s = strconv_pcdata(s);

                                                POPNODE(); // Pop since this is a standalone.

                                                if (!*s) break;
                                        }
                                        else
                                        {
                                                // text at the top level (cursor has no parent) produces no node; skip to the next tag
                                                SCANFOR(*s == '<'); // '...<'
                                                if (!*s) break;

                                                ++s;
                                        }

                                        // We're after '<'
                                        goto LOC_TAG;
                                }
                        }

                        // check that last tag is closed
                        if (cursor != xmldoc) THROW_ERROR(status_end_element_mismatch, s);
                }
 | 
|---|
 | 2425 | 
 | 
|---|
 | 2426 |                 static xml_parse_result parse(char_t* buffer, size_t length, xml_node_struct* root, unsigned int optmsk)
 | 
|---|
 | 2427 |                 {
 | 
|---|
 | 2428 |                         xml_document_struct* xmldoc = static_cast<xml_document_struct*>(root);
 | 
|---|
 | 2429 | 
 | 
|---|
 | 2430 |                         // store buffer for offset_debug
 | 
|---|
 | 2431 |                         xmldoc->buffer = buffer;
 | 
|---|
 | 2432 | 
 | 
|---|
 | 2433 |                         // early-out for empty documents
 | 
|---|
 | 2434 |                         if (length == 0) return make_parse_result(status_ok);
 | 
|---|
 | 2435 | 
 | 
|---|
 | 2436 |                         // create parser on stack
 | 
|---|
 | 2437 |                         xml_parser parser(*xmldoc);
 | 
|---|
 | 2438 | 
 | 
|---|
 | 2439 |                         // save last character and make buffer zero-terminated (speeds up parsing)
 | 
|---|
 | 2440 |                         char_t endch = buffer[length - 1];
 | 
|---|
 | 2441 |                         buffer[length - 1] = 0;
 | 
|---|
 | 2442 |                         
 | 
|---|
 | 2443 |                         // perform actual parsing
 | 
|---|
 | 2444 |                         int error = setjmp(parser.error_handler);
 | 
|---|
 | 2445 | 
 | 
|---|
 | 2446 |                         if (error == 0)
 | 
|---|
 | 2447 |                         {
 | 
|---|
 | 2448 |                                 parser.parse(buffer, xmldoc, optmsk, endch);
 | 
|---|
 | 2449 |                         }
 | 
|---|
 | 2450 | 
 | 
|---|
 | 2451 |                         xml_parse_result result = make_parse_result(static_cast<xml_parse_status>(error), parser.error_offset ? parser.error_offset - buffer : 0);
 | 
|---|
 | 2452 |                         assert(result.offset >= 0 && static_cast<size_t>(result.offset) <= length);
 | 
|---|
 | 2453 | 
 | 
|---|
 | 2454 |                         // update allocator state
 | 
|---|
 | 2455 |                         *static_cast<xml_allocator*>(xmldoc) = parser.alloc;
 | 
|---|
 | 2456 | 
 | 
|---|
 | 2457 |                         // since we removed last character, we have to handle the only possible false positive
 | 
|---|
 | 2458 |                         if (result && endch == '<')
 | 
|---|
 | 2459 |                         {
 | 
|---|
 | 2460 |                                 // there's no possible well-formed document with < at the end
 | 
|---|
 | 2461 |                                 return make_parse_result(status_unrecognized_tag, length);
 | 
|---|
 | 2462 |                         }
 | 
|---|
 | 2463 | 
 | 
|---|
 | 2464 |                         return result;
 | 
|---|
 | 2465 |                 }
 | 
|---|
 | 2466 |         };
 | 
|---|
 | 2467 | 
 | 
|---|
 | 2468 |         // Output facilities
 | 
|---|
 | 2469 |         xml_encoding get_write_native_encoding()
 | 
|---|
 | 2470 |         {
 | 
|---|
 | 2471 |         #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 2472 |                 return get_wchar_encoding();
 | 
|---|
 | 2473 |         #else
 | 
|---|
 | 2474 |                 return encoding_utf8;
 | 
|---|
 | 2475 |         #endif
 | 
|---|
 | 2476 |         }
 | 
|---|
 | 2477 | 
 | 
|---|
 | 2478 |         xml_encoding get_write_encoding(xml_encoding encoding)
 | 
|---|
 | 2479 |         {
 | 
|---|
 | 2480 |                 // replace wchar encoding with utf implementation
 | 
|---|
 | 2481 |                 if (encoding == encoding_wchar) return get_wchar_encoding();
 | 
|---|
 | 2482 | 
 | 
|---|
 | 2483 |                 // replace utf16 encoding with utf16 with specific endianness
 | 
|---|
 | 2484 |                 if (encoding == encoding_utf16) return is_little_endian() ? encoding_utf16_le : encoding_utf16_be;
 | 
|---|
 | 2485 | 
 | 
|---|
 | 2486 |                 // replace utf32 encoding with utf32 with specific endianness
 | 
|---|
 | 2487 |                 if (encoding == encoding_utf32) return is_little_endian() ? encoding_utf32_le : encoding_utf32_be;
 | 
|---|
 | 2488 | 
 | 
|---|
 | 2489 |                 // only do autodetection if no explicit encoding is requested
 | 
|---|
 | 2490 |                 if (encoding != encoding_auto) return encoding;
 | 
|---|
 | 2491 | 
 | 
|---|
 | 2492 |                 // assume utf8 encoding
 | 
|---|
 | 2493 |                 return encoding_utf8;
 | 
|---|
 | 2494 |         }
 | 
|---|
 | 2495 | 
 | 
|---|
 | 2496 | #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 2497 |         size_t get_valid_length(const char_t* data, size_t length)
 | 
|---|
 | 2498 |         {
 | 
|---|
 | 2499 |                 assert(length > 0);
 | 
|---|
 | 2500 | 
 | 
|---|
 | 2501 |                 // discard last character if it's the lead of a surrogate pair 
 | 
|---|
 | 2502 |                 return (sizeof(wchar_t) == 2 && (unsigned)(static_cast<uint16_t>(data[length - 1]) - 0xD800) < 0x400) ? length - 1 : length;
 | 
|---|
 | 2503 |         }
 | 
|---|
 | 2504 | 
 | 
|---|
 | 2505 |         size_t convert_buffer(char* result, const char_t* data, size_t length, xml_encoding encoding)
 | 
|---|
 | 2506 |         {
 | 
|---|
 | 2507 |                 // only endian-swapping is required
 | 
|---|
 | 2508 |                 if (need_endian_swap_utf(encoding, get_wchar_encoding()))
 | 
|---|
 | 2509 |                 {
 | 
|---|
 | 2510 |                         convert_wchar_endian_swap(reinterpret_cast<char_t*>(result), data, length);
 | 
|---|
 | 2511 | 
 | 
|---|
 | 2512 |                         return length * sizeof(char_t);
 | 
|---|
 | 2513 |                 }
 | 
|---|
 | 2514 |         
 | 
|---|
 | 2515 |                 // convert to utf8
 | 
|---|
 | 2516 |                 if (encoding == encoding_utf8)
 | 
|---|
 | 2517 |                 {
 | 
|---|
 | 2518 |                         uint8_t* dest = reinterpret_cast<uint8_t*>(result);
 | 
|---|
 | 2519 | 
 | 
|---|
 | 2520 |                         uint8_t* end = sizeof(wchar_t) == 2 ?
 | 
|---|
 | 2521 |                                 utf_decoder<utf8_writer>::decode_utf16_block(reinterpret_cast<const uint16_t*>(data), length, dest) :
 | 
|---|
 | 2522 |                                 utf_decoder<utf8_writer>::decode_utf32_block(reinterpret_cast<const uint32_t*>(data), length, dest);
 | 
|---|
 | 2523 | 
 | 
|---|
 | 2524 |                         return static_cast<size_t>(end - dest);
 | 
|---|
 | 2525 |                 }
 | 
|---|
 | 2526 | 
 | 
|---|
 | 2527 |                 // convert to utf16
 | 
|---|
 | 2528 |                 if (encoding == encoding_utf16_be || encoding == encoding_utf16_le)
 | 
|---|
 | 2529 |                 {
 | 
|---|
 | 2530 |                         uint16_t* dest = reinterpret_cast<uint16_t*>(result);
 | 
|---|
 | 2531 | 
 | 
|---|
 | 2532 |                         // convert to native utf16
 | 
|---|
 | 2533 |                         uint16_t* end = utf_decoder<utf16_writer>::decode_utf32_block(reinterpret_cast<const uint32_t*>(data), length, dest);
 | 
|---|
 | 2534 | 
 | 
|---|
 | 2535 |                         // swap if necessary
 | 
|---|
 | 2536 |                         xml_encoding native_encoding = is_little_endian() ? encoding_utf16_le : encoding_utf16_be;
 | 
|---|
 | 2537 | 
 | 
|---|
 | 2538 |                         if (native_encoding != encoding) convert_utf_endian_swap(dest, dest, static_cast<size_t>(end - dest));
 | 
|---|
 | 2539 | 
 | 
|---|
 | 2540 |                         return static_cast<size_t>(end - dest) * sizeof(uint16_t);
 | 
|---|
 | 2541 |                 }
 | 
|---|
 | 2542 | 
 | 
|---|
 | 2543 |                 // convert to utf32
 | 
|---|
 | 2544 |                 if (encoding == encoding_utf32_be || encoding == encoding_utf32_le)
 | 
|---|
 | 2545 |                 {
 | 
|---|
 | 2546 |                         uint32_t* dest = reinterpret_cast<uint32_t*>(result);
 | 
|---|
 | 2547 | 
 | 
|---|
 | 2548 |                         // convert to native utf32
 | 
|---|
 | 2549 |                         uint32_t* end = utf_decoder<utf32_writer>::decode_utf16_block(reinterpret_cast<const uint16_t*>(data), length, dest);
 | 
|---|
 | 2550 | 
 | 
|---|
 | 2551 |                         // swap if necessary
 | 
|---|
 | 2552 |                         xml_encoding native_encoding = is_little_endian() ? encoding_utf32_le : encoding_utf32_be;
 | 
|---|
 | 2553 | 
 | 
|---|
 | 2554 |                         if (native_encoding != encoding) convert_utf_endian_swap(dest, dest, static_cast<size_t>(end - dest));
 | 
|---|
 | 2555 | 
 | 
|---|
 | 2556 |                         return static_cast<size_t>(end - dest) * sizeof(uint32_t);
 | 
|---|
 | 2557 |                 }
 | 
|---|
 | 2558 | 
 | 
|---|
 | 2559 |                 assert(!"Invalid encoding");
 | 
|---|
 | 2560 |                 return 0;
 | 
|---|
 | 2561 |         }
 | 
|---|
 | 2562 | #else
 | 
|---|
 | 2563 |         size_t get_valid_length(const char_t* data, size_t length)
 | 
|---|
 | 2564 |         {
 | 
|---|
 | 2565 |                 assert(length > 4);
 | 
|---|
 | 2566 | 
 | 
|---|
 | 2567 |                 for (size_t i = 1; i <= 4; ++i)
 | 
|---|
 | 2568 |                 {
 | 
|---|
 | 2569 |                         uint8_t ch = static_cast<uint8_t>(data[length - i]);
 | 
|---|
 | 2570 | 
 | 
|---|
 | 2571 |                         // either a standalone character or a leading one
 | 
|---|
 | 2572 |                         if ((ch & 0xc0) != 0x80) return length - i;
 | 
|---|
 | 2573 |                 }
 | 
|---|
 | 2574 | 
 | 
|---|
 | 2575 |                 // there are four non-leading characters at the end, sequence tail is broken so might as well process the whole chunk
 | 
|---|
 | 2576 |                 return length;
 | 
|---|
 | 2577 |         }
 | 
|---|
 | 2578 | 
 | 
|---|
 | 2579 |         size_t convert_buffer(char* result, const char_t* data, size_t length, xml_encoding encoding)
 | 
|---|
 | 2580 |         {
 | 
|---|
 | 2581 |                 if (encoding == encoding_utf16_be || encoding == encoding_utf16_le)
 | 
|---|
 | 2582 |                 {
 | 
|---|
 | 2583 |                         uint16_t* dest = reinterpret_cast<uint16_t*>(result);
 | 
|---|
 | 2584 | 
 | 
|---|
 | 2585 |                         // convert to native utf16
 | 
|---|
 | 2586 |                         uint16_t* end = utf_decoder<utf16_writer>::decode_utf8_block(reinterpret_cast<const uint8_t*>(data), length, dest);
 | 
|---|
 | 2587 | 
 | 
|---|
 | 2588 |                         // swap if necessary
 | 
|---|
 | 2589 |                         xml_encoding native_encoding = is_little_endian() ? encoding_utf16_le : encoding_utf16_be;
 | 
|---|
 | 2590 | 
 | 
|---|
 | 2591 |                         if (native_encoding != encoding) convert_utf_endian_swap(dest, dest, static_cast<size_t>(end - dest));
 | 
|---|
 | 2592 | 
 | 
|---|
 | 2593 |                         return static_cast<size_t>(end - dest) * sizeof(uint16_t);
 | 
|---|
 | 2594 |                 }
 | 
|---|
 | 2595 | 
 | 
|---|
 | 2596 |                 if (encoding == encoding_utf32_be || encoding == encoding_utf32_le)
 | 
|---|
 | 2597 |                 {
 | 
|---|
 | 2598 |                         uint32_t* dest = reinterpret_cast<uint32_t*>(result);
 | 
|---|
 | 2599 | 
 | 
|---|
 | 2600 |                         // convert to native utf32
 | 
|---|
 | 2601 |                         uint32_t* end = utf_decoder<utf32_writer>::decode_utf8_block(reinterpret_cast<const uint8_t*>(data), length, dest);
 | 
|---|
 | 2602 | 
 | 
|---|
 | 2603 |                         // swap if necessary
 | 
|---|
 | 2604 |                         xml_encoding native_encoding = is_little_endian() ? encoding_utf32_le : encoding_utf32_be;
 | 
|---|
 | 2605 | 
 | 
|---|
 | 2606 |                         if (native_encoding != encoding) convert_utf_endian_swap(dest, dest, static_cast<size_t>(end - dest));
 | 
|---|
 | 2607 | 
 | 
|---|
 | 2608 |                         return static_cast<size_t>(end - dest) * sizeof(uint32_t);
 | 
|---|
 | 2609 |                 }
 | 
|---|
 | 2610 | 
 | 
|---|
 | 2611 |                 assert(!"Invalid encoding");
 | 
|---|
 | 2612 |                 return 0;
 | 
|---|
 | 2613 |         }
 | 
|---|
 | 2614 | #endif
 | 
|---|
 | 2615 | 
 | 
|---|
 | 2616 |         class xml_buffered_writer
 | 
|---|
 | 2617 |         {
 | 
|---|
 | 2618 |                 xml_buffered_writer(const xml_buffered_writer&);
 | 
|---|
 | 2619 |                 xml_buffered_writer& operator=(const xml_buffered_writer&);
 | 
|---|
 | 2620 | 
 | 
|---|
 | 2621 |         public:
 | 
|---|
 | 2622 |                 xml_buffered_writer(xml_writer& writer, xml_encoding user_encoding): writer(writer), bufsize(0), encoding(get_write_encoding(user_encoding))
 | 
|---|
 | 2623 |                 {
 | 
|---|
 | 2624 |                 }
 | 
|---|
 | 2625 | 
 | 
|---|
 | 2626 |                 ~xml_buffered_writer()
 | 
|---|
 | 2627 |                 {
 | 
|---|
 | 2628 |                         flush();
 | 
|---|
 | 2629 |                 }
 | 
|---|
 | 2630 | 
 | 
|---|
 | 2631 |                 void flush()
 | 
|---|
 | 2632 |                 {
 | 
|---|
 | 2633 |                         flush(buffer, bufsize);
 | 
|---|
 | 2634 |                         bufsize = 0;
 | 
|---|
 | 2635 |                 }
 | 
|---|
 | 2636 | 
 | 
|---|
 | 2637 |                 void flush(const char_t* data, size_t size)
 | 
|---|
 | 2638 |                 {
 | 
|---|
 | 2639 |                         if (size == 0) return;
 | 
|---|
 | 2640 | 
 | 
|---|
 | 2641 |                         // fast path, just write data
 | 
|---|
 | 2642 |                         if (encoding == get_write_native_encoding())
 | 
|---|
 | 2643 |                                 writer.write(data, size * sizeof(char_t));
 | 
|---|
 | 2644 |                         else
 | 
|---|
 | 2645 |                         {
 | 
|---|
 | 2646 |                                 // convert chunk
 | 
|---|
 | 2647 |                                 size_t result = convert_buffer(scratch, data, size, encoding);
 | 
|---|
 | 2648 |                                 assert(result <= sizeof(scratch));
 | 
|---|
 | 2649 | 
 | 
|---|
 | 2650 |                                 // write data
 | 
|---|
 | 2651 |                                 writer.write(scratch, result);
 | 
|---|
 | 2652 |                         }
 | 
|---|
 | 2653 |                 }
 | 
|---|
 | 2654 | 
 | 
|---|
 | 2655 |                 void write(const char_t* data, size_t length)
 | 
|---|
 | 2656 |                 {
 | 
|---|
 | 2657 |                         if (bufsize + length > bufcapacity)
 | 
|---|
 | 2658 |                         {
 | 
|---|
 | 2659 |                                 // flush the remaining buffer contents
 | 
|---|
 | 2660 |                                 flush();
 | 
|---|
 | 2661 | 
 | 
|---|
 | 2662 |                                 // handle large chunks
 | 
|---|
 | 2663 |                                 if (length > bufcapacity)
 | 
|---|
 | 2664 |                                 {
 | 
|---|
 | 2665 |                                         if (encoding == get_write_native_encoding())
 | 
|---|
 | 2666 |                                         {
 | 
|---|
 | 2667 |                                                 // fast path, can just write data chunk
 | 
|---|
 | 2668 |                                                 writer.write(data, length * sizeof(char_t));
 | 
|---|
 | 2669 |                                                 return;
 | 
|---|
 | 2670 |                                         }
 | 
|---|
 | 2671 | 
 | 
|---|
 | 2672 |                                         // need to convert in suitable chunks
 | 
|---|
 | 2673 |                                         while (length > bufcapacity)
 | 
|---|
 | 2674 |                                         {
 | 
|---|
 | 2675 |                                                 // get chunk size by selecting such number of characters that are guaranteed to fit into scratch buffer
 | 
|---|
 | 2676 |                                                 // and form a complete codepoint sequence (i.e. discard start of last codepoint if necessary)
 | 
|---|
 | 2677 |                                                 size_t chunk_size = get_valid_length(data, bufcapacity);
 | 
|---|
 | 2678 | 
 | 
|---|
 | 2679 |                                                 // convert chunk and write
 | 
|---|
 | 2680 |                                                 flush(data, chunk_size);
 | 
|---|
 | 2681 | 
 | 
|---|
 | 2682 |                                                 // iterate
 | 
|---|
 | 2683 |                                                 data += chunk_size;
 | 
|---|
 | 2684 |                                                 length -= chunk_size;
 | 
|---|
 | 2685 |                                         }
 | 
|---|
 | 2686 | 
 | 
|---|
 | 2687 |                                         // small tail is copied below
 | 
|---|
 | 2688 |                                         bufsize = 0;
 | 
|---|
 | 2689 |                                 }
 | 
|---|
 | 2690 |                         }
 | 
|---|
 | 2691 | 
 | 
|---|
 | 2692 |                         memcpy(buffer + bufsize, data, length * sizeof(char_t));
 | 
|---|
 | 2693 |                         bufsize += length;
 | 
|---|
 | 2694 |                 }
 | 
|---|
 | 2695 | 
 | 
|---|
 | 2696 |                 void write(const char_t* data)
 | 
|---|
 | 2697 |                 {
 | 
|---|
 | 2698 |                         write(data, strlength(data));
 | 
|---|
 | 2699 |                 }
 | 
|---|
 | 2700 | 
 | 
|---|
 | 2701 |                 void write(char_t d0)
 | 
|---|
 | 2702 |                 {
 | 
|---|
 | 2703 |                         if (bufsize + 1 > bufcapacity) flush();
 | 
|---|
 | 2704 | 
 | 
|---|
 | 2705 |                         buffer[bufsize + 0] = d0;
 | 
|---|
 | 2706 |                         bufsize += 1;
 | 
|---|
 | 2707 |                 }
 | 
|---|
 | 2708 | 
 | 
|---|
 | 2709 |                 void write(char_t d0, char_t d1)
 | 
|---|
 | 2710 |                 {
 | 
|---|
 | 2711 |                         if (bufsize + 2 > bufcapacity) flush();
 | 
|---|
 | 2712 | 
 | 
|---|
 | 2713 |                         buffer[bufsize + 0] = d0;
 | 
|---|
 | 2714 |                         buffer[bufsize + 1] = d1;
 | 
|---|
 | 2715 |                         bufsize += 2;
 | 
|---|
 | 2716 |                 }
 | 
|---|
 | 2717 | 
 | 
|---|
 | 2718 |                 void write(char_t d0, char_t d1, char_t d2)
 | 
|---|
 | 2719 |                 {
 | 
|---|
 | 2720 |                         if (bufsize + 3 > bufcapacity) flush();
 | 
|---|
 | 2721 | 
 | 
|---|
 | 2722 |                         buffer[bufsize + 0] = d0;
 | 
|---|
 | 2723 |                         buffer[bufsize + 1] = d1;
 | 
|---|
 | 2724 |                         buffer[bufsize + 2] = d2;
 | 
|---|
 | 2725 |                         bufsize += 3;
 | 
|---|
 | 2726 |                 }
 | 
|---|
 | 2727 | 
 | 
|---|
 | 2728 |                 void write(char_t d0, char_t d1, char_t d2, char_t d3)
 | 
|---|
 | 2729 |                 {
 | 
|---|
 | 2730 |                         if (bufsize + 4 > bufcapacity) flush();
 | 
|---|
 | 2731 | 
 | 
|---|
 | 2732 |                         buffer[bufsize + 0] = d0;
 | 
|---|
 | 2733 |                         buffer[bufsize + 1] = d1;
 | 
|---|
 | 2734 |                         buffer[bufsize + 2] = d2;
 | 
|---|
 | 2735 |                         buffer[bufsize + 3] = d3;
 | 
|---|
 | 2736 |                         bufsize += 4;
 | 
|---|
 | 2737 |                 }
 | 
|---|
 | 2738 | 
 | 
|---|
 | 2739 |                 void write(char_t d0, char_t d1, char_t d2, char_t d3, char_t d4)
 | 
|---|
 | 2740 |                 {
 | 
|---|
 | 2741 |                         if (bufsize + 5 > bufcapacity) flush();
 | 
|---|
 | 2742 | 
 | 
|---|
 | 2743 |                         buffer[bufsize + 0] = d0;
 | 
|---|
 | 2744 |                         buffer[bufsize + 1] = d1;
 | 
|---|
 | 2745 |                         buffer[bufsize + 2] = d2;
 | 
|---|
 | 2746 |                         buffer[bufsize + 3] = d3;
 | 
|---|
 | 2747 |                         buffer[bufsize + 4] = d4;
 | 
|---|
 | 2748 |                         bufsize += 5;
 | 
|---|
 | 2749 |                 }
 | 
|---|
 | 2750 | 
 | 
|---|
 | 2751 |                 void write(char_t d0, char_t d1, char_t d2, char_t d3, char_t d4, char_t d5)
 | 
|---|
 | 2752 |                 {
 | 
|---|
 | 2753 |                         if (bufsize + 6 > bufcapacity) flush();
 | 
|---|
 | 2754 | 
 | 
|---|
 | 2755 |                         buffer[bufsize + 0] = d0;
 | 
|---|
 | 2756 |                         buffer[bufsize + 1] = d1;
 | 
|---|
 | 2757 |                         buffer[bufsize + 2] = d2;
 | 
|---|
 | 2758 |                         buffer[bufsize + 3] = d3;
 | 
|---|
 | 2759 |                         buffer[bufsize + 4] = d4;
 | 
|---|
 | 2760 |                         buffer[bufsize + 5] = d5;
 | 
|---|
 | 2761 |                         bufsize += 6;
 | 
|---|
 | 2762 |                 }
 | 
|---|
 | 2763 | 
 | 
|---|
 | 2764 |                 // utf8 maximum expansion: x4 (-> utf32)
 | 
|---|
 | 2765 |                 // utf16 maximum expansion: x2 (-> utf32)
 | 
|---|
 | 2766 |                 // utf32 maximum expansion: x1
 | 
|---|
 | 2767 |                 enum { bufcapacity = 2048 };
 | 
|---|
 | 2768 | 
 | 
|---|
 | 2769 |                 char_t buffer[bufcapacity];
 | 
|---|
 | 2770 |                 char scratch[4 * bufcapacity];
 | 
|---|
 | 2771 | 
 | 
|---|
 | 2772 |                 xml_writer& writer;
 | 
|---|
 | 2773 |                 size_t bufsize;
 | 
|---|
 | 2774 |                 xml_encoding encoding;
 | 
|---|
 | 2775 |         };
 | 
|---|
 | 2776 | 
 | 
|---|
 | 2777 |         void write_bom(xml_writer& writer, xml_encoding encoding)
 | 
|---|
 | 2778 |         {
 | 
|---|
 | 2779 |                 switch (encoding)
 | 
|---|
 | 2780 |                 {
 | 
|---|
 | 2781 |                 case encoding_utf8:
 | 
|---|
 | 2782 |                         writer.write("\xef\xbb\xbf", 3);
 | 
|---|
 | 2783 |                         break;
 | 
|---|
 | 2784 | 
 | 
|---|
 | 2785 |                 case encoding_utf16_be:
 | 
|---|
 | 2786 |                         writer.write("\xfe\xff", 2);
 | 
|---|
 | 2787 |                         break;
 | 
|---|
 | 2788 | 
 | 
|---|
 | 2789 |                 case encoding_utf16_le:
 | 
|---|
 | 2790 |                         writer.write("\xff\xfe", 2);
 | 
|---|
 | 2791 |                         break;
 | 
|---|
 | 2792 | 
 | 
|---|
 | 2793 |                 case encoding_utf32_be:
 | 
|---|
 | 2794 |                         writer.write("\x00\x00\xfe\xff", 4);
 | 
|---|
 | 2795 |                         break;
 | 
|---|
 | 2796 | 
 | 
|---|
 | 2797 |                 case encoding_utf32_le:
 | 
|---|
 | 2798 |                         writer.write("\xff\xfe\x00\x00", 4);
 | 
|---|
 | 2799 |                         break;
 | 
|---|
 | 2800 | 
 | 
|---|
 | 2801 |                 default:
 | 
|---|
 | 2802 |                         assert(!"Invalid encoding");
 | 
|---|
 | 2803 |                 }
 | 
|---|
 | 2804 |         }
 | 
|---|
 | 2805 | 
 | 
|---|
 | 2806 |         void text_output_escaped(xml_buffered_writer& writer, const char_t* s, chartypex_t type)
 | 
|---|
 | 2807 |         {
 | 
|---|
 | 2808 |                 while (*s)
 | 
|---|
 | 2809 |                 {
 | 
|---|
 | 2810 |                         const char_t* prev = s;
 | 
|---|
 | 2811 |                         
 | 
|---|
 | 2812 |                         // While *s is a usual symbol
 | 
|---|
 | 2813 |                         while (!IS_CHARTYPEX(*s, type)) ++s;
 | 
|---|
 | 2814 |                 
 | 
|---|
 | 2815 |                         writer.write(prev, static_cast<size_t>(s - prev));
 | 
|---|
 | 2816 | 
 | 
|---|
 | 2817 |                         switch (*s)
 | 
|---|
 | 2818 |                         {
 | 
|---|
 | 2819 |                                 case 0: break;
 | 
|---|
 | 2820 |                                 case '&':
 | 
|---|
 | 2821 |                                         writer.write('&', 'a', 'm', 'p', ';');
 | 
|---|
 | 2822 |                                         ++s;
 | 
|---|
 | 2823 |                                         break;
 | 
|---|
 | 2824 |                                 case '<':
 | 
|---|
 | 2825 |                                         writer.write('&', 'l', 't', ';');
 | 
|---|
 | 2826 |                                         ++s;
 | 
|---|
 | 2827 |                                         break;
 | 
|---|
 | 2828 |                                 case '>':
 | 
|---|
 | 2829 |                                         writer.write('&', 'g', 't', ';');
 | 
|---|
 | 2830 |                                         ++s;
 | 
|---|
 | 2831 |                                         break;
 | 
|---|
 | 2832 |                                 case '"':
 | 
|---|
 | 2833 |                                         writer.write('&', 'q', 'u', 'o', 't', ';');
 | 
|---|
 | 2834 |                                         ++s;
 | 
|---|
 | 2835 |                                         break;
 | 
|---|
 | 2836 |                                 default: // s is not a usual symbol
 | 
|---|
 | 2837 |                                 {
 | 
|---|
 | 2838 |                                         unsigned int ch = static_cast<unsigned int>(*s++);
 | 
|---|
 | 2839 |                                         assert(ch < 32);
 | 
|---|
 | 2840 | 
 | 
|---|
 | 2841 |                                         writer.write('&', '#', static_cast<char_t>((ch / 10) + '0'), static_cast<char_t>((ch % 10) + '0'), ';');
 | 
|---|
 | 2842 |                                 }
 | 
|---|
 | 2843 |                         }
 | 
|---|
 | 2844 |                 }
 | 
|---|
 | 2845 |         }
 | 
|---|
 | 2846 | 
 | 
|---|
 | 2847 |         void text_output_cdata(xml_buffered_writer& writer, const char_t* s)
 | 
|---|
 | 2848 |         {
 | 
|---|
 | 2849 |                 do
 | 
|---|
 | 2850 |                 {
 | 
|---|
 | 2851 |                         writer.write('<', '!', '[', 'C', 'D');
 | 
|---|
 | 2852 |                         writer.write('A', 'T', 'A', '[');
 | 
|---|
 | 2853 | 
 | 
|---|
 | 2854 |                         const char_t* prev = s;
 | 
|---|
 | 2855 | 
 | 
|---|
 | 2856 |                         // look for ]]> sequence - we can't output it as is since it terminates CDATA
 | 
|---|
 | 2857 |                         while (*s && !(s[0] == ']' && s[1] == ']' && s[2] == '>')) ++s;
 | 
|---|
 | 2858 | 
 | 
|---|
 | 2859 |                         // skip ]] if we stopped at ]]>, > will go to the next CDATA section
 | 
|---|
 | 2860 |                         if (*s) s += 2;
 | 
|---|
 | 2861 | 
 | 
|---|
 | 2862 |                         writer.write(prev, static_cast<size_t>(s - prev));
 | 
|---|
 | 2863 | 
 | 
|---|
 | 2864 |                         writer.write(']', ']', '>');
 | 
|---|
 | 2865 |                 }
 | 
|---|
 | 2866 |                 while (*s);
 | 
|---|
 | 2867 |         }
 | 
|---|
 | 2868 | 
 | 
|---|
 | 2869 |         void node_output_attributes(xml_buffered_writer& writer, const xml_node& node)
 | 
|---|
 | 2870 |         {
 | 
|---|
 | 2871 |                 const char_t* default_name = PUGIXML_TEXT(":anonymous");
 | 
|---|
 | 2872 | 
 | 
|---|
 | 2873 |                 for (xml_attribute a = node.first_attribute(); a; a = a.next_attribute())
 | 
|---|
 | 2874 |                 {
 | 
|---|
 | 2875 |                         writer.write(' ');
 | 
|---|
 | 2876 |                         writer.write(a.name()[0] ? a.name() : default_name);
 | 
|---|
 | 2877 |                         writer.write('=', '"');
 | 
|---|
 | 2878 | 
 | 
|---|
 | 2879 |                         text_output_escaped(writer, a.value(), ctx_special_attr);
 | 
|---|
 | 2880 | 
 | 
|---|
 | 2881 |                         writer.write('"');
 | 
|---|
 | 2882 |                 }
 | 
|---|
 | 2883 |         }
 | 
|---|
 | 2884 | 
 | 
|---|
 | 2885 |         void node_output(xml_buffered_writer& writer, const xml_node& node, const char_t* indent, unsigned int flags, unsigned int depth)
 | 
|---|
 | 2886 |         {
 | 
|---|
 | 2887 |                 const char_t* default_name = PUGIXML_TEXT(":anonymous");
 | 
|---|
 | 2888 | 
 | 
|---|
 | 2889 |                 if ((flags & format_indent) != 0 && (flags & format_raw) == 0)
 | 
|---|
 | 2890 |                         for (unsigned int i = 0; i < depth; ++i) writer.write(indent);
 | 
|---|
 | 2891 | 
 | 
|---|
 | 2892 |                 switch (node.type())
 | 
|---|
 | 2893 |                 {
 | 
|---|
 | 2894 |                 case node_document:
 | 
|---|
 | 2895 |                 {
 | 
|---|
 | 2896 |                         for (xml_node n = node.first_child(); n; n = n.next_sibling())
 | 
|---|
 | 2897 |                                 node_output(writer, n, indent, flags, depth);
 | 
|---|
 | 2898 |                         break;
 | 
|---|
 | 2899 |                 }
 | 
|---|
 | 2900 |                         
 | 
|---|
 | 2901 |                 case node_element:
 | 
|---|
 | 2902 |                 {
 | 
|---|
 | 2903 |                         const char_t* name = node.name()[0] ? node.name() : default_name;
 | 
|---|
 | 2904 | 
 | 
|---|
 | 2905 |                         writer.write('<');
 | 
|---|
 | 2906 |                         writer.write(name);
 | 
|---|
 | 2907 | 
 | 
|---|
 | 2908 |                         node_output_attributes(writer, node);
 | 
|---|
 | 2909 | 
 | 
|---|
 | 2910 |                         if (flags & format_raw)
 | 
|---|
 | 2911 |                         {
 | 
|---|
 | 2912 |                                 if (!node.first_child())
 | 
|---|
 | 2913 |                                         writer.write(' ', '/', '>');
 | 
|---|
 | 2914 |                                 else
 | 
|---|
 | 2915 |                                 {
 | 
|---|
 | 2916 |                                         writer.write('>');
 | 
|---|
 | 2917 | 
 | 
|---|
 | 2918 |                                         for (xml_node n = node.first_child(); n; n = n.next_sibling())
 | 
|---|
 | 2919 |                                                 node_output(writer, n, indent, flags, depth + 1);
 | 
|---|
 | 2920 | 
 | 
|---|
 | 2921 |                                         writer.write('<', '/');
 | 
|---|
 | 2922 |                                         writer.write(name);
 | 
|---|
 | 2923 |                                         writer.write('>');
 | 
|---|
 | 2924 |                                 }
 | 
|---|
 | 2925 |                         }
 | 
|---|
 | 2926 |                         else if (!node.first_child())
 | 
|---|
 | 2927 |                                 writer.write(' ', '/', '>', '\n');
 | 
|---|
 | 2928 |                         else if (node.first_child() == node.last_child() && (node.first_child().type() == node_pcdata || node.first_child().type() == node_cdata))
 | 
|---|
 | 2929 |                         {
 | 
|---|
 | 2930 |                                 writer.write('>');
 | 
|---|
 | 2931 | 
 | 
|---|
 | 2932 |                 if (node.first_child().type() == node_pcdata)
 | 
|---|
 | 2933 |                     text_output_escaped(writer, node.first_child().value(), ctx_special_pcdata);
 | 
|---|
 | 2934 |                 else
 | 
|---|
 | 2935 |                     text_output_cdata(writer, node.first_child().value());
 | 
|---|
 | 2936 | 
 | 
|---|
 | 2937 |                                 writer.write('<', '/');
 | 
|---|
 | 2938 |                                 writer.write(name);
 | 
|---|
 | 2939 |                                 writer.write('>', '\n');
 | 
|---|
 | 2940 |                         }
 | 
|---|
 | 2941 |                         else
 | 
|---|
 | 2942 |                         {
 | 
|---|
 | 2943 |                                 writer.write('>', '\n');
 | 
|---|
 | 2944 |                                 
 | 
|---|
 | 2945 |                                 for (xml_node n = node.first_child(); n; n = n.next_sibling())
 | 
|---|
 | 2946 |                                         node_output(writer, n, indent, flags, depth + 1);
 | 
|---|
 | 2947 | 
 | 
|---|
 | 2948 |                                 if ((flags & format_indent) != 0 && (flags & format_raw) == 0)
 | 
|---|
 | 2949 |                                         for (unsigned int i = 0; i < depth; ++i) writer.write(indent);
 | 
|---|
 | 2950 |                                 
 | 
|---|
 | 2951 |                                 writer.write('<', '/');
 | 
|---|
 | 2952 |                                 writer.write(name);
 | 
|---|
 | 2953 |                                 writer.write('>', '\n');
 | 
|---|
 | 2954 |                         }
 | 
|---|
 | 2955 | 
 | 
|---|
 | 2956 |                         break;
 | 
|---|
 | 2957 |                 }
 | 
|---|
 | 2958 |                 
 | 
|---|
 | 2959 |                 case node_pcdata:
 | 
|---|
 | 2960 |                         text_output_escaped(writer, node.value(), ctx_special_pcdata);
 | 
|---|
 | 2961 |                         if ((flags & format_raw) == 0) writer.write('\n');
 | 
|---|
 | 2962 |                         break;
 | 
|---|
 | 2963 | 
 | 
|---|
 | 2964 |                 case node_cdata:
 | 
|---|
 | 2965 |                         text_output_cdata(writer, node.value());
 | 
|---|
 | 2966 |                         if ((flags & format_raw) == 0) writer.write('\n');
 | 
|---|
 | 2967 |                         break;
 | 
|---|
 | 2968 | 
 | 
|---|
 | 2969 |                 case node_comment:
 | 
|---|
 | 2970 |                         writer.write('<', '!', '-', '-');
 | 
|---|
 | 2971 |                         writer.write(node.value());
 | 
|---|
 | 2972 |                         writer.write('-', '-', '>');
 | 
|---|
 | 2973 |                         if ((flags & format_raw) == 0) writer.write('\n');
 | 
|---|
 | 2974 |                         break;
 | 
|---|
 | 2975 | 
 | 
|---|
 | 2976 |                 case node_pi:
 | 
|---|
 | 2977 |                 case node_declaration:
 | 
|---|
 | 2978 |                         writer.write('<', '?');
 | 
|---|
 | 2979 |                         writer.write(node.name()[0] ? node.name() : default_name);
 | 
|---|
 | 2980 | 
 | 
|---|
 | 2981 |                         if (node.type() == node_declaration)
 | 
|---|
 | 2982 |                         {
 | 
|---|
 | 2983 |                                 node_output_attributes(writer, node);
 | 
|---|
 | 2984 |                         }
 | 
|---|
 | 2985 |                         else if (node.value()[0])
 | 
|---|
 | 2986 |                         {
 | 
|---|
 | 2987 |                                 writer.write(' ');
 | 
|---|
 | 2988 |                                 writer.write(node.value());
 | 
|---|
 | 2989 |                         }
 | 
|---|
 | 2990 | 
 | 
|---|
 | 2991 |                         writer.write('?', '>');
 | 
|---|
 | 2992 |                         if ((flags & format_raw) == 0) writer.write('\n');
 | 
|---|
 | 2993 |                         break;
 | 
|---|
 | 2994 | 
 | 
|---|
 | 2995 |                 case node_doctype:
 | 
|---|
 | 2996 |                         writer.write('<', '!', 'D', 'O', 'C');
 | 
|---|
 | 2997 |                         writer.write('T', 'Y', 'P', 'E');
 | 
|---|
 | 2998 | 
 | 
|---|
 | 2999 |             if (node.value()[0])
 | 
|---|
 | 3000 |             {
 | 
|---|
 | 3001 |                 writer.write(' ');
 | 
|---|
 | 3002 |                 writer.write(node.value());
 | 
|---|
 | 3003 |             }
 | 
|---|
 | 3004 | 
 | 
|---|
 | 3005 |             writer.write('>');
 | 
|---|
 | 3006 |                         if ((flags & format_raw) == 0) writer.write('\n');
 | 
|---|
 | 3007 |                         break;
 | 
|---|
 | 3008 | 
 | 
|---|
 | 3009 |                 default:
 | 
|---|
 | 3010 |                         assert(!"Invalid node type");
 | 
|---|
 | 3011 |                 }
 | 
|---|
 | 3012 |         }
 | 
|---|
 | 3013 | 
 | 
|---|
 | 3014 |         inline bool has_declaration(const xml_node& node)
 | 
|---|
 | 3015 |         {
 | 
|---|
 | 3016 |                 for (xml_node child = node.first_child(); child; child = child.next_sibling())
 | 
|---|
 | 3017 |                 {
 | 
|---|
 | 3018 |                         xml_node_type type = child.type();
 | 
|---|
 | 3019 | 
 | 
|---|
 | 3020 |                         if (type == node_declaration) return true;
 | 
|---|
 | 3021 |                         if (type == node_element) return false;
 | 
|---|
 | 3022 |                 }
 | 
|---|
 | 3023 | 
 | 
|---|
 | 3024 |                 return false;
 | 
|---|
 | 3025 |         }
 | 
|---|
 | 3026 | 
 | 
|---|
 | 3027 |         inline bool allow_insert_child(xml_node_type parent, xml_node_type child)
 | 
|---|
 | 3028 |         {
 | 
|---|
 | 3029 |                 if (parent != node_document && parent != node_element) return false;
 | 
|---|
 | 3030 |                 if (child == node_document || child == node_null) return false;
 | 
|---|
 | 3031 |                 if (parent != node_document && (child == node_declaration || child == node_doctype)) return false;
 | 
|---|
 | 3032 | 
 | 
|---|
 | 3033 |                 return true;
 | 
|---|
 | 3034 |         }
 | 
|---|
 | 3035 | 
 | 
|---|
 | 3036 |         void recursive_copy_skip(xml_node& dest, const xml_node& source, const xml_node& skip)
 | 
|---|
 | 3037 |         {
 | 
|---|
 | 3038 |                 assert(dest.type() == source.type());
 | 
|---|
 | 3039 | 
 | 
|---|
 | 3040 |                 switch (source.type())
 | 
|---|
 | 3041 |                 {
 | 
|---|
 | 3042 |                 case node_element:
 | 
|---|
 | 3043 |                 {
 | 
|---|
 | 3044 |                         dest.set_name(source.name());
 | 
|---|
 | 3045 | 
 | 
|---|
 | 3046 |                         for (xml_attribute a = source.first_attribute(); a; a = a.next_attribute())
 | 
|---|
 | 3047 |                                 dest.append_attribute(a.name()).set_value(a.value());
 | 
|---|
 | 3048 | 
 | 
|---|
 | 3049 |                         for (xml_node c = source.first_child(); c; c = c.next_sibling())
 | 
|---|
 | 3050 |                         {
 | 
|---|
 | 3051 |                                 if (c == skip) continue;
 | 
|---|
 | 3052 | 
 | 
|---|
 | 3053 |                                 xml_node cc = dest.append_child(c.type());
 | 
|---|
 | 3054 |                                 assert(cc);
 | 
|---|
 | 3055 | 
 | 
|---|
 | 3056 |                                 recursive_copy_skip(cc, c, skip);
 | 
|---|
 | 3057 |                         }
 | 
|---|
 | 3058 | 
 | 
|---|
 | 3059 |                         break;
 | 
|---|
 | 3060 |                 }
 | 
|---|
 | 3061 | 
 | 
|---|
 | 3062 |                 case node_pcdata:
 | 
|---|
 | 3063 |                 case node_cdata:
 | 
|---|
 | 3064 |                 case node_comment:
 | 
|---|
 | 3065 |         case node_doctype:
 | 
|---|
 | 3066 |                         dest.set_value(source.value());
 | 
|---|
 | 3067 |                         break;
 | 
|---|
 | 3068 | 
 | 
|---|
 | 3069 |                 case node_pi:
 | 
|---|
 | 3070 |                         dest.set_name(source.name());
 | 
|---|
 | 3071 |                         dest.set_value(source.value());
 | 
|---|
 | 3072 |                         break;
 | 
|---|
 | 3073 | 
 | 
|---|
 | 3074 |                 case node_declaration:
 | 
|---|
 | 3075 |                 {
 | 
|---|
 | 3076 |                         dest.set_name(source.name());
 | 
|---|
 | 3077 | 
 | 
|---|
 | 3078 |                         for (xml_attribute a = source.first_attribute(); a; a = a.next_attribute())
 | 
|---|
 | 3079 |                                 dest.append_attribute(a.name()).set_value(a.value());
 | 
|---|
 | 3080 | 
 | 
|---|
 | 3081 |                         break;
 | 
|---|
 | 3082 |                 }
 | 
|---|
 | 3083 | 
 | 
|---|
 | 3084 |                 default:
 | 
|---|
 | 3085 |                         assert(!"Invalid node type");
 | 
|---|
 | 3086 |                 }
 | 
|---|
 | 3087 |         }
 | 
|---|
 | 3088 | 
 | 
|---|
 | 3089 |         // we need to get length of entire file to load it in memory; the only (relatively) sane way to do it is via seek/tell trick
 | 
|---|
 | 3090 |         xml_parse_status get_file_size(FILE* file, size_t& out_result)
 | 
|---|
 | 3091 |         {
 | 
|---|
 | 3092 |         #if defined(_MSC_VER) && _MSC_VER >= 1400
 | 
|---|
 | 3093 |                 // there are 64-bit versions of fseek/ftell, let's use them
 | 
|---|
 | 3094 |                 typedef __int64 length_type;
 | 
|---|
 | 3095 | 
 | 
|---|
 | 3096 |                 _fseeki64(file, 0, SEEK_END);
 | 
|---|
 | 3097 |                 length_type length = _ftelli64(file);
 | 
|---|
 | 3098 |                 _fseeki64(file, 0, SEEK_SET);
 | 
|---|
 | 3099 |         #elif defined(__MINGW32__) && !defined(__NO_MINGW_LFS) && !defined(__STRICT_ANSI__)
 | 
|---|
 | 3100 |                 // there are 64-bit versions of fseek/ftell, let's use them
 | 
|---|
 | 3101 |                 typedef off64_t length_type;
 | 
|---|
 | 3102 | 
 | 
|---|
 | 3103 |                 fseeko64(file, 0, SEEK_END);
 | 
|---|
 | 3104 |                 length_type length = ftello64(file);
 | 
|---|
 | 3105 |                 fseeko64(file, 0, SEEK_SET);
 | 
|---|
 | 3106 |         #else
 | 
|---|
 | 3107 |                 // if this is a 32-bit OS, long is enough; if this is a unix system, long is 64-bit, which is enough; otherwise we can't do anything anyway.
 | 
|---|
 | 3108 |                 typedef long length_type;
 | 
|---|
 | 3109 | 
 | 
|---|
 | 3110 |                 fseek(file, 0, SEEK_END);
 | 
|---|
 | 3111 |                 length_type length = ftell(file);
 | 
|---|
 | 3112 |                 fseek(file, 0, SEEK_SET);
 | 
|---|
 | 3113 |         #endif
 | 
|---|
 | 3114 | 
 | 
|---|
 | 3115 |                 // check for I/O errors
 | 
|---|
 | 3116 |                 if (length < 0) return status_io_error;
 | 
|---|
 | 3117 |                 
 | 
|---|
 | 3118 |                 // check for overflow
 | 
|---|
 | 3119 |                 size_t result = static_cast<size_t>(length);
 | 
|---|
 | 3120 | 
 | 
|---|
 | 3121 |                 if (static_cast<length_type>(result) != length) return status_out_of_memory;
 | 
|---|
 | 3122 | 
 | 
|---|
 | 3123 |                 // finalize
 | 
|---|
 | 3124 |                 out_result = result;
 | 
|---|
 | 3125 | 
 | 
|---|
 | 3126 |                 return status_ok;
 | 
|---|
 | 3127 |         }
 | 
|---|
 | 3128 | 
 | 
|---|
 | 3129 |         xml_parse_result load_file_impl(xml_document& doc, FILE* file, unsigned int options, xml_encoding encoding)
 | 
|---|
 | 3130 |         {
 | 
|---|
 | 3131 |                 if (!file) return make_parse_result(status_file_not_found);
 | 
|---|
 | 3132 | 
 | 
|---|
 | 3133 |                 // get file size (can result in I/O errors)
 | 
|---|
 | 3134 |                 size_t size = 0;
 | 
|---|
 | 3135 |                 xml_parse_status size_status = get_file_size(file, size);
 | 
|---|
 | 3136 | 
 | 
|---|
 | 3137 |                 if (size_status != status_ok)
 | 
|---|
 | 3138 |                 {
 | 
|---|
 | 3139 |                         fclose(file);
 | 
|---|
 | 3140 |                         return make_parse_result(size_status);
 | 
|---|
 | 3141 |                 }
 | 
|---|
 | 3142 |                 
 | 
|---|
 | 3143 |                 // allocate buffer for the whole file
 | 
|---|
 | 3144 |                 char* contents = static_cast<char*>(global_allocate(size > 0 ? size : 1));
 | 
|---|
 | 3145 | 
 | 
|---|
 | 3146 |                 if (!contents)
 | 
|---|
 | 3147 |                 {
 | 
|---|
 | 3148 |                         fclose(file);
 | 
|---|
 | 3149 |                         return make_parse_result(status_out_of_memory);
 | 
|---|
 | 3150 |                 }
 | 
|---|
 | 3151 | 
 | 
|---|
 | 3152 |                 // read file in memory
 | 
|---|
 | 3153 |                 size_t read_size = fread(contents, 1, size, file);
 | 
|---|
 | 3154 |                 fclose(file);
 | 
|---|
 | 3155 | 
 | 
|---|
 | 3156 |                 if (read_size != size)
 | 
|---|
 | 3157 |                 {
 | 
|---|
 | 3158 |                         global_deallocate(contents);
 | 
|---|
 | 3159 |                         return make_parse_result(status_io_error);
 | 
|---|
 | 3160 |                 }
 | 
|---|
 | 3161 |                 
 | 
|---|
 | 3162 |                 return doc.load_buffer_inplace_own(contents, size, options, encoding);
 | 
|---|
 | 3163 |         }
 | 
|---|
 | 3164 | 
 | 
|---|
 | 3165 | #ifndef PUGIXML_NO_STL
 | 
|---|
 | 3166 |         template <typename T> xml_parse_result load_stream_impl(xml_document& doc, std::basic_istream<T>& stream, unsigned int options, xml_encoding encoding)
 | 
|---|
 | 3167 |         {
 | 
|---|
 | 3168 |                 // get length of remaining data in stream
 | 
|---|
 | 3169 |                 typename std::basic_istream<T>::pos_type pos = stream.tellg();
 | 
|---|
 | 3170 |                 stream.seekg(0, std::ios::end);
 | 
|---|
 | 3171 |                 std::streamoff length = stream.tellg() - pos;
 | 
|---|
 | 3172 |                 stream.seekg(pos);
 | 
|---|
 | 3173 | 
 | 
|---|
 | 3174 |                 if (stream.fail() || pos < 0) return make_parse_result(status_io_error);
 | 
|---|
 | 3175 | 
 | 
|---|
 | 3176 |                 // guard against huge files
 | 
|---|
 | 3177 |                 size_t read_length = static_cast<size_t>(length);
 | 
|---|
 | 3178 | 
 | 
|---|
 | 3179 |                 if (static_cast<std::streamsize>(read_length) != length || length < 0) return make_parse_result(status_out_of_memory);
 | 
|---|
 | 3180 | 
 | 
|---|
 | 3181 |                 // read stream data into memory (guard against stream exceptions with buffer holder)
 | 
|---|
 | 3182 |                 buffer_holder buffer(global_allocate((read_length > 0 ? read_length : 1) * sizeof(T)), global_deallocate);
 | 
|---|
 | 3183 |                 if (!buffer.data) return make_parse_result(status_out_of_memory);
 | 
|---|
 | 3184 | 
 | 
|---|
 | 3185 |                 stream.read(static_cast<T*>(buffer.data), static_cast<std::streamsize>(read_length));
 | 
|---|
 | 3186 | 
 | 
|---|
 | 3187 |                 // read may set failbit | eofbit in case gcount() is less than read_length (i.e. line ending conversion), so check for other I/O errors
 | 
|---|
 | 3188 |                 if (stream.bad()) return make_parse_result(status_io_error);
 | 
|---|
 | 3189 | 
 | 
|---|
 | 3190 |                 // load data from buffer
 | 
|---|
 | 3191 |                 size_t actual_length = static_cast<size_t>(stream.gcount());
 | 
|---|
 | 3192 |                 assert(actual_length <= read_length);
 | 
|---|
 | 3193 | 
 | 
|---|
 | 3194 |                 return doc.load_buffer_inplace_own(buffer.release(), actual_length * sizeof(T), options, encoding);
 | 
|---|
 | 3195 |         }
 | 
|---|
 | 3196 | #endif
 | 
|---|
 | 3197 | 
 | 
|---|
 | 3198 | #if defined(_MSC_VER) || defined(__BORLANDC__) || defined(__MINGW32__)
 | 
|---|
 | 3199 |         FILE* open_file_wide(const wchar_t* path, const wchar_t* mode)
 | 
|---|
 | 3200 |         {
 | 
|---|
 | 3201 |                 return _wfopen(path, mode);
 | 
|---|
 | 3202 |         }
 | 
|---|
 | 3203 | #else
 | 
|---|
 | 3204 |         char* convert_path_heap(const wchar_t* str)
 | 
|---|
 | 3205 |         {
 | 
|---|
 | 3206 |                 assert(str);
 | 
|---|
 | 3207 | 
 | 
|---|
 | 3208 |                 // first pass: get length in utf8 characters
 | 
|---|
 | 3209 |                 size_t length = wcslen(str);
 | 
|---|
 | 3210 |         size_t size = as_utf8_begin(str, length);
 | 
|---|
 | 3211 | 
 | 
|---|
 | 3212 |                 // allocate resulting string
 | 
|---|
 | 3213 |                 char* result = static_cast<char*>(global_allocate(size + 1));
 | 
|---|
 | 3214 |                 if (!result) return 0;
 | 
|---|
 | 3215 | 
 | 
|---|
 | 3216 |                 // second pass: convert to utf8
 | 
|---|
 | 3217 |         as_utf8_end(result, size, str, length);
 | 
|---|
 | 3218 | 
 | 
|---|
 | 3219 |                 return result;
 | 
|---|
 | 3220 |         }
 | 
|---|
 | 3221 | 
 | 
|---|
 | 3222 |         FILE* open_file_wide(const wchar_t* path, const wchar_t* mode)
 | 
|---|
 | 3223 |         {
 | 
|---|
 | 3224 |                 // there is no standard function to open wide paths, so our best bet is to try utf8 path
 | 
|---|
 | 3225 |                 char* path_utf8 = convert_path_heap(path);
 | 
|---|
 | 3226 |                 if (!path_utf8) return 0;
 | 
|---|
 | 3227 | 
 | 
|---|
 | 3228 |                 // convert mode to ASCII (we mirror _wfopen interface)
 | 
|---|
 | 3229 |                 char mode_ascii[4] = {0};
 | 
|---|
 | 3230 |                 for (size_t i = 0; mode[i]; ++i) mode_ascii[i] = static_cast<char>(mode[i]);
 | 
|---|
 | 3231 | 
 | 
|---|
 | 3232 |                 // try to open the utf8 path
 | 
|---|
 | 3233 |                 FILE* result = fopen(path_utf8, mode_ascii);
 | 
|---|
 | 3234 | 
 | 
|---|
 | 3235 |                 // free dummy buffer
 | 
|---|
 | 3236 |                 global_deallocate(path_utf8);
 | 
|---|
 | 3237 | 
 | 
|---|
 | 3238 |                 return result;
 | 
|---|
 | 3239 |         }
 | 
|---|
 | 3240 | #endif
 | 
|---|
 | 3241 | }
 | 
|---|
 | 3242 | 
 | 
|---|
 | 3243 | namespace pugi
 | 
|---|
 | 3244 | {
 | 
|---|
 | 3245 |         xml_writer_file::xml_writer_file(void* file): file(file)
 | 
|---|
 | 3246 |         {
 | 
|---|
 | 3247 |         }
 | 
|---|
 | 3248 | 
 | 
|---|
 | 3249 |         void xml_writer_file::write(const void* data, size_t size)
 | 
|---|
 | 3250 |         {
 | 
|---|
 | 3251 |                 fwrite(data, size, 1, static_cast<FILE*>(file));
 | 
|---|
 | 3252 |         }
 | 
|---|
 | 3253 | 
 | 
|---|
 | 3254 | #ifndef PUGIXML_NO_STL
 | 
|---|
 | 3255 |         xml_writer_stream::xml_writer_stream(std::basic_ostream<char, std::char_traits<char> >& stream): narrow_stream(&stream), wide_stream(0)
 | 
|---|
 | 3256 |         {
 | 
|---|
 | 3257 |         }
 | 
|---|
 | 3258 | 
 | 
|---|
 | 3259 |         xml_writer_stream::xml_writer_stream(std::basic_ostream<wchar_t, std::char_traits<wchar_t> >& stream): narrow_stream(0), wide_stream(&stream)
 | 
|---|
 | 3260 |         {
 | 
|---|
 | 3261 |         }
 | 
|---|
 | 3262 | 
 | 
|---|
 | 3263 |         void xml_writer_stream::write(const void* data, size_t size)
 | 
|---|
 | 3264 |         {
 | 
|---|
 | 3265 |                 if (narrow_stream)
 | 
|---|
 | 3266 |                 {
 | 
|---|
 | 3267 |                         assert(!wide_stream);
 | 
|---|
 | 3268 |                         narrow_stream->write(reinterpret_cast<const char*>(data), static_cast<std::streamsize>(size));
 | 
|---|
 | 3269 |                 }
 | 
|---|
 | 3270 |                 else
 | 
|---|
 | 3271 |                 {
 | 
|---|
 | 3272 |                         assert(wide_stream);
 | 
|---|
 | 3273 |                         assert(size % sizeof(wchar_t) == 0);
 | 
|---|
 | 3274 | 
 | 
|---|
 | 3275 |                         wide_stream->write(reinterpret_cast<const wchar_t*>(data), static_cast<std::streamsize>(size / sizeof(wchar_t)));
 | 
|---|
 | 3276 |                 }
 | 
|---|
 | 3277 |         }
 | 
|---|
 | 3278 | #endif
 | 
|---|
 | 3279 | 
 | 
|---|
 | 3280 |         xml_tree_walker::xml_tree_walker(): _depth(0)
 | 
|---|
 | 3281 |         {
 | 
|---|
 | 3282 |         }
 | 
|---|
 | 3283 |         
 | 
|---|
 | 3284 |         xml_tree_walker::~xml_tree_walker()
 | 
|---|
 | 3285 |         {
 | 
|---|
 | 3286 |         }
 | 
|---|
 | 3287 | 
 | 
|---|
 | 3288 |         int xml_tree_walker::depth() const
 | 
|---|
 | 3289 |         {
 | 
|---|
 | 3290 |                 return _depth;
 | 
|---|
 | 3291 |         }
 | 
|---|
 | 3292 | 
 | 
|---|
 | 3293 |         bool xml_tree_walker::begin(xml_node&)
 | 
|---|
 | 3294 |         {
 | 
|---|
 | 3295 |                 return true;
 | 
|---|
 | 3296 |         }
 | 
|---|
 | 3297 | 
 | 
|---|
 | 3298 |         bool xml_tree_walker::end(xml_node&)
 | 
|---|
 | 3299 |         {
 | 
|---|
 | 3300 |                 return true;
 | 
|---|
 | 3301 |         }
 | 
|---|
 | 3302 | 
 | 
|---|
 | 3303 |         xml_attribute::xml_attribute(): _attr(0)
 | 
|---|
 | 3304 |         {
 | 
|---|
 | 3305 |         }
 | 
|---|
 | 3306 | 
 | 
|---|
 | 3307 |         xml_attribute::xml_attribute(xml_attribute_struct* attr): _attr(attr)
 | 
|---|
 | 3308 |         {
 | 
|---|
 | 3309 |         }
 | 
|---|
 | 3310 | 
 | 
|---|
 | 3311 |         xml_attribute::operator xml_attribute::unspecified_bool_type() const
 | 
|---|
 | 3312 |         {
 | 
|---|
 | 3313 |         return _attr ? &xml_attribute::_attr : 0;
 | 
|---|
 | 3314 |         }
 | 
|---|
 | 3315 | 
 | 
|---|
 | 3316 |         bool xml_attribute::operator!() const
 | 
|---|
 | 3317 |         {
 | 
|---|
 | 3318 |                 return !_attr;
 | 
|---|
 | 3319 |         }
 | 
|---|
 | 3320 | 
 | 
|---|
 | 3321 |         bool xml_attribute::operator==(const xml_attribute& r) const
 | 
|---|
 | 3322 |         {
 | 
|---|
 | 3323 |                 return (_attr == r._attr);
 | 
|---|
 | 3324 |         }
 | 
|---|
 | 3325 |         
 | 
|---|
 | 3326 |         bool xml_attribute::operator!=(const xml_attribute& r) const
 | 
|---|
 | 3327 |         {
 | 
|---|
 | 3328 |                 return (_attr != r._attr);
 | 
|---|
 | 3329 |         }
 | 
|---|
 | 3330 | 
 | 
|---|
 | 3331 |         bool xml_attribute::operator<(const xml_attribute& r) const
 | 
|---|
 | 3332 |         {
 | 
|---|
 | 3333 |                 return (_attr < r._attr);
 | 
|---|
 | 3334 |         }
 | 
|---|
 | 3335 |         
 | 
|---|
 | 3336 |         bool xml_attribute::operator>(const xml_attribute& r) const
 | 
|---|
 | 3337 |         {
 | 
|---|
 | 3338 |                 return (_attr > r._attr);
 | 
|---|
 | 3339 |         }
 | 
|---|
 | 3340 |         
 | 
|---|
 | 3341 |         bool xml_attribute::operator<=(const xml_attribute& r) const
 | 
|---|
 | 3342 |         {
 | 
|---|
 | 3343 |                 return (_attr <= r._attr);
 | 
|---|
 | 3344 |         }
 | 
|---|
 | 3345 |         
 | 
|---|
 | 3346 |         bool xml_attribute::operator>=(const xml_attribute& r) const
 | 
|---|
 | 3347 |         {
 | 
|---|
 | 3348 |                 return (_attr >= r._attr);
 | 
|---|
 | 3349 |         }
 | 
|---|
 | 3350 | 
 | 
|---|
 | 3351 |         xml_attribute xml_attribute::next_attribute() const
 | 
|---|
 | 3352 |         {
 | 
|---|
 | 3353 |         return _attr ? xml_attribute(_attr->next_attribute) : xml_attribute();
 | 
|---|
 | 3354 |         }
 | 
|---|
 | 3355 | 
 | 
|---|
 | 3356 |     xml_attribute xml_attribute::previous_attribute() const
 | 
|---|
 | 3357 |     {
 | 
|---|
 | 3358 |         return _attr && _attr->prev_attribute_c->next_attribute ? xml_attribute(_attr->prev_attribute_c) : xml_attribute();
 | 
|---|
 | 3359 |     }
 | 
|---|
 | 3360 | 
 | 
|---|
 | 3361 |         int xml_attribute::as_int() const
 | 
|---|
 | 3362 |         {
 | 
|---|
 | 3363 |                 if (!_attr || !_attr->value) return 0;
 | 
|---|
 | 3364 | 
 | 
|---|
 | 3365 |         #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 3366 |                 return (int)wcstol(_attr->value, 0, 10);
 | 
|---|
 | 3367 |         #else
 | 
|---|
 | 3368 |                 return (int)strtol(_attr->value, 0, 10);
 | 
|---|
 | 3369 |         #endif
 | 
|---|
 | 3370 |         }
 | 
|---|
 | 3371 | 
 | 
|---|
 | 3372 |         unsigned int xml_attribute::as_uint() const
 | 
|---|
 | 3373 |         {
 | 
|---|
 | 3374 |                 if (!_attr || !_attr->value) return 0;
 | 
|---|
 | 3375 | 
 | 
|---|
 | 3376 |         #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 3377 |                 return (unsigned int)wcstoul(_attr->value, 0, 10);
 | 
|---|
 | 3378 |         #else
 | 
|---|
 | 3379 |                 return (unsigned int)strtoul(_attr->value, 0, 10);
 | 
|---|
 | 3380 |         #endif
 | 
|---|
 | 3381 |         }
 | 
|---|
 | 3382 | 
 | 
|---|
 | 3383 |         double xml_attribute::as_double() const
 | 
|---|
 | 3384 |         {
 | 
|---|
 | 3385 |                 if (!_attr || !_attr->value) return 0;
 | 
|---|
 | 3386 | 
 | 
|---|
 | 3387 |         #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 3388 |                 return wcstod(_attr->value, 0);
 | 
|---|
 | 3389 |         #else
 | 
|---|
 | 3390 |                 return strtod(_attr->value, 0);
 | 
|---|
 | 3391 |         #endif
 | 
|---|
 | 3392 |         }
 | 
|---|
 | 3393 | 
 | 
|---|
 | 3394 |         float xml_attribute::as_float() const
 | 
|---|
 | 3395 |         {
 | 
|---|
 | 3396 |                 if (!_attr || !_attr->value) return 0;
 | 
|---|
 | 3397 | 
 | 
|---|
 | 3398 |         #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 3399 |                 return (float)wcstod(_attr->value, 0);
 | 
|---|
 | 3400 |         #else
 | 
|---|
 | 3401 |                 return (float)strtod(_attr->value, 0);
 | 
|---|
 | 3402 |         #endif
 | 
|---|
 | 3403 |         }
 | 
|---|
 | 3404 | 
 | 
|---|
 | 3405 |         bool xml_attribute::as_bool() const
 | 
|---|
 | 3406 |         {
 | 
|---|
 | 3407 |                 if (!_attr || !_attr->value) return false;
 | 
|---|
 | 3408 | 
 | 
|---|
 | 3409 |                 // only look at first char
 | 
|---|
 | 3410 |                 char_t first = *_attr->value;
 | 
|---|
 | 3411 | 
 | 
|---|
 | 3412 |                 // 1*, t* (true), T* (True), y* (yes), Y* (YES)
 | 
|---|
 | 3413 |                 return (first == '1' || first == 't' || first == 'T' || first == 'y' || first == 'Y');
 | 
|---|
 | 3414 |         }
 | 
|---|
 | 3415 | 
 | 
|---|
 | 3416 |         bool xml_attribute::empty() const
 | 
|---|
 | 3417 |         {
 | 
|---|
 | 3418 |                 return !_attr;
 | 
|---|
 | 3419 |         }
 | 
|---|
 | 3420 | 
 | 
|---|
 | 3421 |         const char_t* xml_attribute::name() const
 | 
|---|
 | 3422 |         {
 | 
|---|
 | 3423 |                 return (_attr && _attr->name) ? _attr->name : PUGIXML_TEXT("");
 | 
|---|
 | 3424 |         }
 | 
|---|
 | 3425 | 
 | 
|---|
 | 3426 |         const char_t* xml_attribute::value() const
 | 
|---|
 | 3427 |         {
 | 
|---|
 | 3428 |                 return (_attr && _attr->value) ? _attr->value : PUGIXML_TEXT("");
 | 
|---|
 | 3429 |         }
 | 
|---|
 | 3430 | 
 | 
|---|
 | 3431 |     size_t xml_attribute::hash_value() const
 | 
|---|
 | 3432 |     {
 | 
|---|
 | 3433 |         return static_cast<size_t>(reinterpret_cast<uintptr_t>(_attr) / sizeof(xml_attribute_struct));
 | 
|---|
 | 3434 |     }
 | 
|---|
 | 3435 | 
 | 
|---|
 | 3436 |         xml_attribute_struct* xml_attribute::internal_object() const
 | 
|---|
 | 3437 |         {
 | 
|---|
 | 3438 |         return _attr;
 | 
|---|
 | 3439 |         }
 | 
|---|
 | 3440 | 
 | 
|---|
 | 3441 |         xml_attribute& xml_attribute::operator=(const char_t* rhs)
 | 
|---|
 | 3442 |         {
 | 
|---|
 | 3443 |                 set_value(rhs);
 | 
|---|
 | 3444 |                 return *this;
 | 
|---|
 | 3445 |         }
 | 
|---|
 | 3446 |         
 | 
|---|
 | 3447 |         xml_attribute& xml_attribute::operator=(int rhs)
 | 
|---|
 | 3448 |         {
 | 
|---|
 | 3449 |                 set_value(rhs);
 | 
|---|
 | 3450 |                 return *this;
 | 
|---|
 | 3451 |         }
 | 
|---|
 | 3452 | 
 | 
|---|
 | 3453 |         xml_attribute& xml_attribute::operator=(unsigned int rhs)
 | 
|---|
 | 3454 |         {
 | 
|---|
 | 3455 |                 set_value(rhs);
 | 
|---|
 | 3456 |                 return *this;
 | 
|---|
 | 3457 |         }
 | 
|---|
 | 3458 | 
 | 
|---|
 | 3459 |         xml_attribute& xml_attribute::operator=(double rhs)
 | 
|---|
 | 3460 |         {
 | 
|---|
 | 3461 |                 set_value(rhs);
 | 
|---|
 | 3462 |                 return *this;
 | 
|---|
 | 3463 |         }
 | 
|---|
 | 3464 |         
 | 
|---|
 | 3465 |         xml_attribute& xml_attribute::operator=(bool rhs)
 | 
|---|
 | 3466 |         {
 | 
|---|
 | 3467 |                 set_value(rhs);
 | 
|---|
 | 3468 |                 return *this;
 | 
|---|
 | 3469 |         }
 | 
|---|
 | 3470 | 
 | 
|---|
 | 3471 |         bool xml_attribute::set_name(const char_t* rhs)
 | 
|---|
 | 3472 |         {
 | 
|---|
 | 3473 |                 if (!_attr) return false;
 | 
|---|
 | 3474 |                 
 | 
|---|
 | 3475 |                 return strcpy_insitu(_attr->name, _attr->header, xml_memory_page_name_allocated_mask, rhs);
 | 
|---|
 | 3476 |         }
 | 
|---|
 | 3477 |                 
 | 
|---|
 | 3478 |         bool xml_attribute::set_value(const char_t* rhs)
 | 
|---|
 | 3479 |         {
 | 
|---|
 | 3480 |                 if (!_attr) return false;
 | 
|---|
 | 3481 | 
 | 
|---|
 | 3482 |                 return strcpy_insitu(_attr->value, _attr->header, xml_memory_page_value_allocated_mask, rhs);
 | 
|---|
 | 3483 |         }
 | 
|---|
 | 3484 | 
 | 
|---|
 | 3485 |         bool xml_attribute::set_value(int rhs)
 | 
|---|
 | 3486 |         {
 | 
|---|
 | 3487 |                 char buf[128];
 | 
|---|
 | 3488 |                 sprintf(buf, "%d", rhs);
 | 
|---|
 | 3489 |         
 | 
|---|
 | 3490 |         #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 3491 |                 char_t wbuf[128];
 | 
|---|
 | 3492 |                 widen_ascii(wbuf, buf);
 | 
|---|
 | 3493 | 
 | 
|---|
 | 3494 |                 return set_value(wbuf);
 | 
|---|
 | 3495 |         #else
 | 
|---|
 | 3496 |                 return set_value(buf);
 | 
|---|
 | 3497 |         #endif
 | 
|---|
 | 3498 |         }
 | 
|---|
 | 3499 | 
 | 
|---|
 | 3500 |         bool xml_attribute::set_value(unsigned int rhs)
 | 
|---|
 | 3501 |         {
 | 
|---|
 | 3502 |                 char buf[128];
 | 
|---|
 | 3503 |                 sprintf(buf, "%u", rhs);
 | 
|---|
 | 3504 | 
 | 
|---|
 | 3505 |         #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 3506 |                 char_t wbuf[128];
 | 
|---|
 | 3507 |                 widen_ascii(wbuf, buf);
 | 
|---|
 | 3508 | 
 | 
|---|
 | 3509 |                 return set_value(wbuf);
 | 
|---|
 | 3510 |         #else
 | 
|---|
 | 3511 |                 return set_value(buf);
 | 
|---|
 | 3512 |         #endif
 | 
|---|
 | 3513 |         }
 | 
|---|
 | 3514 | 
 | 
|---|
 | 3515 |         bool xml_attribute::set_value(double rhs)
 | 
|---|
 | 3516 |         {
 | 
|---|
 | 3517 |                 char buf[128];
 | 
|---|
 | 3518 |                 sprintf(buf, "%g", rhs);
 | 
|---|
 | 3519 | 
 | 
|---|
 | 3520 |         #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 3521 |                 char_t wbuf[128];
 | 
|---|
 | 3522 |                 widen_ascii(wbuf, buf);
 | 
|---|
 | 3523 | 
 | 
|---|
 | 3524 |                 return set_value(wbuf);
 | 
|---|
 | 3525 |         #else
 | 
|---|
 | 3526 |                 return set_value(buf);
 | 
|---|
 | 3527 |         #endif
 | 
|---|
 | 3528 |         }
 | 
|---|
 | 3529 |         
 | 
|---|
 | 3530 |         bool xml_attribute::set_value(bool rhs)
 | 
|---|
 | 3531 |         {
 | 
|---|
 | 3532 |                 return set_value(rhs ? PUGIXML_TEXT("true") : PUGIXML_TEXT("false"));
 | 
|---|
 | 3533 |         }
 | 
|---|
 | 3534 | 
 | 
|---|
 | 3535 | #ifdef __BORLANDC__
 | 
|---|
 | 3536 |         bool operator&&(const xml_attribute& lhs, bool rhs)
 | 
|---|
 | 3537 |         {
 | 
|---|
 | 3538 |                 return (bool)lhs && rhs;
 | 
|---|
 | 3539 |         }
 | 
|---|
 | 3540 | 
 | 
|---|
 | 3541 |         bool operator||(const xml_attribute& lhs, bool rhs)
 | 
|---|
 | 3542 |         {
 | 
|---|
 | 3543 |                 return (bool)lhs || rhs;
 | 
|---|
 | 3544 |         }
 | 
|---|
 | 3545 | #endif
 | 
|---|
 | 3546 | 
 | 
|---|
 | 3547 |         xml_node::xml_node(): _root(0)
 | 
|---|
 | 3548 |         {
 | 
|---|
 | 3549 |         }
 | 
|---|
 | 3550 | 
 | 
|---|
 | 3551 |         xml_node::xml_node(xml_node_struct* p): _root(p)
 | 
|---|
 | 3552 |         {
 | 
|---|
 | 3553 |         }
 | 
|---|
 | 3554 |         
 | 
|---|
 | 3555 |         xml_node::operator xml_node::unspecified_bool_type() const
 | 
|---|
 | 3556 |         {
 | 
|---|
 | 3557 |         return _root ? &xml_node::_root : 0;
 | 
|---|
 | 3558 |         }
 | 
|---|
 | 3559 | 
 | 
|---|
 | 3560 |         bool xml_node::operator!() const
 | 
|---|
 | 3561 |         {
 | 
|---|
 | 3562 |                 return !_root;
 | 
|---|
 | 3563 |         }
 | 
|---|
 | 3564 | 
 | 
|---|
 | 3565 |         xml_node::iterator xml_node::begin() const
 | 
|---|
 | 3566 |         {
 | 
|---|
 | 3567 |                 return iterator(_root ? _root->first_child : 0, _root);
 | 
|---|
 | 3568 |         }
 | 
|---|
 | 3569 | 
 | 
|---|
 | 3570 |         xml_node::iterator xml_node::end() const
 | 
|---|
 | 3571 |         {
 | 
|---|
 | 3572 |                 return iterator(0, _root);
 | 
|---|
 | 3573 |         }
 | 
|---|
 | 3574 |         
 | 
|---|
 | 3575 |         xml_node::attribute_iterator xml_node::attributes_begin() const
 | 
|---|
 | 3576 |         {
 | 
|---|
 | 3577 |                 return attribute_iterator(_root ? _root->first_attribute : 0, _root);
 | 
|---|
 | 3578 |         }
 | 
|---|
 | 3579 | 
 | 
|---|
 | 3580 |         xml_node::attribute_iterator xml_node::attributes_end() const
 | 
|---|
 | 3581 |         {
 | 
|---|
 | 3582 |                 return attribute_iterator(0, _root);
 | 
|---|
 | 3583 |         }
 | 
|---|
 | 3584 | 
 | 
|---|
 | 3585 |         bool xml_node::operator==(const xml_node& r) const
 | 
|---|
 | 3586 |         {
 | 
|---|
 | 3587 |                 return (_root == r._root);
 | 
|---|
 | 3588 |         }
 | 
|---|
 | 3589 | 
 | 
|---|
 | 3590 |         bool xml_node::operator!=(const xml_node& r) const
 | 
|---|
 | 3591 |         {
 | 
|---|
 | 3592 |                 return (_root != r._root);
 | 
|---|
 | 3593 |         }
 | 
|---|
 | 3594 | 
 | 
|---|
 | 3595 |         bool xml_node::operator<(const xml_node& r) const
 | 
|---|
 | 3596 |         {
 | 
|---|
 | 3597 |                 return (_root < r._root);
 | 
|---|
 | 3598 |         }
 | 
|---|
 | 3599 |         
 | 
|---|
 | 3600 |         bool xml_node::operator>(const xml_node& r) const
 | 
|---|
 | 3601 |         {
 | 
|---|
 | 3602 |                 return (_root > r._root);
 | 
|---|
 | 3603 |         }
 | 
|---|
 | 3604 |         
 | 
|---|
 | 3605 |         bool xml_node::operator<=(const xml_node& r) const
 | 
|---|
 | 3606 |         {
 | 
|---|
 | 3607 |                 return (_root <= r._root);
 | 
|---|
 | 3608 |         }
 | 
|---|
 | 3609 |         
 | 
|---|
 | 3610 |         bool xml_node::operator>=(const xml_node& r) const
 | 
|---|
 | 3611 |         {
 | 
|---|
 | 3612 |                 return (_root >= r._root);
 | 
|---|
 | 3613 |         }
 | 
|---|
 | 3614 | 
 | 
|---|
 | 3615 |         bool xml_node::empty() const
 | 
|---|
 | 3616 |         {
 | 
|---|
 | 3617 |                 return !_root;
 | 
|---|
 | 3618 |         }
 | 
|---|
 | 3619 |         
 | 
|---|
 | 3620 |         const char_t* xml_node::name() const
 | 
|---|
 | 3621 |         {
 | 
|---|
 | 3622 |                 return (_root && _root->name) ? _root->name : PUGIXML_TEXT("");
 | 
|---|
 | 3623 |         }
 | 
|---|
 | 3624 | 
 | 
|---|
 | 3625 |         xml_node_type xml_node::type() const
 | 
|---|
 | 3626 |         {
 | 
|---|
 | 3627 |                 return _root ? static_cast<xml_node_type>((_root->header & xml_memory_page_type_mask) + 1) : node_null;
 | 
|---|
 | 3628 |         }
 | 
|---|
 | 3629 |         
 | 
|---|
 | 3630 |         const char_t* xml_node::value() const
 | 
|---|
 | 3631 |         {
 | 
|---|
 | 3632 |                 return (_root && _root->value) ? _root->value : PUGIXML_TEXT("");
 | 
|---|
 | 3633 |         }
 | 
|---|
 | 3634 |         
 | 
|---|
 | 3635 |         xml_node xml_node::child(const char_t* name) const
 | 
|---|
 | 3636 |         {
 | 
|---|
 | 3637 |                 if (!_root) return xml_node();
 | 
|---|
 | 3638 | 
 | 
|---|
 | 3639 |                 for (xml_node_struct* i = _root->first_child; i; i = i->next_sibling)
 | 
|---|
 | 3640 |                         if (i->name && strequal(name, i->name)) return xml_node(i);
 | 
|---|
 | 3641 | 
 | 
|---|
 | 3642 |                 return xml_node();
 | 
|---|
 | 3643 |         }
 | 
|---|
 | 3644 | 
 | 
|---|
 | 3645 |         xml_attribute xml_node::attribute(const char_t* name) const
 | 
|---|
 | 3646 |         {
 | 
|---|
 | 3647 |                 if (!_root) return xml_attribute();
 | 
|---|
 | 3648 | 
 | 
|---|
 | 3649 |                 for (xml_attribute_struct* i = _root->first_attribute; i; i = i->next_attribute)
 | 
|---|
 | 3650 |                         if (i->name && strequal(name, i->name))
 | 
|---|
 | 3651 |                                 return xml_attribute(i);
 | 
|---|
 | 3652 |                 
 | 
|---|
 | 3653 |                 return xml_attribute();
 | 
|---|
 | 3654 |         }
 | 
|---|
 | 3655 |         
 | 
|---|
 | 3656 |         xml_node xml_node::next_sibling(const char_t* name) const
 | 
|---|
 | 3657 |         {
 | 
|---|
 | 3658 |                 if (!_root) return xml_node();
 | 
|---|
 | 3659 |                 
 | 
|---|
 | 3660 |                 for (xml_node_struct* i = _root->next_sibling; i; i = i->next_sibling)
 | 
|---|
 | 3661 |                         if (i->name && strequal(name, i->name)) return xml_node(i);
 | 
|---|
 | 3662 | 
 | 
|---|
 | 3663 |                 return xml_node();
 | 
|---|
 | 3664 |         }
 | 
|---|
 | 3665 | 
 | 
|---|
 | 3666 |         xml_node xml_node::next_sibling() const
 | 
|---|
 | 3667 |         {
 | 
|---|
 | 3668 |                 if (!_root) return xml_node();
 | 
|---|
 | 3669 |                 
 | 
|---|
 | 3670 |                 if (_root->next_sibling) return xml_node(_root->next_sibling);
 | 
|---|
 | 3671 |                 else return xml_node();
 | 
|---|
 | 3672 |         }
 | 
|---|
 | 3673 | 
 | 
|---|
 | 3674 |         xml_node xml_node::previous_sibling(const char_t* name) const
 | 
|---|
 | 3675 |         {
 | 
|---|
 | 3676 |                 if (!_root) return xml_node();
 | 
|---|
 | 3677 |                 
 | 
|---|
 | 3678 |                 for (xml_node_struct* i = _root->prev_sibling_c; i->next_sibling; i = i->prev_sibling_c)
 | 
|---|
 | 3679 |                         if (i->name && strequal(name, i->name)) return xml_node(i);
 | 
|---|
 | 3680 | 
 | 
|---|
 | 3681 |                 return xml_node();
 | 
|---|
 | 3682 |         }
 | 
|---|
 | 3683 | 
 | 
|---|
 | 3684 |         xml_node xml_node::previous_sibling() const
 | 
|---|
 | 3685 |         {
 | 
|---|
 | 3686 |                 if (!_root) return xml_node();
 | 
|---|
 | 3687 |                 
 | 
|---|
 | 3688 |                 if (_root->prev_sibling_c->next_sibling) return xml_node(_root->prev_sibling_c);
 | 
|---|
 | 3689 |                 else return xml_node();
 | 
|---|
 | 3690 |         }
 | 
|---|
 | 3691 | 
 | 
|---|
 | 3692 |         xml_node xml_node::parent() const
 | 
|---|
 | 3693 |         {
 | 
|---|
 | 3694 |                 return _root ? xml_node(_root->parent) : xml_node();
 | 
|---|
 | 3695 |         }
 | 
|---|
 | 3696 | 
 | 
|---|
 | 3697 |         xml_node xml_node::root() const
 | 
|---|
 | 3698 |         {
 | 
|---|
 | 3699 |                 if (!_root) return xml_node();
 | 
|---|
 | 3700 | 
 | 
|---|
 | 3701 |                 xml_memory_page* page = reinterpret_cast<xml_memory_page*>(_root->header & xml_memory_page_pointer_mask);
 | 
|---|
 | 3702 | 
 | 
|---|
 | 3703 |                 return xml_node(static_cast<xml_document_struct*>(page->allocator));
 | 
|---|
 | 3704 |         }
 | 
|---|
 | 3705 | 
 | 
|---|
 | 3706 |         const char_t* xml_node::child_value() const
 | 
|---|
 | 3707 |         {
 | 
|---|
 | 3708 |                 if (!_root) return PUGIXML_TEXT("");
 | 
|---|
 | 3709 |                 
 | 
|---|
 | 3710 |                 for (xml_node_struct* i = _root->first_child; i; i = i->next_sibling)
 | 
|---|
 | 3711 |                 {
 | 
|---|
 | 3712 |                         xml_node_type type = static_cast<xml_node_type>((i->header & xml_memory_page_type_mask) + 1);
 | 
|---|
 | 3713 | 
 | 
|---|
 | 3714 |                         if (i->value && (type == node_pcdata || type == node_cdata))
 | 
|---|
 | 3715 |                                 return i->value;
 | 
|---|
 | 3716 |                 }
 | 
|---|
 | 3717 | 
 | 
|---|
 | 3718 |                 return PUGIXML_TEXT("");
 | 
|---|
 | 3719 |         }
 | 
|---|
 | 3720 | 
 | 
|---|
 | 3721 |         const char_t* xml_node::child_value(const char_t* name) const
 | 
|---|
 | 3722 |         {
 | 
|---|
 | 3723 |                 return child(name).child_value();
 | 
|---|
 | 3724 |         }
 | 
|---|
 | 3725 | 
 | 
|---|
 | 3726 |         xml_attribute xml_node::first_attribute() const
 | 
|---|
 | 3727 |         {
 | 
|---|
 | 3728 |                 return _root ? xml_attribute(_root->first_attribute) : xml_attribute();
 | 
|---|
 | 3729 |         }
 | 
|---|
 | 3730 | 
 | 
|---|
 | 3731 |         xml_attribute xml_node::last_attribute() const
 | 
|---|
 | 3732 |         {
 | 
|---|
 | 3733 |                 return _root && _root->first_attribute ? xml_attribute(_root->first_attribute->prev_attribute_c) : xml_attribute();
 | 
|---|
 | 3734 |         }
 | 
|---|
 | 3735 | 
 | 
|---|
 | 3736 |         xml_node xml_node::first_child() const
 | 
|---|
 | 3737 |         {
 | 
|---|
 | 3738 |                 return _root ? xml_node(_root->first_child) : xml_node();
 | 
|---|
 | 3739 |         }
 | 
|---|
 | 3740 | 
 | 
|---|
 | 3741 |         xml_node xml_node::last_child() const
 | 
|---|
 | 3742 |         {
 | 
|---|
 | 3743 |                 return _root && _root->first_child ? xml_node(_root->first_child->prev_sibling_c) : xml_node();
 | 
|---|
 | 3744 |         }
 | 
|---|
 | 3745 | 
 | 
|---|
 | 3746 |         bool xml_node::set_name(const char_t* rhs)
 | 
|---|
 | 3747 |         {
 | 
|---|
 | 3748 |                 switch (type())
 | 
|---|
 | 3749 |                 {
 | 
|---|
 | 3750 |                 case node_pi:
 | 
|---|
 | 3751 |                 case node_declaration:
 | 
|---|
 | 3752 |                 case node_element:
 | 
|---|
 | 3753 |                         return strcpy_insitu(_root->name, _root->header, xml_memory_page_name_allocated_mask, rhs);
 | 
|---|
 | 3754 | 
 | 
|---|
 | 3755 |                 default:
 | 
|---|
 | 3756 |                         return false;
 | 
|---|
 | 3757 |                 }
 | 
|---|
 | 3758 |         }
 | 
|---|
 | 3759 |                 
 | 
|---|
 | 3760 |         bool xml_node::set_value(const char_t* rhs)
 | 
|---|
 | 3761 |         {
 | 
|---|
 | 3762 |                 switch (type())
 | 
|---|
 | 3763 |                 {
 | 
|---|
 | 3764 |                 case node_pi:
 | 
|---|
 | 3765 |                 case node_cdata:
 | 
|---|
 | 3766 |                 case node_pcdata:
 | 
|---|
 | 3767 |                 case node_comment:
 | 
|---|
 | 3768 |         case node_doctype:
 | 
|---|
 | 3769 |                         return strcpy_insitu(_root->value, _root->header, xml_memory_page_value_allocated_mask, rhs);
 | 
|---|
 | 3770 | 
 | 
|---|
 | 3771 |                 default:
 | 
|---|
 | 3772 |                         return false;
 | 
|---|
 | 3773 |                 }
 | 
|---|
 | 3774 |         }
 | 
|---|
 | 3775 | 
 | 
|---|
 | 3776 |         xml_attribute xml_node::append_attribute(const char_t* name)
 | 
|---|
 | 3777 |         {
 | 
|---|
 | 3778 |                 if (type() != node_element && type() != node_declaration) return xml_attribute();
 | 
|---|
 | 3779 |                 
 | 
|---|
 | 3780 |                 xml_attribute a(append_attribute_ll(_root, get_allocator(_root)));
 | 
|---|
 | 3781 |                 a.set_name(name);
 | 
|---|
 | 3782 |                 
 | 
|---|
 | 3783 |                 return a;
 | 
|---|
 | 3784 |         }
 | 
|---|
 | 3785 | 
 | 
|---|
 | 3786 |         xml_attribute xml_node::prepend_attribute(const char_t* name)
 | 
|---|
 | 3787 |         {
 | 
|---|
 | 3788 |                 if (type() != node_element && type() != node_declaration) return xml_attribute();
 | 
|---|
 | 3789 |                 
 | 
|---|
 | 3790 |                 xml_attribute a(allocate_attribute(get_allocator(_root)));
 | 
|---|
 | 3791 |                 if (!a) return xml_attribute();
 | 
|---|
 | 3792 | 
 | 
|---|
 | 3793 |                 a.set_name(name);
 | 
|---|
 | 3794 |                 
 | 
|---|
 | 3795 |         xml_attribute_struct* head = _root->first_attribute;
 | 
|---|
 | 3796 | 
 | 
|---|
 | 3797 |                 if (head)
 | 
|---|
 | 3798 |         {
 | 
|---|
 | 3799 |             a._attr->prev_attribute_c = head->prev_attribute_c;
 | 
|---|
 | 3800 |             head->prev_attribute_c = a._attr;
 | 
|---|
 | 3801 |         }
 | 
|---|
 | 3802 |         else
 | 
|---|
 | 3803 |             a._attr->prev_attribute_c = a._attr;
 | 
|---|
 | 3804 |                 
 | 
|---|
 | 3805 |                 a._attr->next_attribute = head;
 | 
|---|
 | 3806 |         _root->first_attribute = a._attr;
 | 
|---|
 | 3807 |                                 
 | 
|---|
 | 3808 |                 return a;
 | 
|---|
 | 3809 |         }
 | 
|---|
 | 3810 | 
 | 
|---|
 | 3811 |         xml_attribute xml_node::insert_attribute_before(const char_t* name, const xml_attribute& attr)
 | 
|---|
 | 3812 |         {
 | 
|---|
 | 3813 |                 if ((type() != node_element && type() != node_declaration) || attr.empty()) return xml_attribute();
 | 
|---|
 | 3814 |                 
 | 
|---|
 | 3815 |                 // check that attribute belongs to *this
 | 
|---|
 | 3816 |                 xml_attribute_struct* cur = attr._attr;
 | 
|---|
 | 3817 | 
 | 
|---|
 | 3818 |                 while (cur->prev_attribute_c->next_attribute) cur = cur->prev_attribute_c;
 | 
|---|
 | 3819 | 
 | 
|---|
 | 3820 |                 if (cur != _root->first_attribute) return xml_attribute();
 | 
|---|
 | 3821 | 
 | 
|---|
 | 3822 |                 xml_attribute a(allocate_attribute(get_allocator(_root)));
 | 
|---|
 | 3823 |                 if (!a) return xml_attribute();
 | 
|---|
 | 3824 | 
 | 
|---|
 | 3825 |                 a.set_name(name);
 | 
|---|
 | 3826 | 
 | 
|---|
 | 3827 |                 if (attr._attr->prev_attribute_c->next_attribute)
 | 
|---|
 | 3828 |                         attr._attr->prev_attribute_c->next_attribute = a._attr;
 | 
|---|
 | 3829 |                 else
 | 
|---|
 | 3830 |                         _root->first_attribute = a._attr;
 | 
|---|
 | 3831 |                 
 | 
|---|
 | 3832 |                 a._attr->prev_attribute_c = attr._attr->prev_attribute_c;
 | 
|---|
 | 3833 |                 a._attr->next_attribute = attr._attr;
 | 
|---|
 | 3834 |                 attr._attr->prev_attribute_c = a._attr;
 | 
|---|
 | 3835 |                                 
 | 
|---|
 | 3836 |                 return a;
 | 
|---|
 | 3837 |         }
 | 
|---|
 | 3838 | 
 | 
|---|
 | 3839 |         xml_attribute xml_node::insert_attribute_after(const char_t* name, const xml_attribute& attr)
 | 
|---|
 | 3840 |         {
 | 
|---|
 | 3841 |                 if ((type() != node_element && type() != node_declaration) || attr.empty()) return xml_attribute();
 | 
|---|
 | 3842 |                 
 | 
|---|
 | 3843 |                 // check that attribute belongs to *this
 | 
|---|
 | 3844 |                 xml_attribute_struct* cur = attr._attr;
 | 
|---|
 | 3845 | 
 | 
|---|
 | 3846 |                 while (cur->prev_attribute_c->next_attribute) cur = cur->prev_attribute_c;
 | 
|---|
 | 3847 | 
 | 
|---|
 | 3848 |                 if (cur != _root->first_attribute) return xml_attribute();
 | 
|---|
 | 3849 | 
 | 
|---|
 | 3850 |                 xml_attribute a(allocate_attribute(get_allocator(_root)));
 | 
|---|
 | 3851 |                 if (!a) return xml_attribute();
 | 
|---|
 | 3852 | 
 | 
|---|
 | 3853 |                 a.set_name(name);
 | 
|---|
 | 3854 | 
 | 
|---|
 | 3855 |                 if (attr._attr->next_attribute)
 | 
|---|
 | 3856 |                         attr._attr->next_attribute->prev_attribute_c = a._attr;
 | 
|---|
 | 3857 |                 else
 | 
|---|
 | 3858 |                         _root->first_attribute->prev_attribute_c = a._attr;
 | 
|---|
 | 3859 |                 
 | 
|---|
 | 3860 |                 a._attr->next_attribute = attr._attr->next_attribute;
 | 
|---|
 | 3861 |                 a._attr->prev_attribute_c = attr._attr;
 | 
|---|
 | 3862 |                 attr._attr->next_attribute = a._attr;
 | 
|---|
 | 3863 | 
 | 
|---|
 | 3864 |                 return a;
 | 
|---|
 | 3865 |         }
 | 
|---|
 | 3866 | 
 | 
|---|
 | 3867 |         xml_attribute xml_node::append_copy(const xml_attribute& proto)
 | 
|---|
 | 3868 |         {
 | 
|---|
 | 3869 |                 if (!proto) return xml_attribute();
 | 
|---|
 | 3870 | 
 | 
|---|
 | 3871 |                 xml_attribute result = append_attribute(proto.name());
 | 
|---|
 | 3872 |                 result.set_value(proto.value());
 | 
|---|
 | 3873 | 
 | 
|---|
 | 3874 |                 return result;
 | 
|---|
 | 3875 |         }
 | 
|---|
 | 3876 | 
 | 
|---|
 | 3877 |         xml_attribute xml_node::prepend_copy(const xml_attribute& proto)
 | 
|---|
 | 3878 |         {
 | 
|---|
 | 3879 |                 if (!proto) return xml_attribute();
 | 
|---|
 | 3880 | 
 | 
|---|
 | 3881 |                 xml_attribute result = prepend_attribute(proto.name());
 | 
|---|
 | 3882 |                 result.set_value(proto.value());
 | 
|---|
 | 3883 | 
 | 
|---|
 | 3884 |                 return result;
 | 
|---|
 | 3885 |         }
 | 
|---|
 | 3886 | 
 | 
|---|
 | 3887 |         xml_attribute xml_node::insert_copy_after(const xml_attribute& proto, const xml_attribute& attr)
 | 
|---|
 | 3888 |         {
 | 
|---|
 | 3889 |                 if (!proto) return xml_attribute();
 | 
|---|
 | 3890 | 
 | 
|---|
 | 3891 |                 xml_attribute result = insert_attribute_after(proto.name(), attr);
 | 
|---|
 | 3892 |                 result.set_value(proto.value());
 | 
|---|
 | 3893 | 
 | 
|---|
 | 3894 |                 return result;
 | 
|---|
 | 3895 |         }
 | 
|---|
 | 3896 | 
 | 
|---|
 | 3897 |         xml_attribute xml_node::insert_copy_before(const xml_attribute& proto, const xml_attribute& attr)
 | 
|---|
 | 3898 |         {
 | 
|---|
 | 3899 |                 if (!proto) return xml_attribute();
 | 
|---|
 | 3900 | 
 | 
|---|
 | 3901 |                 xml_attribute result = insert_attribute_before(proto.name(), attr);
 | 
|---|
 | 3902 |                 result.set_value(proto.value());
 | 
|---|
 | 3903 | 
 | 
|---|
 | 3904 |                 return result;
 | 
|---|
 | 3905 |         }
 | 
|---|
 | 3906 | 
 | 
|---|
 | 3907 |         xml_node xml_node::append_child(xml_node_type type)
 | 
|---|
 | 3908 |         {
 | 
|---|
 | 3909 |                 if (!allow_insert_child(this->type(), type)) return xml_node();
 | 
|---|
 | 3910 |                 
 | 
|---|
 | 3911 |                 xml_node n(append_node(_root, get_allocator(_root), type));
 | 
|---|
 | 3912 | 
 | 
|---|
 | 3913 |                 if (type == node_declaration) n.set_name(PUGIXML_TEXT("xml"));
 | 
|---|
 | 3914 | 
 | 
|---|
 | 3915 |                 return n;
 | 
|---|
 | 3916 |         }
 | 
|---|
 | 3917 | 
 | 
|---|
 | 3918 |         xml_node xml_node::prepend_child(xml_node_type type)
 | 
|---|
 | 3919 |         {
 | 
|---|
 | 3920 |                 if (!allow_insert_child(this->type(), type)) return xml_node();
 | 
|---|
 | 3921 |                 
 | 
|---|
 | 3922 |                 xml_node n(allocate_node(get_allocator(_root), type));
 | 
|---|
 | 3923 |                 if (!n) return xml_node();
 | 
|---|
 | 3924 | 
 | 
|---|
 | 3925 |         n._root->parent = _root;
 | 
|---|
 | 3926 | 
 | 
|---|
 | 3927 |         xml_node_struct* head = _root->first_child;
 | 
|---|
 | 3928 | 
 | 
|---|
 | 3929 |                 if (head)
 | 
|---|
 | 3930 |         {
 | 
|---|
 | 3931 |             n._root->prev_sibling_c = head->prev_sibling_c;
 | 
|---|
 | 3932 |             head->prev_sibling_c = n._root;
 | 
|---|
 | 3933 |         }
 | 
|---|
 | 3934 |         else
 | 
|---|
 | 3935 |             n._root->prev_sibling_c = n._root;
 | 
|---|
 | 3936 |                 
 | 
|---|
 | 3937 |                 n._root->next_sibling = head;
 | 
|---|
 | 3938 |         _root->first_child = n._root;
 | 
|---|
 | 3939 |                                 
 | 
|---|
 | 3940 |                 if (type == node_declaration) n.set_name(PUGIXML_TEXT("xml"));
 | 
|---|
 | 3941 | 
 | 
|---|
 | 3942 |                 return n;
 | 
|---|
 | 3943 |         }
 | 
|---|
 | 3944 | 
 | 
|---|
 | 3945 |         xml_node xml_node::insert_child_before(xml_node_type type, const xml_node& node)
 | 
|---|
 | 3946 |         {
 | 
|---|
 | 3947 |                 if (!allow_insert_child(this->type(), type)) return xml_node();
 | 
|---|
 | 3948 |                 if (!node._root || node._root->parent != _root) return xml_node();
 | 
|---|
 | 3949 |         
 | 
|---|
 | 3950 |                 xml_node n(allocate_node(get_allocator(_root), type));
 | 
|---|
 | 3951 |                 if (!n) return xml_node();
 | 
|---|
 | 3952 | 
 | 
|---|
 | 3953 |                 n._root->parent = _root;
 | 
|---|
 | 3954 |                 
 | 
|---|
 | 3955 |                 if (node._root->prev_sibling_c->next_sibling)
 | 
|---|
 | 3956 |                         node._root->prev_sibling_c->next_sibling = n._root;
 | 
|---|
 | 3957 |                 else
 | 
|---|
 | 3958 |                         _root->first_child = n._root;
 | 
|---|
 | 3959 |                 
 | 
|---|
 | 3960 |                 n._root->prev_sibling_c = node._root->prev_sibling_c;
 | 
|---|
 | 3961 |                 n._root->next_sibling = node._root;
 | 
|---|
 | 3962 |                 node._root->prev_sibling_c = n._root;
 | 
|---|
 | 3963 | 
 | 
|---|
 | 3964 |                 if (type == node_declaration) n.set_name(PUGIXML_TEXT("xml"));
 | 
|---|
 | 3965 | 
 | 
|---|
 | 3966 |                 return n;
 | 
|---|
 | 3967 |         }
 | 
|---|
 | 3968 | 
 | 
|---|
 | 3969 |         xml_node xml_node::insert_child_after(xml_node_type type, const xml_node& node)
 | 
|---|
 | 3970 |         {
 | 
|---|
 | 3971 |                 if (!allow_insert_child(this->type(), type)) return xml_node();
 | 
|---|
 | 3972 |                 if (!node._root || node._root->parent != _root) return xml_node();
 | 
|---|
 | 3973 |         
 | 
|---|
 | 3974 |                 xml_node n(allocate_node(get_allocator(_root), type));
 | 
|---|
 | 3975 |                 if (!n) return xml_node();
 | 
|---|
 | 3976 | 
 | 
|---|
 | 3977 |                 n._root->parent = _root;
 | 
|---|
 | 3978 |         
 | 
|---|
 | 3979 |                 if (node._root->next_sibling)
 | 
|---|
 | 3980 |                         node._root->next_sibling->prev_sibling_c = n._root;
 | 
|---|
 | 3981 |                 else
 | 
|---|
 | 3982 |                         _root->first_child->prev_sibling_c = n._root;
 | 
|---|
 | 3983 |                 
 | 
|---|
 | 3984 |                 n._root->next_sibling = node._root->next_sibling;
 | 
|---|
 | 3985 |                 n._root->prev_sibling_c = node._root;
 | 
|---|
 | 3986 |                 node._root->next_sibling = n._root;
 | 
|---|
 | 3987 | 
 | 
|---|
 | 3988 |                 if (type == node_declaration) n.set_name(PUGIXML_TEXT("xml"));
 | 
|---|
 | 3989 | 
 | 
|---|
 | 3990 |                 return n;
 | 
|---|
 | 3991 |         }
 | 
|---|
 | 3992 | 
 | 
|---|
 | 3993 |     xml_node xml_node::append_child(const char_t* name)
 | 
|---|
 | 3994 |     {
 | 
|---|
 | 3995 |         xml_node result = append_child(node_element);
 | 
|---|
 | 3996 | 
 | 
|---|
 | 3997 |         result.set_name(name);
 | 
|---|
 | 3998 | 
 | 
|---|
 | 3999 |         return result;
 | 
|---|
 | 4000 |     }
 | 
|---|
 | 4001 | 
 | 
|---|
 | 4002 |     xml_node xml_node::prepend_child(const char_t* name)
 | 
|---|
 | 4003 |     {
 | 
|---|
 | 4004 |         xml_node result = prepend_child(node_element);
 | 
|---|
 | 4005 | 
 | 
|---|
 | 4006 |         result.set_name(name);
 | 
|---|
 | 4007 | 
 | 
|---|
 | 4008 |         return result;
 | 
|---|
 | 4009 |     }
 | 
|---|
 | 4010 | 
 | 
|---|
 | 4011 |     xml_node xml_node::insert_child_after(const char_t* name, const xml_node& node)
 | 
|---|
 | 4012 |     {
 | 
|---|
 | 4013 |         xml_node result = insert_child_after(node_element, node);
 | 
|---|
 | 4014 | 
 | 
|---|
 | 4015 |         result.set_name(name);
 | 
|---|
 | 4016 | 
 | 
|---|
 | 4017 |         return result;
 | 
|---|
 | 4018 |     }
 | 
|---|
 | 4019 | 
 | 
|---|
 | 4020 |     xml_node xml_node::insert_child_before(const char_t* name, const xml_node& node)
 | 
|---|
 | 4021 |     {
 | 
|---|
 | 4022 |         xml_node result = insert_child_before(node_element, node);
 | 
|---|
 | 4023 | 
 | 
|---|
 | 4024 |         result.set_name(name);
 | 
|---|
 | 4025 | 
 | 
|---|
 | 4026 |         return result;
 | 
|---|
 | 4027 |     }
 | 
|---|
 | 4028 | 
 | 
|---|
 | 4029 |         xml_node xml_node::append_copy(const xml_node& proto)
 | 
|---|
 | 4030 |         {
 | 
|---|
 | 4031 |                 xml_node result = append_child(proto.type());
 | 
|---|
 | 4032 | 
 | 
|---|
 | 4033 |                 if (result) recursive_copy_skip(result, proto, result);
 | 
|---|
 | 4034 | 
 | 
|---|
 | 4035 |                 return result;
 | 
|---|
 | 4036 |         }
 | 
|---|
 | 4037 | 
 | 
|---|
 | 4038 |         xml_node xml_node::prepend_copy(const xml_node& proto)
 | 
|---|
 | 4039 |         {
 | 
|---|
 | 4040 |                 xml_node result = prepend_child(proto.type());
 | 
|---|
 | 4041 | 
 | 
|---|
 | 4042 |                 if (result) recursive_copy_skip(result, proto, result);
 | 
|---|
 | 4043 | 
 | 
|---|
 | 4044 |                 return result;
 | 
|---|
 | 4045 |         }
 | 
|---|
 | 4046 | 
 | 
|---|
 | 4047 |         xml_node xml_node::insert_copy_after(const xml_node& proto, const xml_node& node)
 | 
|---|
 | 4048 |         {
 | 
|---|
 | 4049 |                 xml_node result = insert_child_after(proto.type(), node);
 | 
|---|
 | 4050 | 
 | 
|---|
 | 4051 |                 if (result) recursive_copy_skip(result, proto, result);
 | 
|---|
 | 4052 | 
 | 
|---|
 | 4053 |                 return result;
 | 
|---|
 | 4054 |         }
 | 
|---|
 | 4055 | 
 | 
|---|
 | 4056 |         xml_node xml_node::insert_copy_before(const xml_node& proto, const xml_node& node)
 | 
|---|
 | 4057 |         {
 | 
|---|
 | 4058 |                 xml_node result = insert_child_before(proto.type(), node);
 | 
|---|
 | 4059 | 
 | 
|---|
 | 4060 |                 if (result) recursive_copy_skip(result, proto, result);
 | 
|---|
 | 4061 | 
 | 
|---|
 | 4062 |                 return result;
 | 
|---|
 | 4063 |         }
 | 
|---|
 | 4064 | 
 | 
|---|
 | 4065 |         bool xml_node::remove_attribute(const char_t* name)
 | 
|---|
 | 4066 |         {
 | 
|---|
 | 4067 |                 return remove_attribute(attribute(name));
 | 
|---|
 | 4068 |         }
 | 
|---|
 | 4069 | 
 | 
|---|
 | 4070 |         bool xml_node::remove_attribute(const xml_attribute& a)
 | 
|---|
 | 4071 |         {
 | 
|---|
 | 4072 |                 if (!_root || !a._attr) return false;
 | 
|---|
 | 4073 | 
 | 
|---|
 | 4074 |                 // check that attribute belongs to *this
 | 
|---|
 | 4075 |                 xml_attribute_struct* attr = a._attr;
 | 
|---|
 | 4076 | 
 | 
|---|
 | 4077 |                 while (attr->prev_attribute_c->next_attribute) attr = attr->prev_attribute_c;
 | 
|---|
 | 4078 | 
 | 
|---|
 | 4079 |                 if (attr != _root->first_attribute) return false;
 | 
|---|
 | 4080 | 
 | 
|---|
 | 4081 |                 if (a._attr->next_attribute) a._attr->next_attribute->prev_attribute_c = a._attr->prev_attribute_c;
 | 
|---|
 | 4082 |                 else if (_root->first_attribute) _root->first_attribute->prev_attribute_c = a._attr->prev_attribute_c;
 | 
|---|
 | 4083 |                 
 | 
|---|
 | 4084 |                 if (a._attr->prev_attribute_c->next_attribute) a._attr->prev_attribute_c->next_attribute = a._attr->next_attribute;
 | 
|---|
 | 4085 |                 else _root->first_attribute = a._attr->next_attribute;
 | 
|---|
 | 4086 | 
 | 
|---|
 | 4087 |                 destroy_attribute(a._attr, get_allocator(_root));
 | 
|---|
 | 4088 | 
 | 
|---|
 | 4089 |                 return true;
 | 
|---|
 | 4090 |         }
 | 
|---|
 | 4091 | 
 | 
|---|
 | 4092 |         bool xml_node::remove_child(const char_t* name)
 | 
|---|
 | 4093 |         {
 | 
|---|
 | 4094 |                 return remove_child(child(name));
 | 
|---|
 | 4095 |         }
 | 
|---|
 | 4096 | 
 | 
|---|
 | 4097 |         bool xml_node::remove_child(const xml_node& n)
 | 
|---|
 | 4098 |         {
 | 
|---|
 | 4099 |                 if (!_root || !n._root || n._root->parent != _root) return false;
 | 
|---|
 | 4100 | 
 | 
|---|
 | 4101 |                 if (n._root->next_sibling) n._root->next_sibling->prev_sibling_c = n._root->prev_sibling_c;
 | 
|---|
 | 4102 |                 else if (_root->first_child) _root->first_child->prev_sibling_c = n._root->prev_sibling_c;
 | 
|---|
 | 4103 |                 
 | 
|---|
 | 4104 |                 if (n._root->prev_sibling_c->next_sibling) n._root->prev_sibling_c->next_sibling = n._root->next_sibling;
 | 
|---|
 | 4105 |                 else _root->first_child = n._root->next_sibling;
 | 
|---|
 | 4106 |         
 | 
|---|
 | 4107 |         destroy_node(n._root, get_allocator(_root));
 | 
|---|
 | 4108 | 
 | 
|---|
 | 4109 |                 return true;
 | 
|---|
 | 4110 |         }
 | 
|---|
 | 4111 | 
 | 
|---|
 | 4112 |         xml_node xml_node::find_child_by_attribute(const char_t* name, const char_t* attr_name, const char_t* attr_value) const
 | 
|---|
 | 4113 |         {
 | 
|---|
 | 4114 |                 if (!_root) return xml_node();
 | 
|---|
 | 4115 |                 
 | 
|---|
 | 4116 |                 for (xml_node_struct* i = _root->first_child; i; i = i->next_sibling)
 | 
|---|
 | 4117 |                         if (i->name && strequal(name, i->name))
 | 
|---|
 | 4118 |                         {
 | 
|---|
 | 4119 |                                 for (xml_attribute_struct* a = i->first_attribute; a; a = a->next_attribute)
 | 
|---|
 | 4120 |                                         if (strequal(attr_name, a->name) && strequal(attr_value, a->value))
 | 
|---|
 | 4121 |                                                 return xml_node(i);
 | 
|---|
 | 4122 |                         }
 | 
|---|
 | 4123 | 
 | 
|---|
 | 4124 |                 return xml_node();
 | 
|---|
 | 4125 |         }
 | 
|---|
 | 4126 | 
 | 
|---|
 | 4127 |         xml_node xml_node::find_child_by_attribute(const char_t* attr_name, const char_t* attr_value) const
 | 
|---|
 | 4128 |         {
 | 
|---|
 | 4129 |                 if (!_root) return xml_node();
 | 
|---|
 | 4130 |                 
 | 
|---|
 | 4131 |                 for (xml_node_struct* i = _root->first_child; i; i = i->next_sibling)
 | 
|---|
 | 4132 |                         for (xml_attribute_struct* a = i->first_attribute; a; a = a->next_attribute)
 | 
|---|
 | 4133 |                                 if (strequal(attr_name, a->name) && strequal(attr_value, a->value))
 | 
|---|
 | 4134 |                                         return xml_node(i);
 | 
|---|
 | 4135 | 
 | 
|---|
 | 4136 |                 return xml_node();
 | 
|---|
 | 4137 |         }
 | 
|---|
 | 4138 | 
 | 
|---|
 | 4139 | #ifndef PUGIXML_NO_STL
 | 
|---|
 | 4140 |         string_t xml_node::path(char_t delimiter) const
 | 
|---|
 | 4141 |         {
 | 
|---|
 | 4142 |                 string_t path;
 | 
|---|
 | 4143 | 
 | 
|---|
 | 4144 |                 xml_node cursor = *this; // Make a copy.
 | 
|---|
 | 4145 |                 
 | 
|---|
 | 4146 |                 path = cursor.name();
 | 
|---|
 | 4147 | 
 | 
|---|
 | 4148 |                 while (cursor.parent())
 | 
|---|
 | 4149 |                 {
 | 
|---|
 | 4150 |                         cursor = cursor.parent();
 | 
|---|
 | 4151 |                         
 | 
|---|
 | 4152 |                         string_t temp = cursor.name();
 | 
|---|
 | 4153 |                         temp += delimiter;
 | 
|---|
 | 4154 |                         temp += path;
 | 
|---|
 | 4155 |                         path.swap(temp);
 | 
|---|
 | 4156 |                 }
 | 
|---|
 | 4157 | 
 | 
|---|
 | 4158 |                 return path;
 | 
|---|
 | 4159 |         }
 | 
|---|
 | 4160 | #endif
 | 
|---|
 | 4161 | 
 | 
|---|
 | 4162 |         xml_node xml_node::first_element_by_path(const char_t* path, char_t delimiter) const
 | 
|---|
 | 4163 |         {
 | 
|---|
 | 4164 |                 xml_node found = *this; // Current search context.
 | 
|---|
 | 4165 | 
 | 
|---|
 | 4166 |                 if (!_root || !path || !path[0]) return found;
 | 
|---|
 | 4167 | 
 | 
|---|
 | 4168 |                 if (path[0] == delimiter)
 | 
|---|
 | 4169 |                 {
 | 
|---|
 | 4170 |                         // Absolute path; e.g. '/foo/bar'
 | 
|---|
 | 4171 |                         found = found.root();
 | 
|---|
 | 4172 |                         ++path;
 | 
|---|
 | 4173 |                 }
 | 
|---|
 | 4174 | 
 | 
|---|
 | 4175 |                 const char_t* path_segment = path;
 | 
|---|
 | 4176 | 
 | 
|---|
 | 4177 |                 while (*path_segment == delimiter) ++path_segment;
 | 
|---|
 | 4178 | 
 | 
|---|
 | 4179 |                 const char_t* path_segment_end = path_segment;
 | 
|---|
 | 4180 | 
 | 
|---|
 | 4181 |                 while (*path_segment_end && *path_segment_end != delimiter) ++path_segment_end;
 | 
|---|
 | 4182 | 
 | 
|---|
 | 4183 |                 if (path_segment == path_segment_end) return found;
 | 
|---|
 | 4184 | 
 | 
|---|
 | 4185 |                 const char_t* next_segment = path_segment_end;
 | 
|---|
 | 4186 | 
 | 
|---|
 | 4187 |                 while (*next_segment == delimiter) ++next_segment;
 | 
|---|
 | 4188 | 
 | 
|---|
 | 4189 |                 if (*path_segment == '.' && path_segment + 1 == path_segment_end)
 | 
|---|
 | 4190 |                         return found.first_element_by_path(next_segment, delimiter);
 | 
|---|
 | 4191 |                 else if (*path_segment == '.' && *(path_segment+1) == '.' && path_segment + 2 == path_segment_end)
 | 
|---|
 | 4192 |                         return found.parent().first_element_by_path(next_segment, delimiter);
 | 
|---|
 | 4193 |                 else
 | 
|---|
 | 4194 |                 {
 | 
|---|
 | 4195 |                         for (xml_node_struct* j = found._root->first_child; j; j = j->next_sibling)
 | 
|---|
 | 4196 |                         {
 | 
|---|
 | 4197 |                                 if (j->name && strequalrange(j->name, path_segment, static_cast<size_t>(path_segment_end - path_segment)))
 | 
|---|
 | 4198 |                                 {
 | 
|---|
 | 4199 |                                         xml_node subsearch = xml_node(j).first_element_by_path(next_segment, delimiter);
 | 
|---|
 | 4200 | 
 | 
|---|
 | 4201 |                                         if (subsearch) return subsearch;
 | 
|---|
 | 4202 |                                 }
 | 
|---|
 | 4203 |                         }
 | 
|---|
 | 4204 | 
 | 
|---|
 | 4205 |                         return xml_node();
 | 
|---|
 | 4206 |                 }
 | 
|---|
 | 4207 |         }
 | 
|---|
 | 4208 | 
 | 
|---|
 | 4209 |         bool xml_node::traverse(xml_tree_walker& walker)
 | 
|---|
 | 4210 |         {
 | 
|---|
 | 4211 |                 walker._depth = -1;
 | 
|---|
 | 4212 |                 
 | 
|---|
 | 4213 |                 xml_node arg_begin = *this;
 | 
|---|
 | 4214 |                 if (!walker.begin(arg_begin)) return false;
 | 
|---|
 | 4215 | 
 | 
|---|
 | 4216 |                 xml_node cur = first_child();
 | 
|---|
 | 4217 |                                 
 | 
|---|
 | 4218 |                 if (cur)
 | 
|---|
 | 4219 |                 {
 | 
|---|
 | 4220 |                         ++walker._depth;
 | 
|---|
 | 4221 | 
 | 
|---|
 | 4222 |                         do 
 | 
|---|
 | 4223 |                         {
 | 
|---|
 | 4224 |                                 xml_node arg_for_each = cur;
 | 
|---|
 | 4225 |                                 if (!walker.for_each(arg_for_each))
 | 
|---|
 | 4226 |                                         return false;
 | 
|---|
 | 4227 |                                                 
 | 
|---|
 | 4228 |                                 if (cur.first_child())
 | 
|---|
 | 4229 |                                 {
 | 
|---|
 | 4230 |                                         ++walker._depth;
 | 
|---|
 | 4231 |                                         cur = cur.first_child();
 | 
|---|
 | 4232 |                                 }
 | 
|---|
 | 4233 |                                 else if (cur.next_sibling())
 | 
|---|
 | 4234 |                                         cur = cur.next_sibling();
 | 
|---|
 | 4235 |                                 else
 | 
|---|
 | 4236 |                                 {
 | 
|---|
 | 4237 |                                         // Borland C++ workaround
 | 
|---|
 | 4238 |                                         while (!cur.next_sibling() && cur != *this && (bool)cur.parent())
 | 
|---|
 | 4239 |                                         {
 | 
|---|
 | 4240 |                                                 --walker._depth;
 | 
|---|
 | 4241 |                                                 cur = cur.parent();
 | 
|---|
 | 4242 |                                         }
 | 
|---|
 | 4243 |                                                 
 | 
|---|
 | 4244 |                                         if (cur != *this)
 | 
|---|
 | 4245 |                                                 cur = cur.next_sibling();
 | 
|---|
 | 4246 |                                 }
 | 
|---|
 | 4247 |                         }
 | 
|---|
 | 4248 |                         while (cur && cur != *this);
 | 
|---|
 | 4249 |                 }
 | 
|---|
 | 4250 | 
 | 
|---|
 | 4251 |                 assert(walker._depth == -1);
 | 
|---|
 | 4252 | 
 | 
|---|
 | 4253 |                 xml_node arg_end = *this;
 | 
|---|
 | 4254 |                 return walker.end(arg_end);
 | 
|---|
 | 4255 |         }
 | 
|---|
 | 4256 | 
 | 
|---|
 | 4257 |     size_t xml_node::hash_value() const
 | 
|---|
 | 4258 |     {
 | 
|---|
 | 4259 |         return static_cast<size_t>(reinterpret_cast<uintptr_t>(_root) / sizeof(xml_node_struct));
 | 
|---|
 | 4260 |     }
 | 
|---|
 | 4261 | 
 | 
|---|
 | 4262 |         xml_node_struct* xml_node::internal_object() const
 | 
|---|
 | 4263 |         {
 | 
|---|
 | 4264 |         return _root;
 | 
|---|
 | 4265 |         }
 | 
|---|
 | 4266 | 
 | 
|---|
 | 4267 |         void xml_node::print(xml_writer& writer, const char_t* indent, unsigned int flags, xml_encoding encoding, unsigned int depth) const
 | 
|---|
 | 4268 |         {
 | 
|---|
 | 4269 |                 if (!_root) return;
 | 
|---|
 | 4270 | 
 | 
|---|
 | 4271 |                 xml_buffered_writer buffered_writer(writer, encoding);
 | 
|---|
 | 4272 | 
 | 
|---|
 | 4273 |                 node_output(buffered_writer, *this, indent, flags, depth);
 | 
|---|
 | 4274 |         }
 | 
|---|
 | 4275 | 
 | 
|---|
 | 4276 | #ifndef PUGIXML_NO_STL
 | 
|---|
 | 4277 |         void xml_node::print(std::basic_ostream<char, std::char_traits<char> >& stream, const char_t* indent, unsigned int flags, xml_encoding encoding, unsigned int depth) const
 | 
|---|
 | 4278 |         {
 | 
|---|
 | 4279 |                 xml_writer_stream writer(stream);
 | 
|---|
 | 4280 | 
 | 
|---|
 | 4281 |                 print(writer, indent, flags, encoding, depth);
 | 
|---|
 | 4282 |         }
 | 
|---|
 | 4283 | 
 | 
|---|
 | 4284 |         void xml_node::print(std::basic_ostream<wchar_t, std::char_traits<wchar_t> >& stream, const char_t* indent, unsigned int flags, unsigned int depth) const
 | 
|---|
 | 4285 |         {
 | 
|---|
 | 4286 |                 xml_writer_stream writer(stream);
 | 
|---|
 | 4287 | 
 | 
|---|
 | 4288 |                 print(writer, indent, flags, encoding_wchar, depth);
 | 
|---|
 | 4289 |         }
 | 
|---|
 | 4290 | #endif
 | 
|---|
 | 4291 | 
 | 
|---|
 | 4292 |         ptrdiff_t xml_node::offset_debug() const
 | 
|---|
 | 4293 |         {
 | 
|---|
 | 4294 |                 xml_node_struct* r = root()._root;
 | 
|---|
 | 4295 | 
 | 
|---|
 | 4296 |                 if (!r) return -1;
 | 
|---|
 | 4297 | 
 | 
|---|
 | 4298 |                 const char_t* buffer = static_cast<xml_document_struct*>(r)->buffer;
 | 
|---|
 | 4299 | 
 | 
|---|
 | 4300 |                 if (!buffer) return -1;
 | 
|---|
 | 4301 | 
 | 
|---|
 | 4302 |                 switch (type())
 | 
|---|
 | 4303 |                 {
 | 
|---|
 | 4304 |                 case node_document:
 | 
|---|
 | 4305 |                         return 0;
 | 
|---|
 | 4306 | 
 | 
|---|
 | 4307 |                 case node_element:
 | 
|---|
 | 4308 |                 case node_declaration:
 | 
|---|
 | 4309 |                 case node_pi:
 | 
|---|
 | 4310 |                         return (_root->header & xml_memory_page_name_allocated_mask) ? -1 : _root->name - buffer;
 | 
|---|
 | 4311 | 
 | 
|---|
 | 4312 |                 case node_pcdata:
 | 
|---|
 | 4313 |                 case node_cdata:
 | 
|---|
 | 4314 |                 case node_comment:
 | 
|---|
 | 4315 |                 case node_doctype:
 | 
|---|
 | 4316 |                         return (_root->header & xml_memory_page_value_allocated_mask) ? -1 : _root->value - buffer;
 | 
|---|
 | 4317 | 
 | 
|---|
 | 4318 |                 default:
 | 
|---|
 | 4319 |                         return -1;
 | 
|---|
 | 4320 |                 }
 | 
|---|
 | 4321 |         }
 | 
|---|
 | 4322 | 
 | 
|---|
 | 4323 | #ifdef __BORLANDC__
 | 
|---|
 | 4324 |         bool operator&&(const xml_node& lhs, bool rhs)
 | 
|---|
 | 4325 |         {
 | 
|---|
 | 4326 |                 return (bool)lhs && rhs;
 | 
|---|
 | 4327 |         }
 | 
|---|
 | 4328 | 
 | 
|---|
 | 4329 |         bool operator||(const xml_node& lhs, bool rhs)
 | 
|---|
 | 4330 |         {
 | 
|---|
 | 4331 |                 return (bool)lhs || rhs;
 | 
|---|
 | 4332 |         }
 | 
|---|
 | 4333 | #endif
 | 
|---|
 | 4334 | 
 | 
|---|
 | 4335 |         xml_node_iterator::xml_node_iterator()
 | 
|---|
 | 4336 |         {
 | 
|---|
 | 4337 |         }
 | 
|---|
 | 4338 | 
 | 
|---|
 | 4339 |         xml_node_iterator::xml_node_iterator(const xml_node& node): _wrap(node), _parent(node.parent())
 | 
|---|
 | 4340 |         {
 | 
|---|
 | 4341 |         }
 | 
|---|
 | 4342 | 
 | 
|---|
 | 4343 |         xml_node_iterator::xml_node_iterator(xml_node_struct* ref, xml_node_struct* parent): _wrap(ref), _parent(parent)
 | 
|---|
 | 4344 |         {
 | 
|---|
 | 4345 |         }
 | 
|---|
 | 4346 | 
 | 
|---|
 | 4347 |         bool xml_node_iterator::operator==(const xml_node_iterator& rhs) const
 | 
|---|
 | 4348 |         {
 | 
|---|
 | 4349 |                 return _wrap._root == rhs._wrap._root && _parent._root == rhs._parent._root;
 | 
|---|
 | 4350 |         }
 | 
|---|
 | 4351 |         
 | 
|---|
 | 4352 |         bool xml_node_iterator::operator!=(const xml_node_iterator& rhs) const
 | 
|---|
 | 4353 |         {
 | 
|---|
 | 4354 |                 return _wrap._root != rhs._wrap._root || _parent._root != rhs._parent._root;
 | 
|---|
 | 4355 |         }
 | 
|---|
 | 4356 | 
 | 
|---|
 | 4357 |         xml_node& xml_node_iterator::operator*()
 | 
|---|
 | 4358 |         {
 | 
|---|
 | 4359 |                 assert(_wrap._root);
 | 
|---|
 | 4360 |                 return _wrap;
 | 
|---|
 | 4361 |         }
 | 
|---|
 | 4362 | 
 | 
|---|
 | 4363 |         xml_node* xml_node_iterator::operator->()
 | 
|---|
 | 4364 |         {
 | 
|---|
 | 4365 |                 assert(_wrap._root);
 | 
|---|
 | 4366 |                 return &_wrap;
 | 
|---|
 | 4367 |         }
 | 
|---|
 | 4368 | 
 | 
|---|
 | 4369 |         const xml_node_iterator& xml_node_iterator::operator++()
 | 
|---|
 | 4370 |         {
 | 
|---|
 | 4371 |                 assert(_wrap._root);
 | 
|---|
 | 4372 |                 _wrap._root = _wrap._root->next_sibling;
 | 
|---|
 | 4373 |                 return *this;
 | 
|---|
 | 4374 |         }
 | 
|---|
 | 4375 | 
 | 
|---|
 | 4376 |         xml_node_iterator xml_node_iterator::operator++(int)
 | 
|---|
 | 4377 |         {
 | 
|---|
 | 4378 |                 xml_node_iterator temp = *this;
 | 
|---|
 | 4379 |                 ++*this;
 | 
|---|
 | 4380 |                 return temp;
 | 
|---|
 | 4381 |         }
 | 
|---|
 | 4382 | 
 | 
|---|
 | 4383 |         const xml_node_iterator& xml_node_iterator::operator--()
 | 
|---|
 | 4384 |         {
 | 
|---|
 | 4385 |                 _wrap = _wrap._root ? _wrap.previous_sibling() : _parent.last_child();
 | 
|---|
 | 4386 |                 return *this;
 | 
|---|
 | 4387 |         }
 | 
|---|
 | 4388 | 
 | 
|---|
 | 4389 |         xml_node_iterator xml_node_iterator::operator--(int)
 | 
|---|
 | 4390 |         {
 | 
|---|
 | 4391 |                 xml_node_iterator temp = *this;
 | 
|---|
 | 4392 |                 --*this;
 | 
|---|
 | 4393 |                 return temp;
 | 
|---|
 | 4394 |         }
 | 
|---|
 | 4395 | 
 | 
|---|
 | 4396 |         xml_attribute_iterator::xml_attribute_iterator()
 | 
|---|
 | 4397 |         {
 | 
|---|
 | 4398 |         }
 | 
|---|
 | 4399 | 
 | 
|---|
 | 4400 |         xml_attribute_iterator::xml_attribute_iterator(const xml_attribute& attr, const xml_node& parent): _wrap(attr), _parent(parent)
 | 
|---|
 | 4401 |         {
 | 
|---|
 | 4402 |         }
 | 
|---|
 | 4403 | 
 | 
|---|
 | 4404 |         xml_attribute_iterator::xml_attribute_iterator(xml_attribute_struct* ref, xml_node_struct* parent): _wrap(ref), _parent(parent)
 | 
|---|
 | 4405 |         {
 | 
|---|
 | 4406 |         }
 | 
|---|
 | 4407 | 
 | 
|---|
 | 4408 |         bool xml_attribute_iterator::operator==(const xml_attribute_iterator& rhs) const
 | 
|---|
 | 4409 |         {
 | 
|---|
 | 4410 |                 return _wrap._attr == rhs._wrap._attr && _parent._root == rhs._parent._root;
 | 
|---|
 | 4411 |         }
 | 
|---|
 | 4412 |         
 | 
|---|
 | 4413 |         bool xml_attribute_iterator::operator!=(const xml_attribute_iterator& rhs) const
 | 
|---|
 | 4414 |         {
 | 
|---|
 | 4415 |                 return _wrap._attr != rhs._wrap._attr || _parent._root != rhs._parent._root;
 | 
|---|
 | 4416 |         }
 | 
|---|
 | 4417 | 
 | 
|---|
 | 4418 |         xml_attribute& xml_attribute_iterator::operator*()
 | 
|---|
 | 4419 |         {
 | 
|---|
 | 4420 |                 assert(_wrap._attr);
 | 
|---|
 | 4421 |                 return _wrap;
 | 
|---|
 | 4422 |         }
 | 
|---|
 | 4423 | 
 | 
|---|
 | 4424 |         xml_attribute* xml_attribute_iterator::operator->()
 | 
|---|
 | 4425 |         {
 | 
|---|
 | 4426 |                 assert(_wrap._attr);
 | 
|---|
 | 4427 |                 return &_wrap;
 | 
|---|
 | 4428 |         }
 | 
|---|
 | 4429 | 
 | 
|---|
 | 4430 |         const xml_attribute_iterator& xml_attribute_iterator::operator++()
 | 
|---|
 | 4431 |         {
 | 
|---|
 | 4432 |                 assert(_wrap._attr);
 | 
|---|
 | 4433 |                 _wrap._attr = _wrap._attr->next_attribute;
 | 
|---|
 | 4434 |                 return *this;
 | 
|---|
 | 4435 |         }
 | 
|---|
 | 4436 | 
 | 
|---|
 | 4437 |         xml_attribute_iterator xml_attribute_iterator::operator++(int)
 | 
|---|
 | 4438 |         {
 | 
|---|
 | 4439 |                 xml_attribute_iterator temp = *this;
 | 
|---|
 | 4440 |                 ++*this;
 | 
|---|
 | 4441 |                 return temp;
 | 
|---|
 | 4442 |         }
 | 
|---|
 | 4443 | 
 | 
|---|
 | 4444 |         const xml_attribute_iterator& xml_attribute_iterator::operator--()
 | 
|---|
 | 4445 |         {
 | 
|---|
 | 4446 |                 _wrap = _wrap._attr ? _wrap.previous_attribute() : _parent.last_attribute();
 | 
|---|
 | 4447 |                 return *this;
 | 
|---|
 | 4448 |         }
 | 
|---|
 | 4449 | 
 | 
|---|
 | 4450 |         xml_attribute_iterator xml_attribute_iterator::operator--(int)
 | 
|---|
 | 4451 |         {
 | 
|---|
 | 4452 |                 xml_attribute_iterator temp = *this;
 | 
|---|
 | 4453 |                 --*this;
 | 
|---|
 | 4454 |                 return temp;
 | 
|---|
 | 4455 |         }
 | 
|---|
 | 4456 | 
 | 
|---|
 | 4457 |     xml_parse_result::xml_parse_result(): status(status_internal_error), offset(0), encoding(encoding_auto)
 | 
|---|
 | 4458 |     {
 | 
|---|
 | 4459 |     }
 | 
|---|
 | 4460 | 
 | 
|---|
 | 4461 |     xml_parse_result::operator bool() const
 | 
|---|
 | 4462 |     {
 | 
|---|
 | 4463 |         return status == status_ok;
 | 
|---|
 | 4464 |     }
 | 
|---|
 | 4465 | 
 | 
|---|
 | 4466 |         const char* xml_parse_result::description() const
 | 
|---|
 | 4467 |         {
 | 
|---|
 | 4468 |                 switch (status)
 | 
|---|
 | 4469 |                 {
 | 
|---|
 | 4470 |                 case status_ok: return "No error";
 | 
|---|
 | 4471 | 
 | 
|---|
 | 4472 |                 case status_file_not_found: return "File was not found";
 | 
|---|
 | 4473 |                 case status_io_error: return "Error reading from file/stream";
 | 
|---|
 | 4474 |                 case status_out_of_memory: return "Could not allocate memory";
 | 
|---|
 | 4475 |                 case status_internal_error: return "Internal error occurred";
 | 
|---|
 | 4476 | 
 | 
|---|
 | 4477 |                 case status_unrecognized_tag: return "Could not determine tag type";
 | 
|---|
 | 4478 | 
 | 
|---|
 | 4479 |                 case status_bad_pi: return "Error parsing document declaration/processing instruction";
 | 
|---|
 | 4480 |                 case status_bad_comment: return "Error parsing comment";
 | 
|---|
 | 4481 |                 case status_bad_cdata: return "Error parsing CDATA section";
 | 
|---|
 | 4482 |                 case status_bad_doctype: return "Error parsing document type declaration";
 | 
|---|
 | 4483 |                 case status_bad_pcdata: return "Error parsing PCDATA section";
 | 
|---|
 | 4484 |                 case status_bad_start_element: return "Error parsing start element tag";
 | 
|---|
 | 4485 |                 case status_bad_attribute: return "Error parsing element attribute";
 | 
|---|
 | 4486 |                 case status_bad_end_element: return "Error parsing end element tag";
 | 
|---|
 | 4487 |                 case status_end_element_mismatch: return "Start-end tags mismatch";
 | 
|---|
 | 4488 | 
 | 
|---|
 | 4489 |                 default: return "Unknown error";
 | 
|---|
 | 4490 |                 }
 | 
|---|
 | 4491 |         }
 | 
|---|
 | 4492 | 
 | 
|---|
 | 4493 |         xml_document::xml_document(): _buffer(0)
 | 
|---|
 | 4494 |         {
 | 
|---|
 | 4495 |                 create();
 | 
|---|
 | 4496 |         }
 | 
|---|
 | 4497 | 
 | 
|---|
 | 4498 |         xml_document::~xml_document()
 | 
|---|
 | 4499 |         {
 | 
|---|
 | 4500 |                 destroy();
 | 
|---|
 | 4501 |         }
 | 
|---|
 | 4502 | 
 | 
|---|
 | 4503 |         void xml_document::reset()
 | 
|---|
 | 4504 |         {
 | 
|---|
 | 4505 |                 destroy();
 | 
|---|
 | 4506 |                 create();
 | 
|---|
 | 4507 |         }
 | 
|---|
 | 4508 | 
 | 
|---|
 | 4509 |     void xml_document::reset(const xml_document& proto)
 | 
|---|
 | 4510 |     {
 | 
|---|
 | 4511 |         reset();
 | 
|---|
 | 4512 | 
 | 
|---|
 | 4513 |         for (xml_node cur = proto.first_child(); cur; cur = cur.next_sibling())
 | 
|---|
 | 4514 |             append_copy(cur);
 | 
|---|
 | 4515 |     }
 | 
|---|
 | 4516 | 
 | 
|---|
 | 4517 |         void xml_document::create()
 | 
|---|
 | 4518 |         {
 | 
|---|
 | 4519 |                 // initialize sentinel page
 | 
|---|
 | 4520 |                 STATIC_ASSERT(offsetof(xml_memory_page, data) + sizeof(xml_document_struct) + xml_memory_page_alignment <= sizeof(_memory));
 | 
|---|
 | 4521 | 
 | 
|---|
 | 4522 |                 // align upwards to page boundary
 | 
|---|
 | 4523 |                 void* page_memory = reinterpret_cast<void*>((reinterpret_cast<uintptr_t>(_memory) + (xml_memory_page_alignment - 1)) & ~(xml_memory_page_alignment - 1));
 | 
|---|
 | 4524 | 
 | 
|---|
 | 4525 |                 // prepare page structure
 | 
|---|
 | 4526 |                 xml_memory_page* page = xml_memory_page::construct(page_memory);
 | 
|---|
 | 4527 | 
 | 
|---|
 | 4528 |                 page->busy_size = xml_memory_page_size;
 | 
|---|
 | 4529 | 
 | 
|---|
 | 4530 |                 // allocate new root
 | 
|---|
 | 4531 |                 _root = new (page->data) xml_document_struct(page);
 | 
|---|
 | 4532 |                 _root->prev_sibling_c = _root;
 | 
|---|
 | 4533 | 
 | 
|---|
 | 4534 |                 // setup sentinel page
 | 
|---|
 | 4535 |                 page->allocator = static_cast<xml_document_struct*>(_root);
 | 
|---|
 | 4536 |         }
 | 
|---|
 | 4537 | 
 | 
|---|
 | 4538 |         void xml_document::destroy()
 | 
|---|
 | 4539 |         {
 | 
|---|
 | 4540 |                 // destroy static storage
 | 
|---|
 | 4541 |                 if (_buffer)
 | 
|---|
 | 4542 |                 {
 | 
|---|
 | 4543 |                         global_deallocate(_buffer);
 | 
|---|
 | 4544 |                         _buffer = 0;
 | 
|---|
 | 4545 |                 }
 | 
|---|
 | 4546 | 
 | 
|---|
 | 4547 |                 // destroy dynamic storage, leave sentinel page (it's in static memory)
 | 
|---|
 | 4548 |                 if (_root)
 | 
|---|
 | 4549 |                 {
 | 
|---|
 | 4550 |                         xml_memory_page* root_page = reinterpret_cast<xml_memory_page*>(_root->header & xml_memory_page_pointer_mask);
 | 
|---|
 | 4551 |                         assert(root_page && !root_page->prev && !root_page->memory);
 | 
|---|
 | 4552 | 
 | 
|---|
 | 4553 |                         // destroy all pages
 | 
|---|
 | 4554 |                         for (xml_memory_page* page = root_page->next; page; )
 | 
|---|
 | 4555 |                         {
 | 
|---|
 | 4556 |                                 xml_memory_page* next = page->next;
 | 
|---|
 | 4557 | 
 | 
|---|
 | 4558 |                                 xml_allocator::deallocate_page(page);
 | 
|---|
 | 4559 | 
 | 
|---|
 | 4560 |                                 page = next;
 | 
|---|
 | 4561 |                         }
 | 
|---|
 | 4562 | 
 | 
|---|
 | 4563 |                         // cleanup root page
 | 
|---|
 | 4564 |                         root_page->allocator = 0;
 | 
|---|
 | 4565 |                         root_page->next = 0;
 | 
|---|
 | 4566 |                         root_page->busy_size = root_page->freed_size = 0;
 | 
|---|
 | 4567 | 
 | 
|---|
 | 4568 |                         _root = 0;
 | 
|---|
 | 4569 |                 }
 | 
|---|
 | 4570 |         }
 | 
|---|
 | 4571 | 
 | 
|---|
 | 4572 | #ifndef PUGIXML_NO_STL
 | 
|---|
 | 4573 |         xml_parse_result xml_document::load(std::basic_istream<char, std::char_traits<char> >& stream, unsigned int options, xml_encoding encoding)
 | 
|---|
 | 4574 |         {
 | 
|---|
 | 4575 |                 reset();
 | 
|---|
 | 4576 | 
 | 
|---|
 | 4577 |                 return load_stream_impl(*this, stream, options, encoding);
 | 
|---|
 | 4578 |         }
 | 
|---|
 | 4579 | 
 | 
|---|
 | 4580 |         xml_parse_result xml_document::load(std::basic_istream<wchar_t, std::char_traits<wchar_t> >& stream, unsigned int options)
 | 
|---|
 | 4581 |         {
 | 
|---|
 | 4582 |                 reset();
 | 
|---|
 | 4583 | 
 | 
|---|
 | 4584 |                 return load_stream_impl(*this, stream, options, encoding_wchar);
 | 
|---|
 | 4585 |         }
 | 
|---|
 | 4586 | #endif
 | 
|---|
 | 4587 | 
 | 
|---|
 | 4588 |         xml_parse_result xml_document::load(const char_t* contents, unsigned int options)
 | 
|---|
 | 4589 |         {
 | 
|---|
 | 4590 |                 // Force native encoding (skip autodetection)
 | 
|---|
 | 4591 |         #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 4592 |                 xml_encoding encoding = encoding_wchar;
 | 
|---|
 | 4593 |         #else
 | 
|---|
 | 4594 |                 xml_encoding encoding = encoding_utf8;
 | 
|---|
 | 4595 |         #endif
 | 
|---|
 | 4596 | 
 | 
|---|
 | 4597 |                 return load_buffer(contents, strlength(contents) * sizeof(char_t), options, encoding);
 | 
|---|
 | 4598 |         }
 | 
|---|
 | 4599 | 
 | 
|---|
 | 4600 |         xml_parse_result xml_document::load_file(const char* path, unsigned int options, xml_encoding encoding)
 | 
|---|
 | 4601 |         {
 | 
|---|
 | 4602 |                 reset();
 | 
|---|
 | 4603 | 
 | 
|---|
 | 4604 |                 FILE* file = fopen(path, "rb");
 | 
|---|
 | 4605 | 
 | 
|---|
 | 4606 |                 return load_file_impl(*this, file, options, encoding);
 | 
|---|
 | 4607 |         }
 | 
|---|
 | 4608 | 
 | 
|---|
 | 4609 |         xml_parse_result xml_document::load_file(const wchar_t* path, unsigned int options, xml_encoding encoding)
 | 
|---|
 | 4610 |         {
 | 
|---|
 | 4611 |                 reset();
 | 
|---|
 | 4612 | 
 | 
|---|
 | 4613 |                 FILE* file = open_file_wide(path, L"rb");
 | 
|---|
 | 4614 | 
 | 
|---|
 | 4615 |                 return load_file_impl(*this, file, options, encoding);
 | 
|---|
 | 4616 |         }
 | 
|---|
 | 4617 | 
 | 
|---|
 | 4618 |         xml_parse_result xml_document::load_buffer_impl(void* contents, size_t size, unsigned int options, xml_encoding encoding, bool is_mutable, bool own)
 | 
|---|
 | 4619 |         {
 | 
|---|
 | 4620 |                 reset();
 | 
|---|
 | 4621 | 
 | 
|---|
 | 4622 |                 // check input buffer
 | 
|---|
 | 4623 |                 assert(contents || size == 0);
 | 
|---|
 | 4624 | 
 | 
|---|
 | 4625 |                 // get actual encoding
 | 
|---|
 | 4626 |                 xml_encoding buffer_encoding = get_buffer_encoding(encoding, contents, size);
 | 
|---|
 | 4627 | 
 | 
|---|
 | 4628 |                 // get private buffer
 | 
|---|
 | 4629 |                 char_t* buffer = 0;
 | 
|---|
 | 4630 |                 size_t length = 0;
 | 
|---|
 | 4631 | 
 | 
|---|
 | 4632 |                 if (!convert_buffer(buffer, length, buffer_encoding, contents, size, is_mutable)) return make_parse_result(status_out_of_memory);
 | 
|---|
 | 4633 |                 
 | 
|---|
 | 4634 |                 // delete original buffer if we performed a conversion
 | 
|---|
 | 4635 |                 if (own && buffer != contents && contents) global_deallocate(contents);
 | 
|---|
 | 4636 | 
 | 
|---|
 | 4637 |                 // parse
 | 
|---|
 | 4638 |                 xml_parse_result res = xml_parser::parse(buffer, length, _root, options);
 | 
|---|
 | 4639 | 
 | 
|---|
 | 4640 |                 // remember encoding
 | 
|---|
 | 4641 |                 res.encoding = buffer_encoding;
 | 
|---|
 | 4642 | 
 | 
|---|
 | 4643 |                 // grab onto buffer if it's our buffer, user is responsible for deallocating contens himself
 | 
|---|
 | 4644 |                 if (own || buffer != contents) _buffer = buffer;
 | 
|---|
 | 4645 | 
 | 
|---|
 | 4646 |                 return res;
 | 
|---|
 | 4647 |         }
 | 
|---|
 | 4648 | 
 | 
|---|
 | 4649 |         xml_parse_result xml_document::load_buffer(const void* contents, size_t size, unsigned int options, xml_encoding encoding)
 | 
|---|
 | 4650 |         {
 | 
|---|
 | 4651 |                 return load_buffer_impl(const_cast<void*>(contents), size, options, encoding, false, false);
 | 
|---|
 | 4652 |         }
 | 
|---|
 | 4653 | 
 | 
|---|
 | 4654 |         xml_parse_result xml_document::load_buffer_inplace(void* contents, size_t size, unsigned int options, xml_encoding encoding)
 | 
|---|
 | 4655 |         {
 | 
|---|
 | 4656 |                 return load_buffer_impl(contents, size, options, encoding, true, false);
 | 
|---|
 | 4657 |         }
 | 
|---|
 | 4658 |                 
 | 
|---|
 | 4659 |         xml_parse_result xml_document::load_buffer_inplace_own(void* contents, size_t size, unsigned int options, xml_encoding encoding)
 | 
|---|
 | 4660 |         {
 | 
|---|
 | 4661 |                 return load_buffer_impl(contents, size, options, encoding, true, true);
 | 
|---|
 | 4662 |         }
 | 
|---|
 | 4663 | 
 | 
|---|
 | 4664 |         void xml_document::save(xml_writer& writer, const char_t* indent, unsigned int flags, xml_encoding encoding) const
 | 
|---|
 | 4665 |         {
 | 
|---|
 | 4666 |                 if (flags & format_write_bom) write_bom(writer, get_write_encoding(encoding));
 | 
|---|
 | 4667 | 
 | 
|---|
 | 4668 |                 xml_buffered_writer buffered_writer(writer, encoding);
 | 
|---|
 | 4669 | 
 | 
|---|
 | 4670 |                 if (!(flags & format_no_declaration) && !has_declaration(*this))
 | 
|---|
 | 4671 |                 {
 | 
|---|
 | 4672 |                         buffered_writer.write(PUGIXML_TEXT("<?xml version=\"1.0\"?>"));
 | 
|---|
 | 4673 |                         if (!(flags & format_raw)) buffered_writer.write('\n');
 | 
|---|
 | 4674 |                 }
 | 
|---|
 | 4675 | 
 | 
|---|
 | 4676 |                 node_output(buffered_writer, *this, indent, flags, 0);
 | 
|---|
 | 4677 |         }
 | 
|---|
 | 4678 | 
 | 
|---|
 | 4679 | #ifndef PUGIXML_NO_STL
 | 
|---|
 | 4680 |         void xml_document::save(std::basic_ostream<char, std::char_traits<char> >& stream, const char_t* indent, unsigned int flags, xml_encoding encoding) const
 | 
|---|
 | 4681 |         {
 | 
|---|
 | 4682 |                 xml_writer_stream writer(stream);
 | 
|---|
 | 4683 | 
 | 
|---|
 | 4684 |                 save(writer, indent, flags, encoding);
 | 
|---|
 | 4685 |         }
 | 
|---|
 | 4686 | 
 | 
|---|
 | 4687 |         void xml_document::save(std::basic_ostream<wchar_t, std::char_traits<wchar_t> >& stream, const char_t* indent, unsigned int flags) const
 | 
|---|
 | 4688 |         {
 | 
|---|
 | 4689 |                 xml_writer_stream writer(stream);
 | 
|---|
 | 4690 | 
 | 
|---|
 | 4691 |                 save(writer, indent, flags, encoding_wchar);
 | 
|---|
 | 4692 |         }
 | 
|---|
 | 4693 | #endif
 | 
|---|
 | 4694 | 
 | 
|---|
 | 4695 |         bool xml_document::save_file(const char* path, const char_t* indent, unsigned int flags, xml_encoding encoding) const
 | 
|---|
 | 4696 |         {
 | 
|---|
 | 4697 |                 FILE* file = fopen(path, "wb");
 | 
|---|
 | 4698 |                 if (!file) return false;
 | 
|---|
 | 4699 | 
 | 
|---|
 | 4700 |                 xml_writer_file writer(file);
 | 
|---|
 | 4701 |                 save(writer, indent, flags, encoding);
 | 
|---|
 | 4702 | 
 | 
|---|
 | 4703 |                 fclose(file);
 | 
|---|
 | 4704 | 
 | 
|---|
 | 4705 |                 return true;
 | 
|---|
 | 4706 |         }
 | 
|---|
 | 4707 | 
 | 
|---|
 | 4708 |         bool xml_document::save_file(const wchar_t* path, const char_t* indent, unsigned int flags, xml_encoding encoding) const
 | 
|---|
 | 4709 |         {
 | 
|---|
 | 4710 |                 FILE* file = open_file_wide(path, L"wb");
 | 
|---|
 | 4711 |                 if (!file) return false;
 | 
|---|
 | 4712 | 
 | 
|---|
 | 4713 |                 xml_writer_file writer(file);
 | 
|---|
 | 4714 |                 save(writer, indent, flags, encoding);
 | 
|---|
 | 4715 | 
 | 
|---|
 | 4716 |                 fclose(file);
 | 
|---|
 | 4717 | 
 | 
|---|
 | 4718 |                 return true;
 | 
|---|
 | 4719 |         }
 | 
|---|
 | 4720 | 
 | 
|---|
 | 4721 |     xml_node xml_document::document_element() const
 | 
|---|
 | 4722 |     {
 | 
|---|
 | 4723 |                 for (xml_node_struct* i = _root->first_child; i; i = i->next_sibling)
 | 
|---|
 | 4724 |                         if ((i->header & xml_memory_page_type_mask) + 1 == node_element)
 | 
|---|
 | 4725 |                 return xml_node(i);
 | 
|---|
 | 4726 | 
 | 
|---|
 | 4727 |         return xml_node();
 | 
|---|
 | 4728 |     }
 | 
|---|
 | 4729 | 
 | 
|---|
 | 4730 | #ifndef PUGIXML_NO_STL
 | 
|---|
 | 4731 |         std::string PUGIXML_FUNCTION as_utf8(const wchar_t* str)
 | 
|---|
 | 4732 |         {
 | 
|---|
 | 4733 |                 assert(str);
 | 
|---|
 | 4734 | 
 | 
|---|
 | 4735 |         return as_utf8_impl(str, wcslen(str));
 | 
|---|
 | 4736 |         }
 | 
|---|
 | 4737 | 
 | 
|---|
 | 4738 |         std::string PUGIXML_FUNCTION as_utf8(const std::wstring& str)
 | 
|---|
 | 4739 |         {
 | 
|---|
 | 4740 |         return as_utf8_impl(str.c_str(), str.size());
 | 
|---|
 | 4741 |         }
 | 
|---|
 | 4742 |         
 | 
|---|
 | 4743 |         std::wstring PUGIXML_FUNCTION as_wide(const char* str)
 | 
|---|
 | 4744 |         {
 | 
|---|
 | 4745 |                 assert(str);
 | 
|---|
 | 4746 | 
 | 
|---|
 | 4747 |         return as_wide_impl(str, strlen(str));
 | 
|---|
 | 4748 |         }
 | 
|---|
 | 4749 |         
 | 
|---|
 | 4750 |         std::wstring PUGIXML_FUNCTION as_wide(const std::string& str)
 | 
|---|
 | 4751 |         {
 | 
|---|
 | 4752 |         return as_wide_impl(str.c_str(), str.size());
 | 
|---|
 | 4753 |         }
 | 
|---|
 | 4754 | #endif
 | 
|---|
 | 4755 | 
 | 
|---|
 | 4756 |     void PUGIXML_FUNCTION set_memory_management_functions(allocation_function allocate, deallocation_function deallocate)
 | 
|---|
 | 4757 |     {
 | 
|---|
 | 4758 |         global_allocate = allocate;
 | 
|---|
 | 4759 |         global_deallocate = deallocate;
 | 
|---|
 | 4760 |     }
 | 
|---|
 | 4761 | 
 | 
|---|
 | 4762 |     allocation_function PUGIXML_FUNCTION get_memory_allocation_function()
 | 
|---|
 | 4763 |     {
 | 
|---|
 | 4764 |         return global_allocate;
 | 
|---|
 | 4765 |     }
 | 
|---|
 | 4766 | 
 | 
|---|
 | 4767 |     deallocation_function PUGIXML_FUNCTION get_memory_deallocation_function()
 | 
|---|
 | 4768 |     {
 | 
|---|
 | 4769 |         return global_deallocate;
 | 
|---|
 | 4770 |     }
 | 
|---|
 | 4771 | }
 | 
|---|
 | 4772 | 
 | 
|---|
 | 4773 | #if !defined(PUGIXML_NO_STL) && (defined(_MSC_VER) || defined(__ICC))
 | 
|---|
 | 4774 | namespace std
 | 
|---|
 | 4775 | {
 | 
|---|
 | 4776 |         // Workarounds for (non-standard) iterator category detection for older versions (MSVC7/IC8 and earlier)
 | 
|---|
 | 4777 |         std::bidirectional_iterator_tag _Iter_cat(const xml_node_iterator&)
 | 
|---|
 | 4778 |         {
 | 
|---|
 | 4779 |                 return std::bidirectional_iterator_tag();
 | 
|---|
 | 4780 |         }
 | 
|---|
 | 4781 | 
 | 
|---|
 | 4782 |         std::bidirectional_iterator_tag _Iter_cat(const xml_attribute_iterator&)
 | 
|---|
 | 4783 |         {
 | 
|---|
 | 4784 |                 return std::bidirectional_iterator_tag();
 | 
|---|
 | 4785 |         }
 | 
|---|
 | 4786 | }
 | 
|---|
 | 4787 | #endif
 | 
|---|
 | 4788 | 
 | 
|---|
 | 4789 | #if !defined(PUGIXML_NO_STL) && defined(__SUNPRO_CC)
 | 
|---|
 | 4790 | namespace std
 | 
|---|
 | 4791 | {
 | 
|---|
 | 4792 |         // Workarounds for (non-standard) iterator category detection
 | 
|---|
 | 4793 |         std::bidirectional_iterator_tag __iterator_category(const xml_node_iterator&)
 | 
|---|
 | 4794 |         {
 | 
|---|
 | 4795 |                 return std::bidirectional_iterator_tag();
 | 
|---|
 | 4796 |         }
 | 
|---|
 | 4797 | 
 | 
|---|
 | 4798 |         std::bidirectional_iterator_tag __iterator_category(const xml_attribute_iterator&)
 | 
|---|
 | 4799 |         {
 | 
|---|
 | 4800 |                 return std::bidirectional_iterator_tag();
 | 
|---|
 | 4801 |         }
 | 
|---|
 | 4802 | }
 | 
|---|
 | 4803 | #endif
 | 
|---|
 | 4804 | 
 | 
|---|
 | 4805 | #ifndef PUGIXML_NO_XPATH
 | 
|---|
 | 4806 | 
 | 
|---|
 | 4807 | // STL replacements
 | 
|---|
 namespace
 {
     // Comparison functors; each one forwards to the corresponding operator of T.
     struct equal_to
     {
         template <typename T> bool operator()(const T& lhs, const T& rhs) const
         {
             return lhs == rhs;
         }
     };

     struct not_equal_to
     {
         template <typename T> bool operator()(const T& lhs, const T& rhs) const
         {
             return lhs != rhs;
         }
     };

     struct less
     {
         template <typename T> bool operator()(const T& lhs, const T& rhs) const
         {
             return lhs < rhs;
         }
     };

     struct less_equal
     {
         template <typename T> bool operator()(const T& lhs, const T& rhs) const
         {
             return lhs <= rhs;
         }
     };

     // Exchanges two values through a temporary copy.
     template <typename T> void swap(T& lhs, T& rhs)
     {
         T temp = lhs;
         lhs = rhs;
         rhs = temp;
     }

     // Returns an iterator to the first element of [begin, end) for which no other element compares
     // smaller under pred. An empty range yields end.
     template <typename I, typename Pred> I min_element(I begin, I end, const Pred& pred)
     {
         // nothing to scan; without this check the loop below would start past the end of the range
         if (begin == end) return end;

         I result = begin;

         for (I it = begin + 1; it != end; ++it)
             if (pred(*it, *result))
                 result = it;

         return result;
     }

     // Reverses [begin, end) in place.
     template <typename I> void reverse(I begin, I end)
     {
         // the distance test avoids forming begin + 1, which is out of bounds for an empty range
         while (end - begin > 1) swap(*begin++, *--end);
     }

     // Collapses runs of equal adjacent elements in [begin, end); returns the new past-the-end iterator.
     template <typename I> I unique(I begin, I end)
     {
         // fast skip head: nothing has to move until the first adjacent duplicate
         // (the distance test avoids forming begin + 1 for an empty range)
         while (end - begin > 1 && *begin != *(begin + 1)) begin++;

         if (begin == end) return begin;

         // last written element
         I write = begin++;

         // merge unique elements
         while (begin != end)
         {
             if (*begin != *write)
                 *++write = *begin++;
             else
                 begin++;
         }

         // past-the-end (write points to live element)
         return write + 1;
     }

     // Copies [begin, end) so that the copy ends at target, walking from the back; this makes it
     // usable for shifting a range towards higher addresses.
     template <typename I> void copy_backwards(I begin, I end, I target)
     {
         while (begin != end) *--target = *--end;
     }

     // Insertion sort of the non-empty range [begin, end) ordered by pred.
     // The trailing T* argument is never read; it only lets the element type T be deduced.
     template <typename I, typename Pred, typename T> void insertion_sort(I begin, I end, const Pred& pred, T*)
     {
         assert(begin != end);

         for (I it = begin + 1; it != end; ++it)
         {
             T val = *it;

             if (pred(val, *begin))
             {
                 // new minimum: shift the whole sorted prefix up by one and put val at the front
                 copy_backwards(begin, it, it + 1);
                 *begin = val;
             }
             else
             {
                 I hole = it;

                 // move hole backwards; *begin is not greater than val, so the scan stops inside the range
                 while (pred(val, *(hole - 1)))
                 {
                     *hole = *(hole - 1);
                     hole--;
                 }

                 // fill hole with element
                 *hole = val;
             }
         }
     }

     // Three-way partition of [begin, end) around the pivot value at middle (std variant for elements
     // with ==). On return [begin, *out_eqbeg) holds elements ordered before the pivot,
     // [*out_eqbeg, *out_eqend) holds elements equal to it and [*out_eqend, end) holds the rest.
     template <typename I, typename Pred> void partition(I begin, I middle, I end, const Pred& pred, I* out_eqbeg, I* out_eqend)
     {
         I eqbeg = middle, eqend = middle + 1;

         // expand equal range
         while (eqbeg != begin && *(eqbeg - 1) == *eqbeg) --eqbeg;
         while (eqend != end && *eqend == *eqbeg) ++eqend;

         // process outer elements
         I ltend = eqbeg, gtbeg = eqend;

         for (;;)
         {
             // find the element from the right side that belongs to the left one
             for (; gtbeg != end; ++gtbeg)
                 if (!pred(*eqbeg, *gtbeg))
                 {
                     if (*gtbeg == *eqbeg) swap(*gtbeg, *eqend++);
                     else break;
                 }

             // find the element from the left side that belongs to the right one
             for (; ltend != begin; --ltend)
                 if (!pred(*(ltend - 1), *eqbeg))
                 {
                     if (*eqbeg == *(ltend - 1)) swap(*(ltend - 1), *--eqbeg);
                     else break;
                 }

             // scanned all elements
             if (gtbeg == end && ltend == begin)
             {
                 *out_eqbeg = eqbeg;
                 *out_eqend = eqend;
                 return;
             }

             // make room for elements by moving equal area
             if (gtbeg == end)
             {
                 if (--ltend != --eqbeg) swap(*ltend, *eqbeg);
                 swap(*eqbeg, *--eqend);
             }
             else if (ltend == begin)
             {
                 if (eqend != gtbeg) swap(*eqbeg, *eqend);
                 ++eqend;
                 swap(*gtbeg++, *eqbeg++);
             }
             else swap(*gtbeg++, *--ltend);
         }
     }

     // Orders the three referenced elements so that *first, *middle, *last are sorted by pred.
     template <typename I, typename Pred> void median3(I first, I middle, I last, const Pred& pred)
     {
         if (pred(*middle, *first)) swap(*middle, *first);
         if (pred(*last, *middle)) swap(*last, *middle);
         if (pred(*middle, *first)) swap(*middle, *first);
     }

     // Moves a pivot candidate into *middle; last refers to the final element (inclusive).
     template <typename I, typename Pred> void median(I first, I middle, I last, const Pred& pred)
     {
         if (last - first <= 40)
         {
             // median of three for small chunks
             median3(first, middle, last, pred);
         }
         else
         {
             // median of nine
             size_t step = (last - first + 1) / 8;

             median3(first, first + step, first + 2 * step, pred);
             median3(middle - step, middle, middle + step, pred);
             median3(last - 2 * step, last - step, last, pred);
             median3(first + step, middle, last - step, pred);
         }
     }

     // Sorts [begin, end) by pred: three-way quicksort for chunks above 32 elements, insertion sort below.
     template <typename I, typename Pred> void sort(I begin, I end, const Pred& pred)
     {
         // sort large chunks
         while (end - begin > 32)
         {
             // find median element
             I middle = begin + (end - begin) / 2;
             median(begin, middle, end - 1, pred);

             // partition in three chunks (< = >)
             I eqbeg, eqend;
             partition(begin, middle, end, pred, &eqbeg, &eqend);

             // recurse into the smaller side and keep looping on the larger one
             if (eqbeg - begin > end - eqend)
             {
                 sort(eqend, end, pred);
                 end = eqbeg;
             }
             else
             {
                 sort(begin, eqbeg, pred);
                 begin = eqend;
             }
         }

         // insertion sort small chunk
         if (begin != end) insertion_sort(begin, end, pred, &*begin);
     }
 }
 | 
|---|
 | 5034 | 
 | 
|---|
 | 5035 | // Allocator used for AST and evaluation stacks
 | 
|---|
 | 5036 | namespace
 | 
|---|
 | 5037 | {
 | 
|---|
 | 5038 |         struct xpath_memory_block
 | 
|---|
 | 5039 |         {       
 | 
|---|
 | 5040 |                 xpath_memory_block* next;
 | 
|---|
 | 5041 | 
 | 
|---|
 | 5042 |                 char data[4096];
 | 
|---|
 | 5043 |         };
 | 
|---|
 | 5044 |                 
 | 
|---|
 | 5045 |         class xpath_allocator
 | 
|---|
 | 5046 |         {
 | 
|---|
 | 5047 |                 xpath_memory_block* _root;
 | 
|---|
 | 5048 |                 size_t _root_size;
 | 
|---|
 | 5049 | 
 | 
|---|
 | 5050 |         public:
 | 
|---|
 | 5051 |         #ifdef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 5052 |                 jmp_buf* error_handler;
 | 
|---|
 | 5053 |         #endif
 | 
|---|
 | 5054 | 
 | 
|---|
 | 5055 |                 xpath_allocator(xpath_memory_block* root, size_t root_size = 0): _root(root), _root_size(root_size)
 | 
|---|
 | 5056 |                 {
 | 
|---|
 | 5057 |                 #ifdef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 5058 |                         error_handler = 0;
 | 
|---|
 | 5059 |                 #endif
 | 
|---|
 | 5060 |                 }
 | 
|---|
 | 5061 |                 
 | 
|---|
 | 5062 |                 void* allocate_nothrow(size_t size)
 | 
|---|
 | 5063 |                 {
 | 
|---|
 | 5064 |                         const size_t block_capacity = sizeof(_root->data);
 | 
|---|
 | 5065 | 
 | 
|---|
 | 5066 |                         // align size so that we're able to store pointers in subsequent blocks
 | 
|---|
 | 5067 |                         size = (size + sizeof(void*) - 1) & ~(sizeof(void*) - 1);
 | 
|---|
 | 5068 | 
 | 
|---|
 | 5069 |                         if (_root_size + size <= block_capacity)
 | 
|---|
 | 5070 |                         {
 | 
|---|
 | 5071 |                                 void* buf = _root->data + _root_size;
 | 
|---|
 | 5072 |                                 _root_size += size;
 | 
|---|
 | 5073 |                                 return buf;
 | 
|---|
 | 5074 |                         }
 | 
|---|
 | 5075 |                         else
 | 
|---|
 | 5076 |                         {
 | 
|---|
 | 5077 |                                 size_t block_data_size = (size > block_capacity) ? size : block_capacity;
 | 
|---|
 | 5078 |                                 size_t block_size = block_data_size + offsetof(xpath_memory_block, data);
 | 
|---|
 | 5079 | 
 | 
|---|
 | 5080 |                                 xpath_memory_block* block = static_cast<xpath_memory_block*>(global_allocate(block_size));
 | 
|---|
 | 5081 |                                 if (!block) return 0;
 | 
|---|
 | 5082 |                                 
 | 
|---|
 | 5083 |                                 block->next = _root;
 | 
|---|
 | 5084 |                                 
 | 
|---|
 | 5085 |                                 _root = block;
 | 
|---|
 | 5086 |                                 _root_size = size;
 | 
|---|
 | 5087 |                                 
 | 
|---|
 | 5088 |                                 return block->data;
 | 
|---|
 | 5089 |                         }
 | 
|---|
 | 5090 |                 }
 | 
|---|
 | 5091 | 
 | 
|---|
 | 5092 |                 void* allocate(size_t size)
 | 
|---|
 | 5093 |                 {
 | 
|---|
 | 5094 |                         void* result = allocate_nothrow(size);
 | 
|---|
 | 5095 | 
 | 
|---|
 | 5096 |                         if (!result)
 | 
|---|
 | 5097 |                         {
 | 
|---|
 | 5098 |                         #ifdef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 5099 |                                 assert(error_handler);
 | 
|---|
 | 5100 |                                 longjmp(*error_handler, 1);
 | 
|---|
 | 5101 |                         #else
 | 
|---|
 | 5102 |                                 throw std::bad_alloc();
 | 
|---|
 | 5103 |                         #endif
 | 
|---|
 | 5104 |                         }
 | 
|---|
 | 5105 | 
 | 
|---|
 | 5106 |                         return result;
 | 
|---|
 | 5107 |                 }
 | 
|---|
 | 5108 | 
 | 
|---|
 | 5109 |                 void* reallocate(void* ptr, size_t old_size, size_t new_size)
 | 
|---|
 | 5110 |                 {
 | 
|---|
 | 5111 |                         // align size so that we're able to store pointers in subsequent blocks
 | 
|---|
 | 5112 |                         old_size = (old_size + sizeof(void*) - 1) & ~(sizeof(void*) - 1);
 | 
|---|
 | 5113 |                         new_size = (new_size + sizeof(void*) - 1) & ~(sizeof(void*) - 1);
 | 
|---|
 | 5114 | 
 | 
|---|
 | 5115 |                         // we can only reallocate the last object
 | 
|---|
 | 5116 |                         assert(ptr == 0 || static_cast<char*>(ptr) + old_size == _root->data + _root_size);
 | 
|---|
 | 5117 | 
 | 
|---|
 | 5118 |                         // adjust root size so that we have not allocated the object at all
 | 
|---|
 | 5119 |                         bool only_object = (_root_size == old_size);
 | 
|---|
 | 5120 | 
 | 
|---|
 | 5121 |                         if (ptr) _root_size -= old_size;
 | 
|---|
 | 5122 | 
 | 
|---|
 | 5123 |                         // allocate a new version (this will obviously reuse the memory if possible)
 | 
|---|
 | 5124 |                         void* result = allocate(new_size);
 | 
|---|
 | 5125 |                         assert(result);
 | 
|---|
 | 5126 | 
 | 
|---|
 | 5127 |                         // we have a new block
 | 
|---|
 | 5128 |                         if (result != ptr && ptr)
 | 
|---|
 | 5129 |                         {
 | 
|---|
 | 5130 |                                 // copy old data
 | 
|---|
 | 5131 |                                 assert(new_size > old_size);
 | 
|---|
 | 5132 |                                 memcpy(result, ptr, old_size);
 | 
|---|
 | 5133 | 
 | 
|---|
 | 5134 |                                 // free the previous page if it had no other objects
 | 
|---|
 | 5135 |                                 if (only_object)
 | 
|---|
 | 5136 |                                 {
 | 
|---|
 | 5137 |                                         assert(_root->data == result);
 | 
|---|
 | 5138 |                                         assert(_root->next);
 | 
|---|
 | 5139 | 
 | 
|---|
 | 5140 |                                         xpath_memory_block* next = _root->next->next;
 | 
|---|
 | 5141 | 
 | 
|---|
 | 5142 |                                         if (next)
 | 
|---|
 | 5143 |                                         {
 | 
|---|
 | 5144 |                                                 // deallocate the whole page, unless it was the first one
 | 
|---|
 | 5145 |                                                 global_deallocate(_root->next);
 | 
|---|
 | 5146 |                                                 _root->next = next;
 | 
|---|
 | 5147 |                                         }
 | 
|---|
 | 5148 |                                 }
 | 
|---|
 | 5149 |                         }
 | 
|---|
 | 5150 | 
 | 
|---|
 | 5151 |                         return result;
 | 
|---|
 | 5152 |                 }
 | 
|---|
 | 5153 | 
 | 
|---|
 | 5154 |                 void revert(const xpath_allocator& state)
 | 
|---|
 | 5155 |                 {
 | 
|---|
 | 5156 |                         // free all new pages
 | 
|---|
 | 5157 |                         xpath_memory_block* cur = _root;
 | 
|---|
 | 5158 | 
 | 
|---|
 | 5159 |                         while (cur != state._root)
 | 
|---|
 | 5160 |                         {
 | 
|---|
 | 5161 |                                 xpath_memory_block* next = cur->next;
 | 
|---|
 | 5162 | 
 | 
|---|
 | 5163 |                                 global_deallocate(cur);
 | 
|---|
 | 5164 | 
 | 
|---|
 | 5165 |                                 cur = next;
 | 
|---|
 | 5166 |                         }
 | 
|---|
 | 5167 | 
 | 
|---|
 | 5168 |                         // restore state
 | 
|---|
 | 5169 |                         _root = state._root;
 | 
|---|
 | 5170 |                         _root_size = state._root_size;
 | 
|---|
 | 5171 |                 }
 | 
|---|
 | 5172 | 
 | 
|---|
 | 5173 |                 void release()
 | 
|---|
 | 5174 |                 {
 | 
|---|
 | 5175 |                         xpath_memory_block* cur = _root;
 | 
|---|
 | 5176 |                         assert(cur);
 | 
|---|
 | 5177 | 
 | 
|---|
 | 5178 |                         while (cur->next)
 | 
|---|
 | 5179 |                         {
 | 
|---|
 | 5180 |                                 xpath_memory_block* next = cur->next;
 | 
|---|
 | 5181 | 
 | 
|---|
 | 5182 |                                 global_deallocate(cur);
 | 
|---|
 | 5183 | 
 | 
|---|
 | 5184 |                                 cur = next;
 | 
|---|
 | 5185 |                         }
 | 
|---|
 | 5186 |                 }
 | 
|---|
 | 5187 |         };
 | 
|---|
 | 5188 | 
 | 
|---|
 | 5189 |         struct xpath_allocator_capture
 | 
|---|
 | 5190 |         {
 | 
|---|
 | 5191 |                 xpath_allocator_capture(xpath_allocator* alloc): _target(alloc), _state(*alloc)
 | 
|---|
 | 5192 |                 {
 | 
|---|
 | 5193 |                 }
 | 
|---|
 | 5194 | 
 | 
|---|
 | 5195 |                 ~xpath_allocator_capture()
 | 
|---|
 | 5196 |                 {
 | 
|---|
 | 5197 |                         _target->revert(_state);
 | 
|---|
 | 5198 |                 }
 | 
|---|
 | 5199 | 
 | 
|---|
 | 5200 |                 xpath_allocator* _target;
 | 
|---|
 | 5201 |                 xpath_allocator _state;
 | 
|---|
 | 5202 |         };
 | 
|---|
 | 5203 | 
 | 
|---|
 | 5204 |         struct xpath_stack
 | 
|---|
 | 5205 |         {
 | 
|---|
 | 5206 |                 xpath_allocator* result;
 | 
|---|
 | 5207 |                 xpath_allocator* temp;
 | 
|---|
 | 5208 |         };
 | 
|---|
 | 5209 | 
 | 
|---|
 | 5210 |         struct xpath_stack_data
 | 
|---|
 | 5211 |         {
 | 
|---|
 | 5212 |                 xpath_memory_block blocks[2];
 | 
|---|
 | 5213 |                 xpath_allocator result;
 | 
|---|
 | 5214 |                 xpath_allocator temp;
 | 
|---|
 | 5215 |                 xpath_stack stack;
 | 
|---|
 | 5216 | 
 | 
|---|
 | 5217 |         #ifdef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 5218 |                 jmp_buf error_handler;
 | 
|---|
 | 5219 |         #endif
 | 
|---|
 | 5220 | 
 | 
|---|
 | 5221 |                 xpath_stack_data(): result(blocks + 0), temp(blocks + 1)
 | 
|---|
 | 5222 |                 {
 | 
|---|
 | 5223 |                         blocks[0].next = blocks[1].next = 0;
 | 
|---|
 | 5224 | 
 | 
|---|
 | 5225 |                         stack.result = &result;
 | 
|---|
 | 5226 |                         stack.temp = &temp;
 | 
|---|
 | 5227 | 
 | 
|---|
 | 5228 |                 #ifdef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 5229 |                         result.error_handler = temp.error_handler = &error_handler;
 | 
|---|
 | 5230 |                 #endif
 | 
|---|
 | 5231 |                 }
 | 
|---|
 | 5232 | 
 | 
|---|
 | 5233 |                 ~xpath_stack_data()
 | 
|---|
 | 5234 |                 {
 | 
|---|
 | 5235 |                         result.release();
 | 
|---|
 | 5236 |                         temp.release();
 | 
|---|
 | 5237 |                 }
 | 
|---|
 | 5238 |         };
 | 
|---|
 | 5239 | }
 | 
|---|
 | 5240 | 
 | 
|---|
 | 5241 | // String class
 | 
|---|
 | 5242 | namespace
 | 
|---|
 | 5243 | {
 | 
|---|
 | 5244 |         class xpath_string
 | 
|---|
 | 5245 |         {
 | 
|---|
 | 5246 |                 const char_t* _buffer;
 | 
|---|
 | 5247 |                 bool _uses_heap;
 | 
|---|
 | 5248 | 
 | 
|---|
 | 5249 |                 static char_t* duplicate_string(const char_t* string, size_t length, xpath_allocator* alloc)
 | 
|---|
 | 5250 |                 {
 | 
|---|
 | 5251 |                         char_t* result = static_cast<char_t*>(alloc->allocate((length + 1) * sizeof(char_t)));
 | 
|---|
 | 5252 |                         assert(result);
 | 
|---|
 | 5253 | 
 | 
|---|
 | 5254 |                         memcpy(result, string, length * sizeof(char_t));
 | 
|---|
 | 5255 |                         result[length] = 0;
 | 
|---|
 | 5256 | 
 | 
|---|
 | 5257 |                         return result;
 | 
|---|
 | 5258 |                 }
 | 
|---|
 | 5259 | 
 | 
|---|
 | 5260 |                 static char_t* duplicate_string(const char_t* string, xpath_allocator* alloc)
 | 
|---|
 | 5261 |                 {
 | 
|---|
 | 5262 |                         return duplicate_string(string, strlength(string), alloc);
 | 
|---|
 | 5263 |                 }
 | 
|---|
 | 5264 | 
 | 
|---|
 | 5265 |         public:
 | 
|---|
 | 5266 |                 xpath_string(): _buffer(PUGIXML_TEXT("")), _uses_heap(false)
 | 
|---|
 | 5267 |                 {
 | 
|---|
 | 5268 |                 }
 | 
|---|
 | 5269 | 
 | 
|---|
 | 5270 |                 explicit xpath_string(const char_t* str, xpath_allocator* alloc)
 | 
|---|
 | 5271 |                 {
 | 
|---|
 | 5272 |                         bool empty = (*str == 0);
 | 
|---|
 | 5273 | 
 | 
|---|
 | 5274 |                         _buffer = empty ? PUGIXML_TEXT("") : duplicate_string(str, alloc);
 | 
|---|
 | 5275 |                         _uses_heap = !empty;
 | 
|---|
 | 5276 |                 }
 | 
|---|
 | 5277 | 
 | 
|---|
 | 5278 |                 explicit xpath_string(const char_t* str, bool use_heap): _buffer(str), _uses_heap(use_heap)
 | 
|---|
 | 5279 |                 {
 | 
|---|
 | 5280 |                 }
 | 
|---|
 | 5281 | 
 | 
|---|
 | 5282 |                 xpath_string(const char_t* begin, const char_t* end, xpath_allocator* alloc)
 | 
|---|
 | 5283 |                 {
 | 
|---|
 | 5284 |                         assert(begin <= end);
 | 
|---|
 | 5285 | 
 | 
|---|
 | 5286 |                         bool empty = (begin == end);
 | 
|---|
 | 5287 | 
 | 
|---|
 | 5288 |                         _buffer = empty ? PUGIXML_TEXT("") : duplicate_string(begin, static_cast<size_t>(end - begin), alloc);
 | 
|---|
 | 5289 |                         _uses_heap = !empty;
 | 
|---|
 | 5290 |                 }
 | 
|---|
 | 5291 | 
 | 
|---|
 | 5292 |                 void append(const xpath_string& o, xpath_allocator* alloc)
 | 
|---|
 | 5293 |                 {
 | 
|---|
 | 5294 |                         // skip empty sources
 | 
|---|
 | 5295 |                         if (!*o._buffer) return;
 | 
|---|
 | 5296 | 
 | 
|---|
 | 5297 |                         // fast append for constant empty target and constant source
 | 
|---|
 | 5298 |                         if (!*_buffer && !_uses_heap && !o._uses_heap)
 | 
|---|
 | 5299 |                         {
 | 
|---|
 | 5300 |                                 _buffer = o._buffer;
 | 
|---|
 | 5301 |                         }
 | 
|---|
 | 5302 |                         else
 | 
|---|
 | 5303 |                         {
 | 
|---|
 | 5304 |                                 // need to make heap copy
 | 
|---|
 | 5305 |                                 size_t target_length = strlength(_buffer);
 | 
|---|
 | 5306 |                                 size_t source_length = strlength(o._buffer);
 | 
|---|
 | 5307 |                                 size_t length = target_length + source_length;
 | 
|---|
 | 5308 | 
 | 
|---|
 | 5309 |                                 // allocate new buffer
 | 
|---|
 | 5310 |                                 char_t* result = static_cast<char_t*>(alloc->reallocate(_uses_heap ? const_cast<char_t*>(_buffer) : 0, (target_length + 1) * sizeof(char_t), (length + 1) * sizeof(char_t)));
 | 
|---|
 | 5311 |                                 assert(result);
 | 
|---|
 | 5312 | 
 | 
|---|
 | 5313 |                                 // append first string to the new buffer in case there was no reallocation
 | 
|---|
 | 5314 |                                 if (!_uses_heap) memcpy(result, _buffer, target_length * sizeof(char_t));
 | 
|---|
 | 5315 | 
 | 
|---|
 | 5316 |                                 // append second string to the new buffer
 | 
|---|
 | 5317 |                                 memcpy(result + target_length, o._buffer, source_length * sizeof(char_t));
 | 
|---|
 | 5318 |                                 result[length] = 0;
 | 
|---|
 | 5319 | 
 | 
|---|
 | 5320 |                                 // finalize
 | 
|---|
 | 5321 |                                 _buffer = result;
 | 
|---|
 | 5322 |                                 _uses_heap = true;
 | 
|---|
 | 5323 |                         }
 | 
|---|
 | 5324 |                 }
 | 
|---|
 | 5325 | 
 | 
|---|
 | 5326 |                 const char_t* c_str() const
 | 
|---|
 | 5327 |                 {
 | 
|---|
 | 5328 |                         return _buffer;
 | 
|---|
 | 5329 |                 }
 | 
|---|
 | 5330 | 
 | 
|---|
 | 5331 |                 size_t length() const
 | 
|---|
 | 5332 |                 {
 | 
|---|
 | 5333 |                         return strlength(_buffer);
 | 
|---|
 | 5334 |                 }
 | 
|---|
 | 5335 |                 
 | 
|---|
 | 5336 |                 char_t* data(xpath_allocator* alloc)
 | 
|---|
 | 5337 |                 {
 | 
|---|
 | 5338 |                         // make private heap copy
 | 
|---|
 | 5339 |                         if (!_uses_heap)
 | 
|---|
 | 5340 |                         {
 | 
|---|
 | 5341 |                                 _buffer = duplicate_string(_buffer, alloc);
 | 
|---|
 | 5342 |                                 _uses_heap = true;
 | 
|---|
 | 5343 |                         }
 | 
|---|
 | 5344 | 
 | 
|---|
 | 5345 |                         return const_cast<char_t*>(_buffer);
 | 
|---|
 | 5346 |                 }
 | 
|---|
 | 5347 | 
 | 
|---|
 | 5348 |                 bool empty() const
 | 
|---|
 | 5349 |                 {
 | 
|---|
 | 5350 |                         return *_buffer == 0;
 | 
|---|
 | 5351 |                 }
 | 
|---|
 | 5352 | 
 | 
|---|
 | 5353 |                 bool operator==(const xpath_string& o) const
 | 
|---|
 | 5354 |                 {
 | 
|---|
 | 5355 |                         return strequal(_buffer, o._buffer);
 | 
|---|
 | 5356 |                 }
 | 
|---|
 | 5357 | 
 | 
|---|
 | 5358 |                 bool operator!=(const xpath_string& o) const
 | 
|---|
 | 5359 |                 {
 | 
|---|
 | 5360 |                         return !strequal(_buffer, o._buffer);
 | 
|---|
 | 5361 |                 }
 | 
|---|
 | 5362 | 
 | 
|---|
 | 5363 |                 bool uses_heap() const
 | 
|---|
 | 5364 |                 {
 | 
|---|
 | 5365 |                         return _uses_heap;
 | 
|---|
 | 5366 |                 }
 | 
|---|
 | 5367 |         };
 | 
|---|
 | 5368 | 
 | 
|---|
 | 5369 |         xpath_string xpath_string_const(const char_t* str)
 | 
|---|
 | 5370 |         {
 | 
|---|
 | 5371 |                 return xpath_string(str, false);
 | 
|---|
 | 5372 |         }
 | 
|---|
 | 5373 | }
 | 
|---|
 | 5374 | 
 | 
|---|
 | 5375 | namespace
 | 
|---|
 | 5376 | {
 | 
|---|
 | 5377 |         bool starts_with(const char_t* string, const char_t* pattern)
 | 
|---|
 | 5378 |         {
 | 
|---|
 | 5379 |                 while (*pattern && *string == *pattern)
 | 
|---|
 | 5380 |                 {
 | 
|---|
 | 5381 |                         string++;
 | 
|---|
 | 5382 |                         pattern++;
 | 
|---|
 | 5383 |                 }
 | 
|---|
 | 5384 | 
 | 
|---|
 | 5385 |                 return *pattern == 0;
 | 
|---|
 | 5386 |         }
 | 
|---|
 | 5387 | 
 | 
|---|
 | 5388 |         const char_t* find_char(const char_t* s, char_t c)
 | 
|---|
 | 5389 |         {
 | 
|---|
 | 5390 |         #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 5391 |                 return wcschr(s, c);
 | 
|---|
 | 5392 |         #else
 | 
|---|
 | 5393 |                 return strchr(s, c);
 | 
|---|
 | 5394 |         #endif
 | 
|---|
 | 5395 |         }
 | 
|---|
 | 5396 | 
 | 
|---|
 | 5397 |         const char_t* find_substring(const char_t* s, const char_t* p)
 | 
|---|
 | 5398 |         {
 | 
|---|
 | 5399 |         #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 5400 |                 // MSVC6 wcsstr bug workaround (if s is empty it always returns 0)
 | 
|---|
 | 5401 |                 return (*p == 0) ? s : wcsstr(s, p);
 | 
|---|
 | 5402 |         #else
 | 
|---|
 | 5403 |                 return strstr(s, p);
 | 
|---|
 | 5404 |         #endif
 | 
|---|
 | 5405 |         }
 | 
|---|
 | 5406 | 
 | 
|---|
 | 5407 |         // Converts symbol to lower case, if it is an ASCII one
 | 
|---|
 | 5408 |         char_t tolower_ascii(char_t ch)
 | 
|---|
 | 5409 |         {
 | 
|---|
 | 5410 |                 return static_cast<unsigned int>(ch - 'A') < 26 ? static_cast<char_t>(ch | ' ') : ch;
 | 
|---|
 | 5411 |         }
 | 
|---|
 | 5412 | 
 | 
|---|
 | 5413 |         xpath_string string_value(const xpath_node& na, xpath_allocator* alloc)
 | 
|---|
 | 5414 |         {
 | 
|---|
 | 5415 |                 if (na.attribute())
 | 
|---|
 | 5416 |                         return xpath_string_const(na.attribute().value());
 | 
|---|
 | 5417 |                 else
 | 
|---|
 | 5418 |                 {
 | 
|---|
 | 5419 |                         const xml_node& n = na.node();
 | 
|---|
 | 5420 | 
 | 
|---|
 | 5421 |                         switch (n.type())
 | 
|---|
 | 5422 |                         {
 | 
|---|
 | 5423 |                         case node_pcdata:
 | 
|---|
 | 5424 |                         case node_cdata:
 | 
|---|
 | 5425 |                         case node_comment:
 | 
|---|
 | 5426 |                         case node_pi:
 | 
|---|
 | 5427 |                                 return xpath_string_const(n.value());
 | 
|---|
 | 5428 |                         
 | 
|---|
 | 5429 |                         case node_document:
 | 
|---|
 | 5430 |                         case node_element:
 | 
|---|
 | 5431 |                         {
 | 
|---|
 | 5432 |                                 xpath_string result;
 | 
|---|
 | 5433 | 
 | 
|---|
 | 5434 |                                 xml_node cur = n.first_child();
 | 
|---|
 | 5435 |                                 
 | 
|---|
 | 5436 |                                 while (cur && cur != n)
 | 
|---|
 | 5437 |                                 {
 | 
|---|
 | 5438 |                                         if (cur.type() == node_pcdata || cur.type() == node_cdata)
 | 
|---|
 | 5439 |                                                 result.append(xpath_string_const(cur.value()), alloc);
 | 
|---|
 | 5440 | 
 | 
|---|
 | 5441 |                                         if (cur.first_child())
 | 
|---|
 | 5442 |                                                 cur = cur.first_child();
 | 
|---|
 | 5443 |                                         else if (cur.next_sibling())
 | 
|---|
 | 5444 |                                                 cur = cur.next_sibling();
 | 
|---|
 | 5445 |                                         else
 | 
|---|
 | 5446 |                                         {
 | 
|---|
 | 5447 |                                                 while (!cur.next_sibling() && cur != n)
 | 
|---|
 | 5448 |                                                         cur = cur.parent();
 | 
|---|
 | 5449 | 
 | 
|---|
 | 5450 |                                                 if (cur != n) cur = cur.next_sibling();
 | 
|---|
 | 5451 |                                         }
 | 
|---|
 | 5452 |                                 }
 | 
|---|
 | 5453 |                                 
 | 
|---|
 | 5454 |                                 return result;
 | 
|---|
 | 5455 |                         }
 | 
|---|
 | 5456 |                         
 | 
|---|
 | 5457 |                         default:
 | 
|---|
 | 5458 |                                 return xpath_string();
 | 
|---|
 | 5459 |                         }
 | 
|---|
 | 5460 |                 }
 | 
|---|
 | 5461 |         }
 | 
|---|
 | 5462 |         
 | 
|---|
 | 5463 |         unsigned int node_height(xml_node n)
 | 
|---|
 | 5464 |         {
 | 
|---|
 | 5465 |             unsigned int result = 0;
 | 
|---|
 | 5466 |             
 | 
|---|
 | 5467 |             while (n)
 | 
|---|
 | 5468 |             {
 | 
|---|
 | 5469 |                 ++result;
 | 
|---|
 | 5470 |                 n = n.parent();
 | 
|---|
 | 5471 |             }
 | 
|---|
 | 5472 |             
 | 
|---|
 | 5473 |             return result;
 | 
|---|
 | 5474 |         }
 | 
|---|
 | 5475 |         
 | 
|---|
 | 5476 |         bool node_is_before(xml_node ln, unsigned int lh, xml_node rn, unsigned int rh)
 | 
|---|
 | 5477 |         {
 | 
|---|
 | 5478 |                 // normalize heights
 | 
|---|
 | 5479 |                 for (unsigned int i = rh; i < lh; i++) ln = ln.parent();
 | 
|---|
 | 5480 |                 for (unsigned int j = lh; j < rh; j++) rn = rn.parent();
 | 
|---|
 | 5481 |             
 | 
|---|
 | 5482 |                 // one node is the ancestor of the other
 | 
|---|
 | 5483 |             if (ln == rn) return lh < rh;
 | 
|---|
 | 5484 |             
 | 
|---|
 | 5485 |                 // find common ancestor
 | 
|---|
 | 5486 |             while (ln.parent() != rn.parent())
 | 
|---|
 | 5487 |             {
 | 
|---|
 | 5488 |                 ln = ln.parent();
 | 
|---|
 | 5489 |                 rn = rn.parent();
 | 
|---|
 | 5490 |             }
 | 
|---|
 | 5491 | 
 | 
|---|
 | 5492 |                 // there is no common ancestor (the shared parent is null), nodes are from different documents
 | 
|---|
 | 5493 |                 if (!ln.parent()) return ln < rn;
 | 
|---|
 | 5494 | 
 | 
|---|
 | 5495 |                 // determine sibling order
 | 
|---|
 | 5496 |         for (; ln; ln = ln.next_sibling())
 | 
|---|
 | 5497 |             if (ln == rn)
 | 
|---|
 | 5498 |                 return true;
 | 
|---|
 | 5499 |                 
 | 
|---|
 | 5500 |         return false;
 | 
|---|
 | 5501 |     }
 | 
|---|
 | 5502 | 
 | 
|---|
 | 5503 |     bool node_is_ancestor(xml_node parent, xml_node node)
 | 
|---|
 | 5504 |     {
 | 
|---|
 | 5505 |         while (node && node != parent) node = node.parent();
 | 
|---|
 | 5506 | 
 | 
|---|
 | 5507 |         return parent && node == parent;
 | 
|---|
 | 5508 |     }
 | 
|---|
 | 5509 | 
 | 
|---|
 | 5510 |     const void* document_order(const xpath_node& xnode)
 | 
|---|
 | 5511 |     {
 | 
|---|
 | 5512 |         xml_node_struct* node = xnode.node().internal_object();
 | 
|---|
 | 5513 | 
 | 
|---|
 | 5514 |         if (node)
 | 
|---|
 | 5515 |         {
 | 
|---|
 | 5516 |             if (node->name && (node->header & xml_memory_page_name_allocated_mask) == 0) return node->name;
 | 
|---|
 | 5517 |             if (node->value && (node->header & xml_memory_page_value_allocated_mask) == 0) return node->value;
 | 
|---|
 | 5518 |             return 0;
 | 
|---|
 | 5519 |         }
 | 
|---|
 | 5520 | 
 | 
|---|
 | 5521 |         xml_attribute_struct* attr = xnode.attribute().internal_object();
 | 
|---|
 | 5522 | 
 | 
|---|
 | 5523 |         if (attr)
 | 
|---|
 | 5524 |         {
 | 
|---|
 | 5525 |             if ((attr->header & xml_memory_page_name_allocated_mask) == 0) return attr->name;
 | 
|---|
 | 5526 |             if ((attr->header & xml_memory_page_value_allocated_mask) == 0) return attr->value;
 | 
|---|
 | 5527 |             return 0;
 | 
|---|
 | 5528 |         }
 | 
|---|
 | 5529 | 
 | 
|---|
 | 5530 |                 return 0;
 | 
|---|
 | 5531 |     }
 | 
|---|
 | 5532 |     
 | 
|---|
 | 5533 |         struct document_order_comparator
 | 
|---|
 | 5534 |         {
 | 
|---|
 | 5535 |                 bool operator()(const xpath_node& lhs, const xpath_node& rhs) const
 | 
|---|
 | 5536 |                 {
 | 
|---|
 | 5537 |                         // optimized document order based check
 | 
|---|
 | 5538 |                         const void* lo = document_order(lhs);
 | 
|---|
 | 5539 |                         const void* ro = document_order(rhs);
 | 
|---|
 | 5540 | 
 | 
|---|
 | 5541 |                         if (lo && ro) return lo < ro;
 | 
|---|
 | 5542 | 
 | 
|---|
 | 5543 |             // slow comparison
 | 
|---|
 | 5544 |                         xml_node ln = lhs.node(), rn = rhs.node();
 | 
|---|
 | 5545 | 
 | 
|---|
 | 5546 |                         // compare attributes
 | 
|---|
 | 5547 |                         if (lhs.attribute() && rhs.attribute())
 | 
|---|
 | 5548 |                         {
 | 
|---|
 | 5549 |                                 // shared parent
 | 
|---|
 | 5550 |                                 if (lhs.parent() == rhs.parent())
 | 
|---|
 | 5551 |                                 {
 | 
|---|
 | 5552 |                                         // determine sibling order
 | 
|---|
 | 5553 |                                     for (xml_attribute a = lhs.attribute(); a; a = a.next_attribute())
 | 
|---|
 | 5554 |                                         if (a == rhs.attribute())
 | 
|---|
 | 5555 |                                             return true;
 | 
|---|
 | 5556 |                                     
 | 
|---|
 | 5557 |                                     return false;
 | 
|---|
 | 5558 |                                 }
 | 
|---|
 | 5559 |                                 
 | 
|---|
 | 5560 |                                 // compare attribute parents
 | 
|---|
 | 5561 |                                 ln = lhs.parent();
 | 
|---|
 | 5562 |                                 rn = rhs.parent();
 | 
|---|
 | 5563 |                         }
 | 
|---|
 | 5564 |                         else if (lhs.attribute())
 | 
|---|
 | 5565 |                         {
 | 
|---|
 | 5566 |                                 // attributes go after the parent element
 | 
|---|
 | 5567 |                                 if (lhs.parent() == rhs.node()) return false;
 | 
|---|
 | 5568 |                                 
 | 
|---|
 | 5569 |                                 ln = lhs.parent();
 | 
|---|
 | 5570 |                         }
 | 
|---|
 | 5571 |                         else if (rhs.attribute())
 | 
|---|
 | 5572 |                         {
 | 
|---|
 | 5573 |                                 // attributes go after the parent element
 | 
|---|
 | 5574 |                                 if (rhs.parent() == lhs.node()) return true;
 | 
|---|
 | 5575 |                                 
 | 
|---|
 | 5576 |                                 rn = rhs.parent();
 | 
|---|
 | 5577 |                         }
 | 
|---|
 | 5578 | 
 | 
|---|
 | 5579 |                         if (ln == rn) return false;
 | 
|---|
 | 5580 |                         
 | 
|---|
 | 5581 |                         unsigned int lh = node_height(ln);
 | 
|---|
 | 5582 |                         unsigned int rh = node_height(rn);
 | 
|---|
 | 5583 |                         
 | 
|---|
 | 5584 |                         return node_is_before(ln, lh, rn, rh);
 | 
|---|
 | 5585 |                 }
 | 
|---|
 | 5586 |         };
 | 
|---|
 | 5587 | 
 | 
|---|
 | 5588 |         struct duplicate_comparator
 | 
|---|
 | 5589 |         {
 | 
|---|
 | 5590 |                 bool operator()(const xpath_node& lhs, const xpath_node& rhs) const
 | 
|---|
 | 5591 |                 {
 | 
|---|
 | 5592 |                         if (lhs.attribute()) return rhs.attribute() ? lhs.attribute() < rhs.attribute() : true;
 | 
|---|
 | 5593 |                         else return rhs.attribute() ? false : lhs.node() < rhs.node();
 | 
|---|
 | 5594 |                 }
 | 
|---|
 | 5595 |         };
 | 
|---|
 | 5596 |         
 | 
|---|
 | 5597 |         double gen_nan()
 | 
|---|
 | 5598 |         {
 | 
|---|
 | 5599 |         #if defined(__STDC_IEC_559__) || ((FLT_RADIX - 0 == 2) && (FLT_MAX_EXP - 0 == 128) && (FLT_MANT_DIG - 0 == 24))
 | 
|---|
 | 5600 |                 union { float f; int32_t i; } u[sizeof(float) == sizeof(int32_t) ? 1 : -1];
 | 
|---|
 | 5601 |                 u[0].i = 0x7fc00000;
 | 
|---|
 | 5602 |                 return u[0].f;
 | 
|---|
 | 5603 |         #else
 | 
|---|
 | 5604 |                 // fallback
 | 
|---|
 | 5605 |                 const volatile double zero = 0.0;
 | 
|---|
 | 5606 |                 return zero / zero;
 | 
|---|
 | 5607 |         #endif
 | 
|---|
 | 5608 |         }
 | 
|---|
 | 5609 |         
 | 
|---|
 | 5610 |         bool is_nan(double value)
 | 
|---|
 | 5611 |         {
 | 
|---|
 | 5612 |         #if defined(_MSC_VER) || defined(__BORLANDC__)
 | 
|---|
 | 5613 |                 return !!_isnan(value);
 | 
|---|
 | 5614 |         #elif defined(fpclassify) && defined(FP_NAN)
 | 
|---|
 | 5615 |                 return fpclassify(value) == FP_NAN;
 | 
|---|
 | 5616 |         #else
 | 
|---|
 | 5617 |                 // fallback
 | 
|---|
 | 5618 |                 const volatile double v = value;
 | 
|---|
 | 5619 |                 return v != v;
 | 
|---|
 | 5620 |         #endif
 | 
|---|
 | 5621 |         }
 | 
|---|
 | 5622 |         
 | 
|---|
 | 5623 |         const char_t* convert_number_to_string_special(double value)
 | 
|---|
 | 5624 |         {
 | 
|---|
 | 5625 |         #if defined(_MSC_VER) || defined(__BORLANDC__)
 | 
|---|
 | 5626 |                 if (_finite(value)) return (value == 0) ? PUGIXML_TEXT("0") : 0;
 | 
|---|
 | 5627 |                 if (_isnan(value)) return PUGIXML_TEXT("NaN");
 | 
|---|
 | 5628 |                 return PUGIXML_TEXT("-Infinity") + (value > 0);
 | 
|---|
 | 5629 |         #elif defined(fpclassify) && defined(FP_NAN) && defined(FP_INFINITE) && defined(FP_ZERO)
 | 
|---|
 | 5630 |                 switch (fpclassify(value))
 | 
|---|
 | 5631 |                 {
 | 
|---|
 | 5632 |                 case FP_NAN:
 | 
|---|
 | 5633 |                         return PUGIXML_TEXT("NaN");
 | 
|---|
 | 5634 | 
 | 
|---|
 | 5635 |                 case FP_INFINITE:
 | 
|---|
 | 5636 |                         return PUGIXML_TEXT("-Infinity") + (value > 0);
 | 
|---|
 | 5637 | 
 | 
|---|
 | 5638 |                 case FP_ZERO:
 | 
|---|
 | 5639 |                         return PUGIXML_TEXT("0");
 | 
|---|
 | 5640 | 
 | 
|---|
 | 5641 |                 default:
 | 
|---|
 | 5642 |                         return 0;
 | 
|---|
 | 5643 |                 }
 | 
|---|
 | 5644 |         #else
 | 
|---|
 | 5645 |                 // fallback
 | 
|---|
 | 5646 |                 const volatile double v = value;
 | 
|---|
 | 5647 | 
 | 
|---|
 | 5648 |                 if (v == 0) return PUGIXML_TEXT("0");
 | 
|---|
 | 5649 |                 if (v != v) return PUGIXML_TEXT("NaN");
 | 
|---|
 | 5650 |                 if (v * 2 == v) return PUGIXML_TEXT("-Infinity") + (value > 0);
 | 
|---|
 | 5651 |                 return 0;
 | 
|---|
 | 5652 |         #endif
 | 
|---|
 | 5653 |         }
 | 
|---|
 | 5654 |         
 | 
|---|
 | 5655 |         bool convert_number_to_boolean(double value)
 | 
|---|
 | 5656 |         {
 | 
|---|
 | 5657 |                 return (value != 0 && !is_nan(value));
 | 
|---|
 | 5658 |         }
 | 
|---|
 | 5659 |         
 | 
|---|
 | 5660 |         void truncate_zeros(char* begin, char* end)
 | 
|---|
 | 5661 |         {
 | 
|---|
 | 5662 |                 while (begin != end && end[-1] == '0') end--;
 | 
|---|
 | 5663 | 
 | 
|---|
 | 5664 |                 *end = 0;
 | 
|---|
 | 5665 |         }
 | 
|---|
 | 5666 | 
 | 
|---|
 | 5667 |         // gets mantissa digits in the form of 0.xxxxx with 0. implied and the exponent
 | 
|---|
 | 5668 | #if defined(_MSC_VER) && _MSC_VER >= 1400
 | 
|---|
 | 5669 |         void convert_number_to_mantissa_exponent(double value, char* buffer, size_t buffer_size, char** out_mantissa, int* out_exponent)
 | 
|---|
 | 5670 |         {
 | 
|---|
 | 5671 |                 // get base values
 | 
|---|
 | 5672 |                 int sign, exponent;
 | 
|---|
 | 5673 |                 _ecvt_s(buffer, buffer_size, value, DBL_DIG + 1, &exponent, &sign);
 | 
|---|
 | 5674 | 
 | 
|---|
 | 5675 |                 // truncate redundant zeros
 | 
|---|
 | 5676 |                 truncate_zeros(buffer, buffer + strlen(buffer));
 | 
|---|
 | 5677 | 
 | 
|---|
 | 5678 |                 // fill results
 | 
|---|
 | 5679 |                 *out_mantissa = buffer;
 | 
|---|
 | 5680 |                 *out_exponent = exponent;
 | 
|---|
 | 5681 |         }
 | 
|---|
 | 5682 | #else
 | 
|---|
 | 5683 |         void convert_number_to_mantissa_exponent(double value, char* buffer, size_t buffer_size, char** out_mantissa, int* out_exponent)
 | 
|---|
 | 5684 |         {
 | 
|---|
 | 5685 |                 // get a scientific notation value with IEEE DBL_DIG decimals
 | 
|---|
 | 5686 |                 sprintf(buffer, "%.*e", DBL_DIG, value);
 | 
|---|
 | 5687 |                 assert(strlen(buffer) < buffer_size);
 | 
|---|
 | 5688 |                 (void)!buffer_size;
 | 
|---|
 | 5689 | 
 | 
|---|
 | 5690 |                 // get the exponent (possibly negative)
 | 
|---|
 | 5691 |                 char* exponent_string = strchr(buffer, 'e');
 | 
|---|
 | 5692 |                 assert(exponent_string);
 | 
|---|
 | 5693 | 
 | 
|---|
 | 5694 |                 int exponent = atoi(exponent_string + 1);
 | 
|---|
 | 5695 | 
 | 
|---|
 | 5696 |                 // extract mantissa string: skip sign
 | 
|---|
 | 5697 |                 char* mantissa = buffer[0] == '-' ? buffer + 1 : buffer;
 | 
|---|
 | 5698 |                 assert(mantissa[0] != '0' && mantissa[1] == '.');
 | 
|---|
 | 5699 | 
 | 
|---|
 | 5700 |                 // divide mantissa by 10 to eliminate integer part
 | 
|---|
 | 5701 |                 mantissa[1] = mantissa[0];
 | 
|---|
 | 5702 |                 mantissa++;
 | 
|---|
 | 5703 |                 exponent++;
 | 
|---|
 | 5704 | 
 | 
|---|
 | 5705 |                 // remove extra mantissa digits and zero-terminate mantissa
 | 
|---|
 | 5706 |                 truncate_zeros(mantissa, exponent_string);
 | 
|---|
 | 5707 | 
 | 
|---|
 | 5708 |                 // fill results
 | 
|---|
 | 5709 |                 *out_mantissa = mantissa;
 | 
|---|
 | 5710 |                 *out_exponent = exponent;
 | 
|---|
 | 5711 |         }
 | 
|---|
 | 5712 | #endif
 | 
|---|
 | 5713 | 
 | 
|---|
 | 5714 |         xpath_string convert_number_to_string(double value, xpath_allocator* alloc)
 | 
|---|
 | 5715 |         {
 | 
|---|
 | 5716 |                 // try special number conversion
 | 
|---|
 | 5717 |                 const char_t* special = convert_number_to_string_special(value);
 | 
|---|
 | 5718 |                 if (special) return xpath_string_const(special);
 | 
|---|
 | 5719 | 
 | 
|---|
 | 5720 |                 // get mantissa + exponent form
 | 
|---|
 | 5721 |                 char mantissa_buffer[64];
 | 
|---|
 | 5722 | 
 | 
|---|
 | 5723 |                 char* mantissa;
 | 
|---|
 | 5724 |                 int exponent;
 | 
|---|
 | 5725 |                 convert_number_to_mantissa_exponent(value, mantissa_buffer, sizeof(mantissa_buffer), &mantissa, &exponent);
 | 
|---|
 | 5726 | 
 | 
|---|
 | 5727 |                 // make the number!
 | 
|---|
 | 5728 |                 char_t result[512];
 | 
|---|
 | 5729 |                 char_t* s = result;
 | 
|---|
 | 5730 | 
 | 
|---|
 | 5731 |                 // sign
 | 
|---|
 | 5732 |                 if (value < 0) *s++ = '-';
 | 
|---|
 | 5733 | 
 | 
|---|
 | 5734 |                 // integer part
 | 
|---|
 | 5735 |                 if (exponent <= 0)
 | 
|---|
 | 5736 |                 {
 | 
|---|
 | 5737 |                         *s++ = '0';
 | 
|---|
 | 5738 |                 }
 | 
|---|
 | 5739 |                 else
 | 
|---|
 | 5740 |                 {
 | 
|---|
 | 5741 |                         while (exponent > 0)
 | 
|---|
 | 5742 |                         {
 | 
|---|
 | 5743 |                                 assert(*mantissa == 0 || (unsigned)(*mantissa - '0') <= 9);
 | 
|---|
 | 5744 |                                 *s++ = *mantissa ? *mantissa++ : '0';
 | 
|---|
 | 5745 |                                 exponent--;
 | 
|---|
 | 5746 |                         }
 | 
|---|
 | 5747 |                 }
 | 
|---|
 | 5748 | 
 | 
|---|
 | 5749 |                 // fractional part
 | 
|---|
 | 5750 |                 if (*mantissa)
 | 
|---|
 | 5751 |                 {
 | 
|---|
 | 5752 |                         // decimal point
 | 
|---|
 | 5753 |                         *s++ = '.';
 | 
|---|
 | 5754 | 
 | 
|---|
 | 5755 |                         // extra zeroes from negative exponent
 | 
|---|
 | 5756 |                         while (exponent < 0)
 | 
|---|
 | 5757 |                         {
 | 
|---|
 | 5758 |                                 *s++ = '0';
 | 
|---|
 | 5759 |                                 exponent++;
 | 
|---|
 | 5760 |                         }
 | 
|---|
 | 5761 | 
 | 
|---|
 | 5762 |                         // extra mantissa digits
 | 
|---|
 | 5763 |                         while (*mantissa)
 | 
|---|
 | 5764 |                         {
 | 
|---|
 | 5765 |                                 assert((unsigned)(*mantissa - '0') <= 9);
 | 
|---|
 | 5766 |                                 *s++ = *mantissa++;
 | 
|---|
 | 5767 |                         }
 | 
|---|
 | 5768 |                 }
 | 
|---|
 | 5769 | 
 | 
|---|
 | 5770 |                 // zero-terminate
 | 
|---|
 | 5771 |                 assert(s < result + sizeof(result) / sizeof(result[0]));
 | 
|---|
 | 5772 |                 *s = 0;
 | 
|---|
 | 5773 | 
 | 
|---|
 | 5774 |                 return xpath_string(result, alloc);
 | 
|---|
 | 5775 |         }
 | 
|---|
 | 5776 |         
 | 
|---|
 | 5777 |         bool check_string_to_number_format(const char_t* string)
 | 
|---|
 | 5778 |         {
 | 
|---|
 | 5779 |                 // parse leading whitespace
 | 
|---|
 | 5780 |                 while (IS_CHARTYPE(*string, ct_space)) ++string;
 | 
|---|
 | 5781 | 
 | 
|---|
 | 5782 |                 // parse sign
 | 
|---|
 | 5783 |                 if (*string == '-') ++string;
 | 
|---|
 | 5784 | 
 | 
|---|
 | 5785 |                 if (!*string) return false;
 | 
|---|
 | 5786 | 
 | 
|---|
 | 5787 |                 // if there is no integer part, there should be a decimal part with at least one digit
 | 
|---|
 | 5788 |                 if (!IS_CHARTYPEX(string[0], ctx_digit) && (string[0] != '.' || !IS_CHARTYPEX(string[1], ctx_digit))) return false;
 | 
|---|
 | 5789 | 
 | 
|---|
 | 5790 |                 // parse integer part
 | 
|---|
 | 5791 |                 while (IS_CHARTYPEX(*string, ctx_digit)) ++string;
 | 
|---|
 | 5792 | 
 | 
|---|
 | 5793 |                 // parse decimal part
 | 
|---|
 | 5794 |                 if (*string == '.')
 | 
|---|
 | 5795 |                 {
 | 
|---|
 | 5796 |                         ++string;
 | 
|---|
 | 5797 | 
 | 
|---|
 | 5798 |                         while (IS_CHARTYPEX(*string, ctx_digit)) ++string;
 | 
|---|
 | 5799 |                 }
 | 
|---|
 | 5800 | 
 | 
|---|
 | 5801 |                 // parse trailing whitespace
 | 
|---|
 | 5802 |                 while (IS_CHARTYPE(*string, ct_space)) ++string;
 | 
|---|
 | 5803 | 
 | 
|---|
 | 5804 |                 return *string == 0;
 | 
|---|
 | 5805 |         }
 | 
|---|
 | 5806 | 
 | 
|---|
 | 5807 |         double convert_string_to_number(const char_t* string)
 | 
|---|
 | 5808 |         {
 | 
|---|
 | 5809 |                 // check string format
 | 
|---|
 | 5810 |                 if (!check_string_to_number_format(string)) return gen_nan();
 | 
|---|
 | 5811 | 
 | 
|---|
 | 5812 |                 // parse string
 | 
|---|
 | 5813 |         #ifdef PUGIXML_WCHAR_MODE
 | 
|---|
 | 5814 |                 return wcstod(string, 0);
 | 
|---|
 | 5815 |         #else
 | 
|---|
 | 5816 |                 return atof(string);
 | 
|---|
 | 5817 |         #endif
 | 
|---|
 | 5818 |         }
 | 
|---|
 | 5819 | 
 | 
|---|
 | 5820 |         bool convert_string_to_number(const char_t* begin, const char_t* end, double* out_result)
 | 
|---|
 | 5821 |         {
 | 
|---|
 | 5822 |                 char_t buffer[32];
 | 
|---|
 | 5823 | 
 | 
|---|
 | 5824 |                 size_t length = static_cast<size_t>(end - begin);
 | 
|---|
 | 5825 |                 char_t* scratch = buffer;
 | 
|---|
 | 5826 | 
 | 
|---|
 | 5827 |                 if (length >= sizeof(buffer) / sizeof(buffer[0]))
 | 
|---|
 | 5828 |                 {
 | 
|---|
 | 5829 |                         // need to make dummy on-heap copy
 | 
|---|
 | 5830 |                         scratch = static_cast<char_t*>(global_allocate((length + 1) * sizeof(char_t)));
 | 
|---|
 | 5831 |                         if (!scratch) return false;
 | 
|---|
 | 5832 |                 }
 | 
|---|
 | 5833 | 
 | 
|---|
 | 5834 |                 // copy string to zero-terminated buffer and perform conversion
 | 
|---|
 | 5835 |                 memcpy(scratch, begin, length * sizeof(char_t));
 | 
|---|
 | 5836 |                 scratch[length] = 0;
 | 
|---|
 | 5837 | 
 | 
|---|
 | 5838 |                 *out_result = convert_string_to_number(scratch);
 | 
|---|
 | 5839 | 
 | 
|---|
 | 5840 |                 // free dummy buffer
 | 
|---|
 | 5841 |                 if (scratch != buffer) global_deallocate(scratch);
 | 
|---|
 | 5842 | 
 | 
|---|
 | 5843 |                 return true;
 | 
|---|
 | 5844 |         }
 | 
|---|
 | 5845 |         
 | 
|---|
 | 5846 |         double round_nearest(double value)
 | 
|---|
 | 5847 |         {
 | 
|---|
 | 5848 |                 return floor(value + 0.5);
 | 
|---|
 | 5849 |         }
 | 
|---|
 | 5850 | 
 | 
|---|
 | 5851 |         double round_nearest_nzero(double value)
 | 
|---|
 | 5852 |         {
 | 
|---|
 | 5853 |                 // same as round_nearest, but returns -0 for [-0.5, -0]
 | 
|---|
 | 5854 |                 // ceil is used to differentiate between +0 and -0 (we return -0 for [-0.5, -0] and +0 for +0)
 | 
|---|
 | 5855 |                 return (value >= -0.5 && value <= 0) ? ceil(value) : floor(value + 0.5);
 | 
|---|
 | 5856 |         }
 | 
|---|
 | 5857 |         
 | 
|---|
 | 5858 |         const char_t* qualified_name(const xpath_node& node)
 | 
|---|
 | 5859 |         {
 | 
|---|
 | 5860 |                 return node.attribute() ? node.attribute().name() : node.node().name();
 | 
|---|
 | 5861 |         }
 | 
|---|
 | 5862 |         
 | 
|---|
 | 5863 |         const char_t* local_name(const xpath_node& node)
 | 
|---|
 | 5864 |         {
 | 
|---|
 | 5865 |                 const char_t* name = qualified_name(node);
 | 
|---|
 | 5866 |                 const char_t* p = find_char(name, ':');
 | 
|---|
 | 5867 |                 
 | 
|---|
 | 5868 |                 return p ? p + 1 : name;
 | 
|---|
 | 5869 |         }
 | 
|---|
 | 5870 | 
 | 
|---|
 | 5871 |         struct namespace_uri_predicate
 | 
|---|
 | 5872 |         {
 | 
|---|
 | 5873 |                 const char_t* prefix;
 | 
|---|
 | 5874 |                 size_t prefix_length;
 | 
|---|
 | 5875 | 
 | 
|---|
 | 5876 |                 namespace_uri_predicate(const char_t* name)
 | 
|---|
 | 5877 |                 {
 | 
|---|
 | 5878 |                         const char_t* pos = find_char(name, ':');
 | 
|---|
 | 5879 | 
 | 
|---|
 | 5880 |                         prefix = pos ? name : 0;
 | 
|---|
 | 5881 |                         prefix_length = pos ? static_cast<size_t>(pos - name) : 0;
 | 
|---|
 | 5882 |                 }
 | 
|---|
 | 5883 | 
 | 
|---|
 | 5884 |                 bool operator()(const xml_attribute& a) const
 | 
|---|
 | 5885 |                 {
 | 
|---|
 | 5886 |                         const char_t* name = a.name();
 | 
|---|
 | 5887 | 
 | 
|---|
 | 5888 |                         if (!starts_with(name, PUGIXML_TEXT("xmlns"))) return false;
 | 
|---|
 | 5889 | 
 | 
|---|
 | 5890 |                         return prefix ? name[5] == ':' && strequalrange(name + 6, prefix, prefix_length) : name[5] == 0;
 | 
|---|
 | 5891 |                 }
 | 
|---|
 | 5892 |         };
 | 
|---|
 | 5893 | 
 | 
|---|
 | 5894 |         const char_t* namespace_uri(const xml_node& node)
 | 
|---|
 | 5895 |         {
 | 
|---|
 | 5896 |                 namespace_uri_predicate pred = node.name();
 | 
|---|
 | 5897 |                 
 | 
|---|
 | 5898 |                 xml_node p = node;
 | 
|---|
 | 5899 |                 
 | 
|---|
 | 5900 |                 while (p)
 | 
|---|
 | 5901 |                 {
 | 
|---|
 | 5902 |                         xml_attribute a = p.find_attribute(pred);
 | 
|---|
 | 5903 |                         
 | 
|---|
 | 5904 |                         if (a) return a.value();
 | 
|---|
 | 5905 |                         
 | 
|---|
 | 5906 |                         p = p.parent();
 | 
|---|
 | 5907 |                 }
 | 
|---|
 | 5908 |                 
 | 
|---|
 | 5909 |                 return PUGIXML_TEXT("");
 | 
|---|
 | 5910 |         }
 | 
|---|
 | 5911 | 
 | 
|---|
 | 5912 |         const char_t* namespace_uri(const xml_attribute& attr, const xml_node& parent)
 | 
|---|
 | 5913 |         {
 | 
|---|
 | 5914 |                 namespace_uri_predicate pred = attr.name();
 | 
|---|
 | 5915 |                 
 | 
|---|
 | 5916 |                 // Default namespace does not apply to attributes
 | 
|---|
 | 5917 |                 if (!pred.prefix) return PUGIXML_TEXT("");
 | 
|---|
 | 5918 |                 
 | 
|---|
 | 5919 |                 xml_node p = parent;
 | 
|---|
 | 5920 |                 
 | 
|---|
 | 5921 |                 while (p)
 | 
|---|
 | 5922 |                 {
 | 
|---|
 | 5923 |                         xml_attribute a = p.find_attribute(pred);
 | 
|---|
 | 5924 |                         
 | 
|---|
 | 5925 |                         if (a) return a.value();
 | 
|---|
 | 5926 |                         
 | 
|---|
 | 5927 |                         p = p.parent();
 | 
|---|
 | 5928 |                 }
 | 
|---|
 | 5929 |                 
 | 
|---|
 | 5930 |                 return PUGIXML_TEXT("");
 | 
|---|
 | 5931 |         }
 | 
|---|
 | 5932 | 
 | 
|---|
 | 5933 |         const char_t* namespace_uri(const xpath_node& node)
 | 
|---|
 | 5934 |         {
 | 
|---|
 | 5935 |                 return node.attribute() ? namespace_uri(node.attribute(), node.parent()) : namespace_uri(node.node());
 | 
|---|
 | 5936 |         }
 | 
|---|
 | 5937 | 
 | 
|---|
 | 5938 |         void normalize_space(char_t* buffer)
 | 
|---|
 | 5939 |         {
 | 
|---|
 | 5940 |                 char_t* write = buffer;
 | 
|---|
 | 5941 | 
 | 
|---|
 | 5942 |                 for (char_t* it = buffer; *it; )
 | 
|---|
 | 5943 |                 {
 | 
|---|
 | 5944 |                         char_t ch = *it++;
 | 
|---|
 | 5945 | 
 | 
|---|
 | 5946 |                         if (IS_CHARTYPE(ch, ct_space))
 | 
|---|
 | 5947 |                         {
 | 
|---|
 | 5948 |                                 // replace whitespace sequence with single space
 | 
|---|
 | 5949 |                                 while (IS_CHARTYPE(*it, ct_space)) it++;
 | 
|---|
 | 5950 | 
 | 
|---|
 | 5951 |                                 // avoid leading spaces
 | 
|---|
 | 5952 |                                 if (write != buffer) *write++ = ' ';
 | 
|---|
 | 5953 |                         }
 | 
|---|
 | 5954 |                         else *write++ = ch;
 | 
|---|
 | 5955 |                 }
 | 
|---|
 | 5956 | 
 | 
|---|
 | 5957 |                 // remove trailing space
 | 
|---|
 | 5958 |                 if (write != buffer && IS_CHARTYPE(write[-1], ct_space)) write--;
 | 
|---|
 | 5959 | 
 | 
|---|
 | 5960 |                 // zero-terminate
 | 
|---|
 | 5961 |                 *write = 0;
 | 
|---|
 | 5962 |         }
 | 
|---|
 | 5963 | 
 | 
|---|
 | 5964 |         void translate(char_t* buffer, const char_t* from, const char_t* to)
 | 
|---|
 | 5965 |         {
 | 
|---|
 | 5966 |                 size_t to_length = strlength(to);
 | 
|---|
 | 5967 | 
 | 
|---|
 | 5968 |                 char_t* write = buffer;
 | 
|---|
 | 5969 | 
 | 
|---|
 | 5970 |                 while (*buffer)
 | 
|---|
 | 5971 |                 {
 | 
|---|
 | 5972 |                         DMC_VOLATILE char_t ch = *buffer++;
 | 
|---|
 | 5973 | 
 | 
|---|
 | 5974 |                         const char_t* pos = find_char(from, ch);
 | 
|---|
 | 5975 | 
 | 
|---|
 | 5976 |                         if (!pos)
 | 
|---|
 | 5977 |                                 *write++ = ch; // do not process
 | 
|---|
 | 5978 |                         else if (static_cast<size_t>(pos - from) < to_length)
 | 
|---|
 | 5979 |                                 *write++ = to[pos - from]; // replace
 | 
|---|
 | 5980 |                 }
 | 
|---|
 | 5981 | 
 | 
|---|
 | 5982 |                 // zero-terminate
 | 
|---|
 | 5983 |                 *write = 0;
 | 
|---|
 | 5984 |         }
 | 
|---|
 | 5985 | 
 | 
|---|
 | 5986 |         struct xpath_variable_boolean: xpath_variable
 | 
|---|
 | 5987 |         {
 | 
|---|
 | 5988 |                 xpath_variable_boolean(): value(false)
 | 
|---|
 | 5989 |                 {
 | 
|---|
 | 5990 |                 }
 | 
|---|
 | 5991 | 
 | 
|---|
 | 5992 |                 bool value;
 | 
|---|
 | 5993 |                 char_t name[1];
 | 
|---|
 | 5994 |         };
 | 
|---|
 | 5995 | 
 | 
|---|
 | 5996 |         struct xpath_variable_number: xpath_variable
 | 
|---|
 | 5997 |         {
 | 
|---|
 | 5998 |                 xpath_variable_number(): value(0)
 | 
|---|
 | 5999 |                 {
 | 
|---|
 | 6000 |                 }
 | 
|---|
 | 6001 | 
 | 
|---|
 | 6002 |                 double value;
 | 
|---|
 | 6003 |                 char_t name[1];
 | 
|---|
 | 6004 |         };
 | 
|---|
 | 6005 | 
 | 
|---|
 | 6006 |         struct xpath_variable_string: xpath_variable
 | 
|---|
 | 6007 |         {
 | 
|---|
 | 6008 |                 xpath_variable_string(): value(0)
 | 
|---|
 | 6009 |                 {
 | 
|---|
 | 6010 |                 }
 | 
|---|
 | 6011 | 
 | 
|---|
 | 6012 |                 ~xpath_variable_string()
 | 
|---|
 | 6013 |                 {
 | 
|---|
 | 6014 |                         if (value) global_deallocate(value);
 | 
|---|
 | 6015 |                 }
 | 
|---|
 | 6016 | 
 | 
|---|
 | 6017 |                 char_t* value;
 | 
|---|
 | 6018 |                 char_t name[1];
 | 
|---|
 | 6019 |         };
 | 
|---|
 | 6020 | 
 | 
|---|
 | 6021 |         struct xpath_variable_node_set: xpath_variable
 | 
|---|
 | 6022 |         {
 | 
|---|
 | 6023 |                 xpath_node_set value;
 | 
|---|
 | 6024 |                 char_t name[1];
 | 
|---|
 | 6025 |         };
 | 
|---|
 | 6026 | 
 | 
|---|
 | 6027 |         const xpath_node_set dummy_node_set;
 | 
|---|
 | 6028 | 
 | 
|---|
 | 6029 |         unsigned int hash_string(const char_t* str)
 | 
|---|
 | 6030 |         {
 | 
|---|
 | 6031 |                 // Jenkins one-at-a-time hash (http://en.wikipedia.org/wiki/Jenkins_hash_function#one-at-a-time)
 | 
|---|
 | 6032 |                 unsigned int result = 0;
 | 
|---|
 | 6033 | 
 | 
|---|
 | 6034 |                 while (*str)
 | 
|---|
 | 6035 |                 {
 | 
|---|
 | 6036 |                         result += static_cast<unsigned int>(*str++);
 | 
|---|
 | 6037 |                         result += result << 10;
 | 
|---|
 | 6038 |                         result ^= result >> 6;
 | 
|---|
 | 6039 |                 }
 | 
|---|
 | 6040 |         
 | 
|---|
 | 6041 |                 result += result << 3;
 | 
|---|
 | 6042 |                 result ^= result >> 11;
 | 
|---|
 | 6043 |                 result += result << 15;
 | 
|---|
 | 6044 |         
 | 
|---|
 | 6045 |                 return result;
 | 
|---|
 | 6046 |         }
 | 
|---|
 | 6047 | 
 | 
|---|
 | 6048 |         template <typename T> T* new_xpath_variable(const char_t* name)
 | 
|---|
 | 6049 |         {
 | 
|---|
 | 6050 |                 size_t length = strlength(name);
 | 
|---|
 | 6051 |                 if (length == 0) return 0; // empty variable names are invalid
 | 
|---|
 | 6052 | 
 | 
|---|
 | 6053 |                 // $$ we can't use offsetof(T, name) because T is non-POD, so we just allocate additional length characters
 | 
|---|
 | 6054 |                 void* memory = global_allocate(sizeof(T) + length * sizeof(char_t));
 | 
|---|
 | 6055 |                 if (!memory) return 0;
 | 
|---|
 | 6056 | 
 | 
|---|
 | 6057 |                 T* result = new (memory) T();
 | 
|---|
 | 6058 | 
 | 
|---|
 | 6059 |                 memcpy(result->name, name, (length + 1) * sizeof(char_t));
 | 
|---|
 | 6060 | 
 | 
|---|
 | 6061 |                 return result;
 | 
|---|
 | 6062 |         }
 | 
|---|
 | 6063 | 
 | 
|---|
 | 6064 |         xpath_variable* new_xpath_variable(xpath_value_type type, const char_t* name)
 | 
|---|
 | 6065 |         {
 | 
|---|
 | 6066 |                 switch (type)
 | 
|---|
 | 6067 |                 {
 | 
|---|
 | 6068 |                 case xpath_type_node_set:
 | 
|---|
 | 6069 |                         return new_xpath_variable<xpath_variable_node_set>(name);
 | 
|---|
 | 6070 | 
 | 
|---|
 | 6071 |                 case xpath_type_number:
 | 
|---|
 | 6072 |                         return new_xpath_variable<xpath_variable_number>(name);
 | 
|---|
 | 6073 | 
 | 
|---|
 | 6074 |                 case xpath_type_string:
 | 
|---|
 | 6075 |                         return new_xpath_variable<xpath_variable_string>(name);
 | 
|---|
 | 6076 | 
 | 
|---|
 | 6077 |                 case xpath_type_boolean:
 | 
|---|
 | 6078 |                         return new_xpath_variable<xpath_variable_boolean>(name);
 | 
|---|
 | 6079 | 
 | 
|---|
 | 6080 |                 default:
 | 
|---|
 | 6081 |                         return 0;
 | 
|---|
 | 6082 |                 }
 | 
|---|
 | 6083 |         }
 | 
|---|
 | 6084 | 
 | 
|---|
 // Destroys a variable object and releases its storage.
 // Counterpart of new_xpath_variable<T>(): that helper builds the object with
 // placement new inside a global_allocate() block, so the destructor is
 // invoked explicitly before the block goes back to global_deallocate().
 template <typename T> void delete_xpath_variable(T* var)
 {
     // run the destructor by hand
     var->~T();

     // then give the raw memory back
     global_deallocate(var);
 }
 | 
|---|
 | 6090 | 
 | 
|---|
 | 6091 |         void delete_xpath_variable(xpath_value_type type, xpath_variable* var)
 | 
|---|
 | 6092 |         {
 | 
|---|
 | 6093 |                 switch (type)
 | 
|---|
 | 6094 |                 {
 | 
|---|
 | 6095 |                 case xpath_type_node_set:
 | 
|---|
 | 6096 |                         delete_xpath_variable(static_cast<xpath_variable_node_set*>(var));
 | 
|---|
 | 6097 |                         break;
 | 
|---|
 | 6098 | 
 | 
|---|
 | 6099 |                 case xpath_type_number:
 | 
|---|
 | 6100 |                         delete_xpath_variable(static_cast<xpath_variable_number*>(var));
 | 
|---|
 | 6101 |                         break;
 | 
|---|
 | 6102 | 
 | 
|---|
 | 6103 |                 case xpath_type_string:
 | 
|---|
 | 6104 |                         delete_xpath_variable(static_cast<xpath_variable_string*>(var));
 | 
|---|
 | 6105 |                         break;
 | 
|---|
 | 6106 | 
 | 
|---|
 | 6107 |                 case xpath_type_boolean:
 | 
|---|
 | 6108 |                         delete_xpath_variable(static_cast<xpath_variable_boolean*>(var));
 | 
|---|
 | 6109 |                         break;
 | 
|---|
 | 6110 | 
 | 
|---|
 | 6111 |                 default:
 | 
|---|
 | 6112 |                         assert(!"Invalid variable type");
 | 
|---|
 | 6113 |                 }
 | 
|---|
 | 6114 |         }
 | 
|---|
 | 6115 | 
 | 
|---|
 | 6116 |         xpath_variable* get_variable(xpath_variable_set* set, const char_t* begin, const char_t* end)
 | 
|---|
 | 6117 |         {
 | 
|---|
 | 6118 |                 char_t buffer[32];
 | 
|---|
 | 6119 | 
 | 
|---|
 | 6120 |                 size_t length = static_cast<size_t>(end - begin);
 | 
|---|
 | 6121 |                 char_t* scratch = buffer;
 | 
|---|
 | 6122 | 
 | 
|---|
 | 6123 |                 if (length >= sizeof(buffer) / sizeof(buffer[0]))
 | 
|---|
 | 6124 |                 {
 | 
|---|
 | 6125 |                         // need to make dummy on-heap copy
 | 
|---|
 | 6126 |                         scratch = static_cast<char_t*>(global_allocate((length + 1) * sizeof(char_t)));
 | 
|---|
 | 6127 |                         if (!scratch) return 0;
 | 
|---|
 | 6128 |                 }
 | 
|---|
 | 6129 | 
 | 
|---|
 | 6130 |                 // copy string to zero-terminated buffer and perform lookup
 | 
|---|
 | 6131 |                 memcpy(scratch, begin, length * sizeof(char_t));
 | 
|---|
 | 6132 |                 scratch[length] = 0;
 | 
|---|
 | 6133 | 
 | 
|---|
 | 6134 |                 xpath_variable* result = set->get(scratch);
 | 
|---|
 | 6135 | 
 | 
|---|
 | 6136 |                 // free dummy buffer
 | 
|---|
 | 6137 |                 if (scratch != buffer) global_deallocate(scratch);
 | 
|---|
 | 6138 | 
 | 
|---|
 | 6139 |                 return result;
 | 
|---|
 | 6140 |         }
 | 
|---|
 | 6141 | }
 | 
|---|
 | 6142 | 
 | 
|---|
 | 6143 | // Internal node set class
 | 
|---|
 | 6144 | namespace
 | 
|---|
 | 6145 | {
 | 
|---|
 | 6146 |         xpath_node_set::type_t xpath_sort(xpath_node* begin, xpath_node* end, xpath_node_set::type_t type, bool rev)
 | 
|---|
 | 6147 |         {
 | 
|---|
 | 6148 |                 xpath_node_set::type_t order = rev ? xpath_node_set::type_sorted_reverse : xpath_node_set::type_sorted;
 | 
|---|
 | 6149 | 
 | 
|---|
 | 6150 |                 if (type == xpath_node_set::type_unsorted)
 | 
|---|
 | 6151 |                 {
 | 
|---|
 | 6152 |                         sort(begin, end, document_order_comparator());
 | 
|---|
 | 6153 | 
 | 
|---|
 | 6154 |                         type = xpath_node_set::type_sorted;
 | 
|---|
 | 6155 |                 }
 | 
|---|
 | 6156 |                 
 | 
|---|
 | 6157 |                 if (type != order) reverse(begin, end);
 | 
|---|
 | 6158 |                         
 | 
|---|
 | 6159 |                 return order;
 | 
|---|
 | 6160 |         }
 | 
|---|
 | 6161 | 
 | 
|---|
 | 6162 |         xpath_node xpath_first(const xpath_node* begin, const xpath_node* end, xpath_node_set::type_t type)
 | 
|---|
 | 6163 |         {
 | 
|---|
 | 6164 |                 if (begin == end) return xpath_node();
 | 
|---|
 | 6165 | 
 | 
|---|
 | 6166 |                 switch (type)
 | 
|---|
 | 6167 |                 {
 | 
|---|
 | 6168 |                 case xpath_node_set::type_sorted:
 | 
|---|
 | 6169 |                         return *begin;
 | 
|---|
 | 6170 | 
 | 
|---|
 | 6171 |                 case xpath_node_set::type_sorted_reverse:
 | 
|---|
 | 6172 |                         return *(end - 1);
 | 
|---|
 | 6173 | 
 | 
|---|
 | 6174 |                 case xpath_node_set::type_unsorted:
 | 
|---|
 | 6175 |                         return *min_element(begin, end, document_order_comparator());
 | 
|---|
 | 6176 | 
 | 
|---|
 | 6177 |                 default:
 | 
|---|
 | 6178 |                         assert(!"Invalid node set type");
 | 
|---|
 | 6179 |                         return xpath_node();
 | 
|---|
 | 6180 |                 }
 | 
|---|
 | 6181 |         }
 | 
|---|
 | 6182 |         class xpath_node_set_raw
 | 
|---|
 | 6183 |         {
 | 
|---|
 | 6184 |                 xpath_node_set::type_t _type;
 | 
|---|
 | 6185 | 
 | 
|---|
 | 6186 |                 xpath_node* _begin;
 | 
|---|
 | 6187 |                 xpath_node* _end;
 | 
|---|
 | 6188 |                 xpath_node* _eos;
 | 
|---|
 | 6189 | 
 | 
|---|
 | 6190 |         public:
 | 
|---|
 | 6191 |                 xpath_node_set_raw(): _type(xpath_node_set::type_unsorted), _begin(0), _end(0), _eos(0)
 | 
|---|
 | 6192 |                 {
 | 
|---|
 | 6193 |                 }
 | 
|---|
 | 6194 | 
 | 
|---|
 | 6195 |                 xpath_node* begin() const
 | 
|---|
 | 6196 |                 {
 | 
|---|
 | 6197 |                         return _begin;
 | 
|---|
 | 6198 |                 }
 | 
|---|
 | 6199 | 
 | 
|---|
 | 6200 |                 xpath_node* end() const
 | 
|---|
 | 6201 |                 {
 | 
|---|
 | 6202 |                         return _end;
 | 
|---|
 | 6203 |                 }
 | 
|---|
 | 6204 | 
 | 
|---|
 | 6205 |                 bool empty() const
 | 
|---|
 | 6206 |                 {
 | 
|---|
 | 6207 |                         return _begin == _end;
 | 
|---|
 | 6208 |                 }
 | 
|---|
 | 6209 | 
 | 
|---|
 | 6210 |                 size_t size() const
 | 
|---|
 | 6211 |                 {
 | 
|---|
 | 6212 |                         return static_cast<size_t>(_end - _begin);
 | 
|---|
 | 6213 |                 }
 | 
|---|
 | 6214 | 
 | 
|---|
 | 6215 |                 xpath_node first() const
 | 
|---|
 | 6216 |                 {
 | 
|---|
 | 6217 |                         return xpath_first(_begin, _end, _type);
 | 
|---|
 | 6218 |                 }
 | 
|---|
 | 6219 | 
 | 
|---|
 | 6220 |                 void push_back(const xpath_node& node, xpath_allocator* alloc)
 | 
|---|
 | 6221 |                 {
 | 
|---|
 | 6222 |                         if (_end == _eos)
 | 
|---|
 | 6223 |                         {
 | 
|---|
 | 6224 |                                 size_t capacity = static_cast<size_t>(_eos - _begin);
 | 
|---|
 | 6225 | 
 | 
|---|
 | 6226 |                                 // get new capacity (1.5x rule)
 | 
|---|
 | 6227 |                                 size_t new_capacity = capacity + capacity / 2 + 1;
 | 
|---|
 | 6228 | 
 | 
|---|
 | 6229 |                                 // reallocate the old array or allocate a new one
 | 
|---|
 | 6230 |                                 xpath_node* data = static_cast<xpath_node*>(alloc->reallocate(_begin, capacity * sizeof(xpath_node), new_capacity * sizeof(xpath_node)));
 | 
|---|
 | 6231 |                                 assert(data);
 | 
|---|
 | 6232 | 
 | 
|---|
 | 6233 |                                 // finalize
 | 
|---|
 | 6234 |                                 _begin = data;
 | 
|---|
 | 6235 |                                 _end = data + capacity;
 | 
|---|
 | 6236 |                                 _eos = data + new_capacity;
 | 
|---|
 | 6237 |                         }
 | 
|---|
 | 6238 | 
 | 
|---|
 | 6239 |                         *_end++ = node;
 | 
|---|
 | 6240 |                 }
 | 
|---|
 | 6241 | 
 | 
|---|
 | 6242 |                 void append(const xpath_node* begin, const xpath_node* end, xpath_allocator* alloc)
 | 
|---|
 | 6243 |                 {
 | 
|---|
 | 6244 |                         size_t size = static_cast<size_t>(_end - _begin);
 | 
|---|
 | 6245 |                         size_t capacity = static_cast<size_t>(_eos - _begin);
 | 
|---|
 | 6246 |                         size_t count = static_cast<size_t>(end - begin);
 | 
|---|
 | 6247 | 
 | 
|---|
 | 6248 |                         if (size + count > capacity)
 | 
|---|
 | 6249 |                         {
 | 
|---|
 | 6250 |                                 // reallocate the old array or allocate a new one
 | 
|---|
 | 6251 |                                 xpath_node* data = static_cast<xpath_node*>(alloc->reallocate(_begin, capacity * sizeof(xpath_node), (size + count) * sizeof(xpath_node)));
 | 
|---|
 | 6252 |                                 assert(data);
 | 
|---|
 | 6253 | 
 | 
|---|
 | 6254 |                                 // finalize
 | 
|---|
 | 6255 |                                 _begin = data;
 | 
|---|
 | 6256 |                                 _end = data + size;
 | 
|---|
 | 6257 |                                 _eos = data + size + count;
 | 
|---|
 | 6258 |                         }
 | 
|---|
 | 6259 | 
 | 
|---|
 | 6260 |                         memcpy(_end, begin, count * sizeof(xpath_node));
 | 
|---|
 | 6261 |                         _end += count;
 | 
|---|
 | 6262 |                 }
 | 
|---|
 | 6263 | 
 | 
|---|
 | 6264 |                 void sort_do()
 | 
|---|
 | 6265 |                 {
 | 
|---|
 | 6266 |                         _type = xpath_sort(_begin, _end, _type, false);
 | 
|---|
 | 6267 |                 }
 | 
|---|
 | 6268 | 
 | 
|---|
 | 6269 |                 void truncate(xpath_node* pos)
 | 
|---|
 | 6270 |                 {
 | 
|---|
 | 6271 |                         assert(_begin <= pos && pos <= _end);
 | 
|---|
 | 6272 | 
 | 
|---|
 | 6273 |                         _end = pos;
 | 
|---|
 | 6274 |                 }
 | 
|---|
 | 6275 | 
 | 
|---|
 | 6276 |                 void remove_duplicates()
 | 
|---|
 | 6277 |                 {
 | 
|---|
 | 6278 |                         if (_type == xpath_node_set::type_unsorted)
 | 
|---|
 | 6279 |                                 sort(_begin, _end, duplicate_comparator());
 | 
|---|
 | 6280 |                 
 | 
|---|
 | 6281 |                         _end = unique(_begin, _end);
 | 
|---|
 | 6282 |                 }
 | 
|---|
 | 6283 | 
 | 
|---|
 | 6284 |                 xpath_node_set::type_t type() const
 | 
|---|
 | 6285 |                 {
 | 
|---|
 | 6286 |                         return _type;
 | 
|---|
 | 6287 |                 }
 | 
|---|
 | 6288 | 
 | 
|---|
 | 6289 |                 void set_type(xpath_node_set::type_t type)
 | 
|---|
 | 6290 |                 {
 | 
|---|
 | 6291 |                         _type = type;
 | 
|---|
 | 6292 |                 }
 | 
|---|
 | 6293 |         };
 | 
|---|
 | 6294 | }
 | 
|---|
 | 6295 | 
 | 
|---|
 | 6296 | namespace
 | 
|---|
 | 6297 | {
 | 
|---|
 | 6298 |         struct xpath_context
 | 
|---|
 | 6299 |         {
 | 
|---|
 | 6300 |                 xpath_node n;
 | 
|---|
 | 6301 |                 size_t position, size;
 | 
|---|
 | 6302 | 
 | 
|---|
 | 6303 |                 xpath_context(const xpath_node& n, size_t position, size_t size): n(n), position(position), size(size)
 | 
|---|
 | 6304 |                 {
 | 
|---|
 | 6305 |                 }
 | 
|---|
 | 6306 |         };
 | 
|---|
 | 6307 | 
 | 
|---|
 // Token kinds produced by xpath_lexer::next().
 // The character sequences noted below are the ones the lexer matches.
 enum lexeme_t
 {
     lex_none = 0,            // unrecognized input (e.g. lone '!', lone ':', '$' without a name, unterminated quote)
     lex_equal,               // =
     lex_not_equal,           // !=
     lex_less,                // <
     lex_greater,             // >
     lex_less_or_equal,       // <=
     lex_greater_or_equal,    // >=
     lex_plus,                // +
     lex_minus,               // -
     lex_multiply,            // *
     lex_union,               // |
     lex_var_ref,             // $name or $prefix:name; contents exclude the '$'
     lex_open_brace,          // (
     lex_close_brace,         // )
     lex_quoted_string,       // '...' or "..."; contents exclude the quotes
     lex_number,              // numeric literal such as .5
     lex_slash,               // /
     lex_double_slash,        // //
     lex_open_square_brace,   // [
     lex_close_square_brace,  // ]
     lex_string,              // NOTE(review): presumably a name token - confirm in the lexer
     lex_comma,               // ,
     lex_axis_attribute,      // @
     lex_dot,                 // .
     lex_double_dot,          // ..
     lex_double_colon,        // ::
     lex_eof                  // end of the query string
 };
 | 
|---|
 | 6338 | 
 | 
|---|
 | 6339 |         struct xpath_lexer_string
 | 
|---|
 | 6340 |         {
 | 
|---|
 | 6341 |                 const char_t* begin;
 | 
|---|
 | 6342 |                 const char_t* end;
 | 
|---|
 | 6343 | 
 | 
|---|
 | 6344 |                 xpath_lexer_string(): begin(0), end(0)
 | 
|---|
 | 6345 |                 {
 | 
|---|
 | 6346 |                 }
 | 
|---|
 | 6347 | 
 | 
|---|
 | 6348 |                 bool operator==(const char_t* other) const
 | 
|---|
 | 6349 |                 {
 | 
|---|
 | 6350 |                         size_t length = static_cast<size_t>(end - begin);
 | 
|---|
 | 6351 | 
 | 
|---|
 | 6352 |                         return strequalrange(other, begin, length);
 | 
|---|
 | 6353 |                 }
 | 
|---|
 | 6354 |         };
 | 
|---|
 | 6355 | 
 | 
|---|
 | 6356 |         class xpath_lexer
 | 
|---|
 | 6357 |         {
 | 
|---|
 | 6358 |                 const char_t* _cur;
 | 
|---|
 | 6359 |                 const char_t* _cur_lexeme_pos;
 | 
|---|
 | 6360 |                 xpath_lexer_string _cur_lexeme_contents;
 | 
|---|
 | 6361 | 
 | 
|---|
 | 6362 |                 lexeme_t _cur_lexeme;
 | 
|---|
 | 6363 | 
 | 
|---|
 | 6364 |         public:
 | 
|---|
 | 6365 |                 explicit xpath_lexer(const char_t* query): _cur(query)
 | 
|---|
 | 6366 |                 {
 | 
|---|
 | 6367 |                         next();
 | 
|---|
 | 6368 |                 }
 | 
|---|
 | 6369 |                 
 | 
|---|
 | 6370 |                 const char_t* state() const
 | 
|---|
 | 6371 |                 {
 | 
|---|
 | 6372 |                         return _cur;
 | 
|---|
 | 6373 |                 }
 | 
|---|
 | 6374 |                 
 | 
|---|
 | 6375 |                 void next()
 | 
|---|
 | 6376 |                 {
 | 
|---|
 | 6377 |                         const char_t* cur = _cur;
 | 
|---|
 | 6378 | 
 | 
|---|
 | 6379 |                         while (IS_CHARTYPE(*cur, ct_space)) ++cur;
 | 
|---|
 | 6380 | 
 | 
|---|
 | 6381 |                         // save lexeme position for error reporting
 | 
|---|
 | 6382 |                         _cur_lexeme_pos = cur;
 | 
|---|
 | 6383 | 
 | 
|---|
 | 6384 |                         switch (*cur)
 | 
|---|
 | 6385 |                         {
 | 
|---|
 | 6386 |                         case 0:
 | 
|---|
 | 6387 |                                 _cur_lexeme = lex_eof;
 | 
|---|
 | 6388 |                                 break;
 | 
|---|
 | 6389 |                         
 | 
|---|
 | 6390 |                         case '>':
 | 
|---|
 | 6391 |                                 if (*(cur+1) == '=')
 | 
|---|
 | 6392 |                                 {
 | 
|---|
 | 6393 |                                         cur += 2;
 | 
|---|
 | 6394 |                                         _cur_lexeme = lex_greater_or_equal;
 | 
|---|
 | 6395 |                                 }
 | 
|---|
 | 6396 |                                 else
 | 
|---|
 | 6397 |                                 {
 | 
|---|
 | 6398 |                                         cur += 1;
 | 
|---|
 | 6399 |                                         _cur_lexeme = lex_greater;
 | 
|---|
 | 6400 |                                 }
 | 
|---|
 | 6401 |                                 break;
 | 
|---|
 | 6402 | 
 | 
|---|
 | 6403 |                         case '<':
 | 
|---|
 | 6404 |                                 if (*(cur+1) == '=')
 | 
|---|
 | 6405 |                                 {
 | 
|---|
 | 6406 |                                         cur += 2;
 | 
|---|
 | 6407 |                                         _cur_lexeme = lex_less_or_equal;
 | 
|---|
 | 6408 |                                 }
 | 
|---|
 | 6409 |                                 else
 | 
|---|
 | 6410 |                                 {
 | 
|---|
 | 6411 |                                         cur += 1;
 | 
|---|
 | 6412 |                                         _cur_lexeme = lex_less;
 | 
|---|
 | 6413 |                                 }
 | 
|---|
 | 6414 |                                 break;
 | 
|---|
 | 6415 | 
 | 
|---|
 | 6416 |                         case '!':
 | 
|---|
 | 6417 |                                 if (*(cur+1) == '=')
 | 
|---|
 | 6418 |                                 {
 | 
|---|
 | 6419 |                                         cur += 2;
 | 
|---|
 | 6420 |                                         _cur_lexeme = lex_not_equal;
 | 
|---|
 | 6421 |                                 }
 | 
|---|
 | 6422 |                                 else
 | 
|---|
 | 6423 |                                 {
 | 
|---|
 | 6424 |                                         _cur_lexeme = lex_none;
 | 
|---|
 | 6425 |                                 }
 | 
|---|
 | 6426 |                                 break;
 | 
|---|
 | 6427 | 
 | 
|---|
 | 6428 |                         case '=':
 | 
|---|
 | 6429 |                                 cur += 1;
 | 
|---|
 | 6430 |                                 _cur_lexeme = lex_equal;
 | 
|---|
 | 6431 | 
 | 
|---|
 | 6432 |                                 break;
 | 
|---|
 | 6433 |                         
 | 
|---|
 | 6434 |                         case '+':
 | 
|---|
 | 6435 |                                 cur += 1;
 | 
|---|
 | 6436 |                                 _cur_lexeme = lex_plus;
 | 
|---|
 | 6437 | 
 | 
|---|
 | 6438 |                                 break;
 | 
|---|
 | 6439 | 
 | 
|---|
 | 6440 |                         case '-':
 | 
|---|
 | 6441 |                                 cur += 1;
 | 
|---|
 | 6442 |                                 _cur_lexeme = lex_minus;
 | 
|---|
 | 6443 | 
 | 
|---|
 | 6444 |                                 break;
 | 
|---|
 | 6445 | 
 | 
|---|
 | 6446 |                         case '*':
 | 
|---|
 | 6447 |                                 cur += 1;
 | 
|---|
 | 6448 |                                 _cur_lexeme = lex_multiply;
 | 
|---|
 | 6449 | 
 | 
|---|
 | 6450 |                                 break;
 | 
|---|
 | 6451 | 
 | 
|---|
 | 6452 |                         case '|':
 | 
|---|
 | 6453 |                                 cur += 1;
 | 
|---|
 | 6454 |                                 _cur_lexeme = lex_union;
 | 
|---|
 | 6455 | 
 | 
|---|
 | 6456 |                                 break;
 | 
|---|
 | 6457 |                         
 | 
|---|
 | 6458 |                         case '$':
 | 
|---|
 | 6459 |                                 cur += 1;
 | 
|---|
 | 6460 | 
 | 
|---|
 | 6461 |                                 if (IS_CHARTYPEX(*cur, ctx_start_symbol))
 | 
|---|
 | 6462 |                                 {
 | 
|---|
 | 6463 |                                         _cur_lexeme_contents.begin = cur;
 | 
|---|
 | 6464 | 
 | 
|---|
 | 6465 |                                         while (IS_CHARTYPEX(*cur, ctx_symbol)) cur++;
 | 
|---|
 | 6466 | 
 | 
|---|
 | 6467 |                                         if (cur[0] == ':' && IS_CHARTYPEX(cur[1], ctx_symbol)) // qname
 | 
|---|
 | 6468 |                                         {
 | 
|---|
 | 6469 |                                                 cur++; // :
 | 
|---|
 | 6470 | 
 | 
|---|
 | 6471 |                                                 while (IS_CHARTYPEX(*cur, ctx_symbol)) cur++;
 | 
|---|
 | 6472 |                                         }
 | 
|---|
 | 6473 | 
 | 
|---|
 | 6474 |                                         _cur_lexeme_contents.end = cur;
 | 
|---|
 | 6475 |                                 
 | 
|---|
 | 6476 |                                         _cur_lexeme = lex_var_ref;
 | 
|---|
 | 6477 |                                 }
 | 
|---|
 | 6478 |                                 else
 | 
|---|
 | 6479 |                                 {
 | 
|---|
 | 6480 |                                         _cur_lexeme = lex_none;
 | 
|---|
 | 6481 |                                 }
 | 
|---|
 | 6482 | 
 | 
|---|
 | 6483 |                                 break;
 | 
|---|
 | 6484 | 
 | 
|---|
 | 6485 |                         case '(':
 | 
|---|
 | 6486 |                                 cur += 1;
 | 
|---|
 | 6487 |                                 _cur_lexeme = lex_open_brace;
 | 
|---|
 | 6488 | 
 | 
|---|
 | 6489 |                                 break;
 | 
|---|
 | 6490 | 
 | 
|---|
 | 6491 |                         case ')':
 | 
|---|
 | 6492 |                                 cur += 1;
 | 
|---|
 | 6493 |                                 _cur_lexeme = lex_close_brace;
 | 
|---|
 | 6494 | 
 | 
|---|
 | 6495 |                                 break;
 | 
|---|
 | 6496 |                         
 | 
|---|
 | 6497 |                         case '[':
 | 
|---|
 | 6498 |                                 cur += 1;
 | 
|---|
 | 6499 |                                 _cur_lexeme = lex_open_square_brace;
 | 
|---|
 | 6500 | 
 | 
|---|
 | 6501 |                                 break;
 | 
|---|
 | 6502 | 
 | 
|---|
 | 6503 |                         case ']':
 | 
|---|
 | 6504 |                                 cur += 1;
 | 
|---|
 | 6505 |                                 _cur_lexeme = lex_close_square_brace;
 | 
|---|
 | 6506 | 
 | 
|---|
 | 6507 |                                 break;
 | 
|---|
 | 6508 | 
 | 
|---|
 | 6509 |                         case ',':
 | 
|---|
 | 6510 |                                 cur += 1;
 | 
|---|
 | 6511 |                                 _cur_lexeme = lex_comma;
 | 
|---|
 | 6512 | 
 | 
|---|
 | 6513 |                                 break;
 | 
|---|
 | 6514 | 
 | 
|---|
 | 6515 |                         case '/':
 | 
|---|
 | 6516 |                                 if (*(cur+1) == '/')
 | 
|---|
 | 6517 |                                 {
 | 
|---|
 | 6518 |                                         cur += 2;
 | 
|---|
 | 6519 |                                         _cur_lexeme = lex_double_slash;
 | 
|---|
 | 6520 |                                 }
 | 
|---|
 | 6521 |                                 else
 | 
|---|
 | 6522 |                                 {
 | 
|---|
 | 6523 |                                         cur += 1;
 | 
|---|
 | 6524 |                                         _cur_lexeme = lex_slash;
 | 
|---|
 | 6525 |                                 }
 | 
|---|
 | 6526 |                                 break;
 | 
|---|
 | 6527 |                 
 | 
|---|
 | 6528 |                         case '.':
 | 
|---|
 | 6529 |                                 if (*(cur+1) == '.')
 | 
|---|
 | 6530 |                                 {
 | 
|---|
 | 6531 |                                         cur += 2;
 | 
|---|
 | 6532 |                                         _cur_lexeme = lex_double_dot;
 | 
|---|
 | 6533 |                                 }
 | 
|---|
 | 6534 |                                 else if (IS_CHARTYPEX(*(cur+1), ctx_digit))
 | 
|---|
 | 6535 |                                 {
 | 
|---|
 | 6536 |                                         _cur_lexeme_contents.begin = cur; // .
 | 
|---|
 | 6537 | 
 | 
|---|
 | 6538 |                                         ++cur;
 | 
|---|
 | 6539 | 
 | 
|---|
 | 6540 |                                         while (IS_CHARTYPEX(*cur, ctx_digit)) cur++;
 | 
|---|
 | 6541 | 
 | 
|---|
 | 6542 |                                         _cur_lexeme_contents.end = cur;
 | 
|---|
 | 6543 |                                         
 | 
|---|
 | 6544 |                                         _cur_lexeme = lex_number;
 | 
|---|
 | 6545 |                                 }
 | 
|---|
 | 6546 |                                 else
 | 
|---|
 | 6547 |                                 {
 | 
|---|
 | 6548 |                                         cur += 1;
 | 
|---|
 | 6549 |                                         _cur_lexeme = lex_dot;
 | 
|---|
 | 6550 |                                 }
 | 
|---|
 | 6551 |                                 break;
 | 
|---|
 | 6552 | 
 | 
|---|
 | 6553 |                         case '@':
 | 
|---|
 | 6554 |                                 cur += 1;
 | 
|---|
 | 6555 |                                 _cur_lexeme = lex_axis_attribute;
 | 
|---|
 | 6556 | 
 | 
|---|
 | 6557 |                                 break;
 | 
|---|
 | 6558 | 
 | 
|---|
 | 6559 |                         case '"':
 | 
|---|
 | 6560 |                         case '\'':
 | 
|---|
 | 6561 |                         {
 | 
|---|
 | 6562 |                                 char_t terminator = *cur;
 | 
|---|
 | 6563 | 
 | 
|---|
 | 6564 |                                 ++cur;
 | 
|---|
 | 6565 | 
 | 
|---|
 | 6566 |                                 _cur_lexeme_contents.begin = cur;
 | 
|---|
 | 6567 |                                 while (*cur && *cur != terminator) cur++;
 | 
|---|
 | 6568 |                                 _cur_lexeme_contents.end = cur;
 | 
|---|
 | 6569 |                                 
 | 
|---|
 | 6570 |                                 if (!*cur)
 | 
|---|
 | 6571 |                                         _cur_lexeme = lex_none;
 | 
|---|
 | 6572 |                                 else
 | 
|---|
 | 6573 |                                 {
 | 
|---|
 | 6574 |                                         cur += 1;
 | 
|---|
 | 6575 |                                         _cur_lexeme = lex_quoted_string;
 | 
|---|
 | 6576 |                                 }
 | 
|---|
 | 6577 | 
 | 
|---|
 | 6578 |                                 break;
 | 
|---|
 | 6579 |                         }
 | 
|---|
 | 6580 | 
 | 
|---|
 | 6581 |                         case ':':
 | 
|---|
 | 6582 |                                 if (*(cur+1) == ':')
 | 
|---|
 | 6583 |                                 {
 | 
|---|
 | 6584 |                                         cur += 2;
 | 
|---|
 | 6585 |                                         _cur_lexeme = lex_double_colon;
 | 
|---|
 | 6586 |                                 }
 | 
|---|
 | 6587 |                                 else
 | 
|---|
 | 6588 |                                 {
 | 
|---|
 | 6589 |                                         _cur_lexeme = lex_none;
 | 
|---|
 | 6590 |                                 }
 | 
|---|
 | 6591 |                                 break;
 | 
|---|
 | 6592 | 
 | 
|---|
 | 6593 |                         default:
 | 
|---|
 | 6594 |                                 if (IS_CHARTYPEX(*cur, ctx_digit))
 | 
|---|
 | 6595 |                                 {
 | 
|---|
 | 6596 |                                         _cur_lexeme_contents.begin = cur;
 | 
|---|
 | 6597 | 
 | 
|---|
 | 6598 |                                         while (IS_CHARTYPEX(*cur, ctx_digit)) cur++;
 | 
|---|
 | 6599 |                                 
 | 
|---|
 | 6600 |                                         if (*cur == '.')
 | 
|---|
 | 6601 |                                         {
 | 
|---|
 | 6602 |                                                 cur++;
 | 
|---|
 | 6603 | 
 | 
|---|
 | 6604 |                                                 while (IS_CHARTYPEX(*cur, ctx_digit)) cur++;
 | 
|---|
 | 6605 |                                         }
 | 
|---|
 | 6606 | 
 | 
|---|
 | 6607 |                                         _cur_lexeme_contents.end = cur;
 | 
|---|
 | 6608 | 
 | 
|---|
 | 6609 |                                         _cur_lexeme = lex_number;
 | 
|---|
 | 6610 |                                 }
 | 
|---|
 | 6611 |                                 else if (IS_CHARTYPEX(*cur, ctx_start_symbol))
 | 
|---|
 | 6612 |                                 {
 | 
|---|
 | 6613 |                                         _cur_lexeme_contents.begin = cur;
 | 
|---|
 | 6614 | 
 | 
|---|
 | 6615 |                                         while (IS_CHARTYPEX(*cur, ctx_symbol)) cur++;
 | 
|---|
 | 6616 | 
 | 
|---|
 | 6617 |                                         if (cur[0] == ':')
 | 
|---|
 | 6618 |                                         {
 | 
|---|
 | 6619 |                                                 if (cur[1] == '*') // namespace test ncname:*
 | 
|---|
 | 6620 |                                                 {
 | 
|---|
 | 6621 |                                                         cur += 2; // :*
 | 
|---|
 | 6622 |                                                 }
 | 
|---|
 | 6623 |                                                 else if (IS_CHARTYPEX(cur[1], ctx_symbol)) // namespace test qname
 | 
|---|
 | 6624 |                                                 {
 | 
|---|
 | 6625 |                                                         cur++; // :
 | 
|---|
 | 6626 | 
 | 
|---|
 | 6627 |                                                         while (IS_CHARTYPEX(*cur, ctx_symbol)) cur++;
 | 
|---|
 | 6628 |                                                 }
 | 
|---|
 | 6629 |                                         }
 | 
|---|
 | 6630 | 
 | 
|---|
 | 6631 |                                         _cur_lexeme_contents.end = cur;
 | 
|---|
 | 6632 |                                 
 | 
|---|
 | 6633 |                                         _cur_lexeme = lex_string;
 | 
|---|
 | 6634 |                                 }
 | 
|---|
 | 6635 |                                 else
 | 
|---|
 | 6636 |                                 {
 | 
|---|
 | 6637 |                                         _cur_lexeme = lex_none;
 | 
|---|
 | 6638 |                                 }
 | 
|---|
 | 6639 |                         }
 | 
|---|
 | 6640 | 
 | 
|---|
 | 6641 |                         _cur = cur;
 | 
|---|
 | 6642 |                 }
 | 
|---|
 | 6643 | 
 | 
|---|
 | 6644 |                 lexeme_t current() const
 | 
|---|
 | 6645 |                 {
 | 
|---|
 | 6646 |                         return _cur_lexeme;
 | 
|---|
 | 6647 |                 }
 | 
|---|
 | 6648 | 
 | 
|---|
 | 6649 |                 const char_t* current_pos() const
 | 
|---|
 | 6650 |                 {
 | 
|---|
 | 6651 |                         return _cur_lexeme_pos;
 | 
|---|
 | 6652 |                 }
 | 
|---|
 | 6653 | 
 | 
|---|
 | 6654 |                 const xpath_lexer_string& contents() const
 | 
|---|
 | 6655 |                 {
 | 
|---|
 | 6656 |                         assert(_cur_lexeme == lex_var_ref || _cur_lexeme == lex_number || _cur_lexeme == lex_string || _cur_lexeme == lex_quoted_string);
 | 
|---|
 | 6657 | 
 | 
|---|
 | 6658 |                         return _cur_lexeme_contents;
 | 
|---|
 | 6659 |                 }
 | 
|---|
 | 6660 |         };
 | 
|---|
 | 6661 | 
 | 
|---|
 | 6662 |         enum ast_type_t
 | 
|---|
 | 6663 |         {
 | 
|---|
 | 6664 |                 ast_op_or,                                              // left or right
 | 
|---|
 | 6665 |                 ast_op_and,                                             // left and right
 | 
|---|
 | 6666 |                 ast_op_equal,                                   // left = right
 | 
|---|
 | 6667 |                 ast_op_not_equal,                               // left != right
 | 
|---|
 | 6668 |                 ast_op_less,                                    // left < right
 | 
|---|
 | 6669 |                 ast_op_greater,                                 // left > right
 | 
|---|
 | 6670 |                 ast_op_less_or_equal,                   // left <= right
 | 
|---|
 | 6671 |                 ast_op_greater_or_equal,                // left >= right
 | 
|---|
 | 6672 |                 ast_op_add,                                             // left + right
 | 
|---|
 | 6673 |                 ast_op_subtract,                                // left - right
 | 
|---|
 | 6674 |                 ast_op_multiply,                                // left * right
 | 
|---|
 | 6675 |                 ast_op_divide,                                  // left / right
 | 
|---|
 | 6676 |                 ast_op_mod,                                             // left % right
 | 
|---|
 | 6677 |                 ast_op_negate,                                  // left - right
 | 
|---|
 | 6678 |                 ast_op_union,                                   // left | right
 | 
|---|
 | 6679 |                 ast_predicate,                                  // apply predicate to set; next points to next predicate
 | 
|---|
 | 6680 |                 ast_filter,                                             // select * from left where right
 | 
|---|
 | 6681 |                 ast_filter_posinv,                              // select * from left where right; proximity position invariant
 | 
|---|
 | 6682 |                 ast_string_constant,                    // string constant
 | 
|---|
 | 6683 |                 ast_number_constant,                    // number constant
 | 
|---|
 | 6684 |                 ast_variable,                                   // variable
 | 
|---|
 | 6685 |                 ast_func_last,                                  // last()
 | 
|---|
 | 6686 |                 ast_func_position,                              // position()
 | 
|---|
 | 6687 |                 ast_func_count,                                 // count(left)
 | 
|---|
 | 6688 |                 ast_func_id,                                    // id(left)
 | 
|---|
 | 6689 |                 ast_func_local_name_0,                  // local-name()
 | 
|---|
 | 6690 |                 ast_func_local_name_1,                  // local-name(left)
 | 
|---|
 | 6691 |                 ast_func_namespace_uri_0,               // namespace-uri()
 | 
|---|
 | 6692 |                 ast_func_namespace_uri_1,               // namespace-uri(left)
 | 
|---|
 | 6693 |                 ast_func_name_0,                                // name()
 | 
|---|
 | 6694 |                 ast_func_name_1,                                // name(left)
 | 
|---|
 | 6695 |                 ast_func_string_0,                              // string()
 | 
|---|
 | 6696 |                 ast_func_string_1,                              // string(left)
 | 
|---|
 | 6697 |                 ast_func_concat,                                // concat(left, right, siblings)
 | 
|---|
 | 6698 |                 ast_func_starts_with,                   // starts_with(left, right)
 | 
|---|
 | 6699 |                 ast_func_contains,                              // contains(left, right)
 | 
|---|
 | 6700 |                 ast_func_substring_before,              // substring-before(left, right)
 | 
|---|
 | 6701 |                 ast_func_substring_after,               // substring-after(left, right)
 | 
|---|
 | 6702 |                 ast_func_substring_2,                   // substring(left, right)
 | 
|---|
 | 6703 |                 ast_func_substring_3,                   // substring(left, right, third)
 | 
|---|
 | 6704 |                 ast_func_string_length_0,               // string-length()
 | 
|---|
 | 6705 |                 ast_func_string_length_1,               // string-length(left)
 | 
|---|
 | 6706 |                 ast_func_normalize_space_0,             // normalize-space()
 | 
|---|
 | 6707 |                 ast_func_normalize_space_1,             // normalize-space(left)
 | 
|---|
 | 6708 |                 ast_func_translate,                             // translate(left, right, third)
 | 
|---|
 | 6709 |                 ast_func_boolean,                               // boolean(left)
 | 
|---|
 | 6710 |                 ast_func_not,                                   // not(left)
 | 
|---|
 | 6711 |                 ast_func_true,                                  // true()
 | 
|---|
 | 6712 |                 ast_func_false,                                 // false()
 | 
|---|
 | 6713 |                 ast_func_lang,                                  // lang(left)
 | 
|---|
 | 6714 |                 ast_func_number_0,                              // number()
 | 
|---|
 | 6715 |                 ast_func_number_1,                              // number(left)
 | 
|---|
 | 6716 |                 ast_func_sum,                                   // sum(left)
 | 
|---|
 | 6717 |                 ast_func_floor,                                 // floor(left)
 | 
|---|
 | 6718 |                 ast_func_ceiling,                               // ceiling(left)
 | 
|---|
 | 6719 |                 ast_func_round,                                 // round(left)
 | 
|---|
 | 6720 |                 ast_step,                                               // process set left with step
 | 
|---|
 | 6721 |                 ast_step_root                                   // select root node
 | 
|---|
 | 6722 |         };
 | 
|---|
 | 6723 | 
 | 
|---|
 | 6724 |         enum axis_t
 | 
|---|
 | 6725 |         {
 | 
|---|
 | 6726 |                 axis_ancestor,
 | 
|---|
 | 6727 |                 axis_ancestor_or_self,
 | 
|---|
 | 6728 |                 axis_attribute,
 | 
|---|
 | 6729 |                 axis_child,
 | 
|---|
 | 6730 |                 axis_descendant,
 | 
|---|
 | 6731 |                 axis_descendant_or_self,
 | 
|---|
 | 6732 |                 axis_following,
 | 
|---|
 | 6733 |                 axis_following_sibling,
 | 
|---|
 | 6734 |                 axis_namespace,
 | 
|---|
 | 6735 |                 axis_parent,
 | 
|---|
 | 6736 |                 axis_preceding,
 | 
|---|
 | 6737 |                 axis_preceding_sibling,
 | 
|---|
 | 6738 |                 axis_self
 | 
|---|
 | 6739 |         };
 | 
|---|
 | 6740 |         
 | 
|---|
 | 6741 |         enum nodetest_t
 | 
|---|
 | 6742 |         {
 | 
|---|
 | 6743 |                 nodetest_none,
 | 
|---|
 | 6744 |                 nodetest_name,
 | 
|---|
 | 6745 |                 nodetest_type_node,
 | 
|---|
 | 6746 |                 nodetest_type_comment,
 | 
|---|
 | 6747 |                 nodetest_type_pi,
 | 
|---|
 | 6748 |                 nodetest_type_text,
 | 
|---|
 | 6749 |                 nodetest_pi,
 | 
|---|
 | 6750 |                 nodetest_all,
 | 
|---|
 | 6751 |                 nodetest_all_in_namespace
 | 
|---|
 | 6752 |         };
 | 
|---|
 | 6753 | 
 | 
|---|
 | 6754 |         template <axis_t N> struct axis_to_type
 | 
|---|
 | 6755 |         {
 | 
|---|
 | 6756 |                 static const axis_t axis;
 | 
|---|
 | 6757 |         };
 | 
|---|
 | 6758 | 
 | 
|---|
 | 6759 |         template <axis_t N> const axis_t axis_to_type<N>::axis = N;
 | 
|---|
 | 6760 |                 
 | 
|---|
 | 6761 |         class xpath_ast_node
 | 
|---|
 | 6762 |         {
 | 
|---|
 | 6763 |         private:
 | 
|---|
 | 6764 |                 // node type
 | 
|---|
 | 6765 |                 char _type;
 | 
|---|
 | 6766 |                 char _rettype;
 | 
|---|
 | 6767 | 
 | 
|---|
 | 6768 |                 // for ast_step / ast_predicate
 | 
|---|
 | 6769 |                 char _axis;
 | 
|---|
 | 6770 |                 char _test;
 | 
|---|
 | 6771 | 
 | 
|---|
 | 6772 |                 // tree node structure
 | 
|---|
 | 6773 |                 xpath_ast_node* _left;
 | 
|---|
 | 6774 |                 xpath_ast_node* _right;
 | 
|---|
 | 6775 |                 xpath_ast_node* _next;
 | 
|---|
 | 6776 | 
 | 
|---|
 | 6777 |                 union
 | 
|---|
 | 6778 |                 {
 | 
|---|
 | 6779 |                         // value for ast_string_constant
 | 
|---|
 | 6780 |                         const char_t* string;
 | 
|---|
 | 6781 |                         // value for ast_number_constant
 | 
|---|
 | 6782 |                         double number;
 | 
|---|
 | 6783 |                         // variable for ast_variable
 | 
|---|
 | 6784 |                         xpath_variable* variable;
 | 
|---|
 | 6785 |                         // node test for ast_step (node name/namespace/node type/pi target)
 | 
|---|
 | 6786 |                         const char_t* nodetest;
 | 
|---|
 | 6787 |                 } _data;
 | 
|---|
 | 6788 | 
 | 
|---|
 | 6789 |                 xpath_ast_node(const xpath_ast_node&);
 | 
|---|
 | 6790 |                 xpath_ast_node& operator=(const xpath_ast_node&);
 | 
|---|
 | 6791 | 
 | 
|---|
 | 6792 |                 template <class Comp> static bool compare_eq(xpath_ast_node* lhs, xpath_ast_node* rhs, const xpath_context& c, const xpath_stack& stack, const Comp& comp)
 | 
|---|
 | 6793 |                 {
 | 
|---|
 | 6794 |                         xpath_value_type lt = lhs->rettype(), rt = rhs->rettype();
 | 
|---|
 | 6795 | 
 | 
|---|
 | 6796 |                         if (lt != xpath_type_node_set && rt != xpath_type_node_set)
 | 
|---|
 | 6797 |                         {
 | 
|---|
 | 6798 |                                 if (lt == xpath_type_boolean || rt == xpath_type_boolean)
 | 
|---|
 | 6799 |                                         return comp(lhs->eval_boolean(c, stack), rhs->eval_boolean(c, stack));
 | 
|---|
 | 6800 |                                 else if (lt == xpath_type_number || rt == xpath_type_number)
 | 
|---|
 | 6801 |                                         return comp(lhs->eval_number(c, stack), rhs->eval_number(c, stack));
 | 
|---|
 | 6802 |                                 else if (lt == xpath_type_string || rt == xpath_type_string)
 | 
|---|
 | 6803 |                                 {
 | 
|---|
 | 6804 |                                         xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 6805 | 
 | 
|---|
 | 6806 |                                         xpath_string ls = lhs->eval_string(c, stack);
 | 
|---|
 | 6807 |                                         xpath_string rs = rhs->eval_string(c, stack);
 | 
|---|
 | 6808 | 
 | 
|---|
 | 6809 |                                         return comp(ls, rs);
 | 
|---|
 | 6810 |                                 }
 | 
|---|
 | 6811 |                         }
 | 
|---|
 | 6812 |                         else if (lt == xpath_type_node_set && rt == xpath_type_node_set)
 | 
|---|
 | 6813 |                         {
 | 
|---|
 | 6814 |                                 xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 6815 | 
 | 
|---|
 | 6816 |                                 xpath_node_set_raw ls = lhs->eval_node_set(c, stack);
 | 
|---|
 | 6817 |                                 xpath_node_set_raw rs = rhs->eval_node_set(c, stack);
 | 
|---|
 | 6818 | 
 | 
|---|
 | 6819 |                                 for (const xpath_node* li = ls.begin(); li != ls.end(); ++li)
 | 
|---|
 | 6820 |                                         for (const xpath_node* ri = rs.begin(); ri != rs.end(); ++ri)
 | 
|---|
 | 6821 |                                         {
 | 
|---|
 | 6822 |                                                 xpath_allocator_capture cri(stack.result);
 | 
|---|
 | 6823 | 
 | 
|---|
 | 6824 |                                                 if (comp(string_value(*li, stack.result), string_value(*ri, stack.result)))
 | 
|---|
 | 6825 |                                                         return true;
 | 
|---|
 | 6826 |                                         }
 | 
|---|
 | 6827 | 
 | 
|---|
 | 6828 |                                 return false;
 | 
|---|
 | 6829 |                         }
 | 
|---|
 | 6830 |                         else
 | 
|---|
 | 6831 |                         {
 | 
|---|
 | 6832 |                                 if (lt == xpath_type_node_set)
 | 
|---|
 | 6833 |                                 {
 | 
|---|
 | 6834 |                                         swap(lhs, rhs);
 | 
|---|
 | 6835 |                                         swap(lt, rt);
 | 
|---|
 | 6836 |                                 }
 | 
|---|
 | 6837 | 
 | 
|---|
 | 6838 |                                 if (lt == xpath_type_boolean)
 | 
|---|
 | 6839 |                                         return comp(lhs->eval_boolean(c, stack), rhs->eval_boolean(c, stack));
 | 
|---|
 | 6840 |                                 else if (lt == xpath_type_number)
 | 
|---|
 | 6841 |                                 {
 | 
|---|
 | 6842 |                                         xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 6843 | 
 | 
|---|
 | 6844 |                                         double l = lhs->eval_number(c, stack);
 | 
|---|
 | 6845 |                                         xpath_node_set_raw rs = rhs->eval_node_set(c, stack);
 | 
|---|
 | 6846 | 
 | 
|---|
 | 6847 |                                         for (const xpath_node* ri = rs.begin(); ri != rs.end(); ++ri)
 | 
|---|
 | 6848 |                                         {
 | 
|---|
 | 6849 |                                                 xpath_allocator_capture cri(stack.result);
 | 
|---|
 | 6850 | 
 | 
|---|
 | 6851 |                                                 if (comp(l, convert_string_to_number(string_value(*ri, stack.result).c_str())))
 | 
|---|
 | 6852 |                                                         return true;
 | 
|---|
 | 6853 |                                         }
 | 
|---|
 | 6854 | 
 | 
|---|
 | 6855 |                                         return false;
 | 
|---|
 | 6856 |                                 }
 | 
|---|
 | 6857 |                                 else if (lt == xpath_type_string)
 | 
|---|
 | 6858 |                                 {
 | 
|---|
 | 6859 |                                         xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 6860 | 
 | 
|---|
 | 6861 |                                         xpath_string l = lhs->eval_string(c, stack);
 | 
|---|
 | 6862 |                                         xpath_node_set_raw rs = rhs->eval_node_set(c, stack);
 | 
|---|
 | 6863 | 
 | 
|---|
 | 6864 |                                         for (const xpath_node* ri = rs.begin(); ri != rs.end(); ++ri)
 | 
|---|
 | 6865 |                                         {
 | 
|---|
 | 6866 |                                                 xpath_allocator_capture cri(stack.result);
 | 
|---|
 | 6867 | 
 | 
|---|
 | 6868 |                                                 if (comp(l, string_value(*ri, stack.result)))
 | 
|---|
 | 6869 |                                                         return true;
 | 
|---|
 | 6870 |                                         }
 | 
|---|
 | 6871 | 
 | 
|---|
 | 6872 |                                         return false;
 | 
|---|
 | 6873 |                                 }
 | 
|---|
 | 6874 |                         }
 | 
|---|
 | 6875 | 
 | 
|---|
 | 6876 |                         assert(!"Wrong types");
 | 
|---|
 | 6877 |                         return false;
 | 
|---|
 | 6878 |                 }
 | 
|---|
 | 6879 | 
 | 
|---|
 | 6880 |                 template <class Comp> static bool compare_rel(xpath_ast_node* lhs, xpath_ast_node* rhs, const xpath_context& c, const xpath_stack& stack, const Comp& comp)
 | 
|---|
 | 6881 |                 {
 | 
|---|
 | 6882 |                         xpath_value_type lt = lhs->rettype(), rt = rhs->rettype();
 | 
|---|
 | 6883 | 
 | 
|---|
 | 6884 |                         if (lt != xpath_type_node_set && rt != xpath_type_node_set)
 | 
|---|
 | 6885 |                                 return comp(lhs->eval_number(c, stack), rhs->eval_number(c, stack));
 | 
|---|
 | 6886 |                         else if (lt == xpath_type_node_set && rt == xpath_type_node_set)
 | 
|---|
 | 6887 |                         {
 | 
|---|
 | 6888 |                                 xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 6889 | 
 | 
|---|
 | 6890 |                                 xpath_node_set_raw ls = lhs->eval_node_set(c, stack);
 | 
|---|
 | 6891 |                                 xpath_node_set_raw rs = rhs->eval_node_set(c, stack);
 | 
|---|
 | 6892 | 
 | 
|---|
 | 6893 |                                 for (const xpath_node* li = ls.begin(); li != ls.end(); ++li)
 | 
|---|
 | 6894 |                                 {
 | 
|---|
 | 6895 |                                         xpath_allocator_capture cri(stack.result);
 | 
|---|
 | 6896 | 
 | 
|---|
 | 6897 |                                         double l = convert_string_to_number(string_value(*li, stack.result).c_str());
 | 
|---|
 | 6898 | 
 | 
|---|
 | 6899 |                                         for (const xpath_node* ri = rs.begin(); ri != rs.end(); ++ri)
 | 
|---|
 | 6900 |                                         {
 | 
|---|
 | 6901 |                                                 xpath_allocator_capture crii(stack.result);
 | 
|---|
 | 6902 | 
 | 
|---|
 | 6903 |                                                 if (comp(l, convert_string_to_number(string_value(*ri, stack.result).c_str())))
 | 
|---|
 | 6904 |                                                         return true;
 | 
|---|
 | 6905 |                                         }
 | 
|---|
 | 6906 |                                 }
 | 
|---|
 | 6907 | 
 | 
|---|
 | 6908 |                                 return false;
 | 
|---|
 | 6909 |                         }
 | 
|---|
 | 6910 |                         else if (lt != xpath_type_node_set && rt == xpath_type_node_set)
 | 
|---|
 | 6911 |                         {
 | 
|---|
 | 6912 |                                 xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 6913 | 
 | 
|---|
 | 6914 |                                 double l = lhs->eval_number(c, stack);
 | 
|---|
 | 6915 |                                 xpath_node_set_raw rs = rhs->eval_node_set(c, stack);
 | 
|---|
 | 6916 | 
 | 
|---|
 | 6917 |                                 for (const xpath_node* ri = rs.begin(); ri != rs.end(); ++ri)
 | 
|---|
 | 6918 |                                 {
 | 
|---|
 | 6919 |                                         xpath_allocator_capture cri(stack.result);
 | 
|---|
 | 6920 | 
 | 
|---|
 | 6921 |                                         if (comp(l, convert_string_to_number(string_value(*ri, stack.result).c_str())))
 | 
|---|
 | 6922 |                                                 return true;
 | 
|---|
 | 6923 |                                 }
 | 
|---|
 | 6924 | 
 | 
|---|
 | 6925 |                                 return false;
 | 
|---|
 | 6926 |                         }
 | 
|---|
 | 6927 |                         else if (lt == xpath_type_node_set && rt != xpath_type_node_set)
 | 
|---|
 | 6928 |                         {
 | 
|---|
 | 6929 |                                 xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 6930 | 
 | 
|---|
 | 6931 |                                 xpath_node_set_raw ls = lhs->eval_node_set(c, stack);
 | 
|---|
 | 6932 |                                 double r = rhs->eval_number(c, stack);
 | 
|---|
 | 6933 | 
 | 
|---|
 | 6934 |                                 for (const xpath_node* li = ls.begin(); li != ls.end(); ++li)
 | 
|---|
 | 6935 |                                 {
 | 
|---|
 | 6936 |                                         xpath_allocator_capture cri(stack.result);
 | 
|---|
 | 6937 | 
 | 
|---|
 | 6938 |                                         if (comp(convert_string_to_number(string_value(*li, stack.result).c_str()), r))
 | 
|---|
 | 6939 |                                                 return true;
 | 
|---|
 | 6940 |                                 }
 | 
|---|
 | 6941 | 
 | 
|---|
 | 6942 |                                 return false;
 | 
|---|
 | 6943 |                         }
 | 
|---|
 | 6944 |                         else
 | 
|---|
 | 6945 |                         {
 | 
|---|
 | 6946 |                                 assert(!"Wrong types");
 | 
|---|
 | 6947 |                                 return false;
 | 
|---|
 | 6948 |                         }
 | 
|---|
 | 6949 |                 }
 | 
|---|
 | 6950 | 
 | 
|---|
 | 6951 |                 void apply_predicate(xpath_node_set_raw& ns, size_t first, xpath_ast_node* expr, const xpath_stack& stack)
 | 
|---|
 | 6952 |                 {
 | 
|---|
 | 6953 |                         assert(ns.size() >= first);
 | 
|---|
 | 6954 | 
 | 
|---|
 | 6955 |                         size_t i = 1;
 | 
|---|
 | 6956 |                         size_t size = ns.size() - first;
 | 
|---|
 | 6957 |                                 
 | 
|---|
 | 6958 |                         xpath_node* last = ns.begin() + first;
 | 
|---|
 | 6959 |                                 
 | 
|---|
 | 6960 |                         // remove_if... or well, sort of
 | 
|---|
 | 6961 |                         for (xpath_node* it = last; it != ns.end(); ++it, ++i)
 | 
|---|
 | 6962 |                         {
 | 
|---|
 | 6963 |                                 xpath_context c(*it, i, size);
 | 
|---|
 | 6964 |                         
 | 
|---|
 | 6965 |                                 if (expr->rettype() == xpath_type_number)
 | 
|---|
 | 6966 |                                 {
 | 
|---|
 | 6967 |                                         if (expr->eval_number(c, stack) == i)
 | 
|---|
 | 6968 |                                                 *last++ = *it;
 | 
|---|
 | 6969 |                                 }
 | 
|---|
 | 6970 |                                 else if (expr->eval_boolean(c, stack))
 | 
|---|
 | 6971 |                                         *last++ = *it;
 | 
|---|
 | 6972 |                         }
 | 
|---|
 | 6973 |                         
 | 
|---|
 | 6974 |                         ns.truncate(last);
 | 
|---|
 | 6975 |                 }
 | 
|---|
 | 6976 | 
 | 
|---|
 | 6977 |                 void apply_predicates(xpath_node_set_raw& ns, size_t first, const xpath_stack& stack)
 | 
|---|
 | 6978 |                 {
 | 
|---|
 | 6979 |                         if (ns.size() == first) return;
 | 
|---|
 | 6980 |                         
 | 
|---|
 | 6981 |                         for (xpath_ast_node* pred = _right; pred; pred = pred->_next)
 | 
|---|
 | 6982 |                         {
 | 
|---|
 | 6983 |                                 apply_predicate(ns, first, pred->_left, stack);
 | 
|---|
 | 6984 |                         }
 | 
|---|
 | 6985 |                 }
 | 
|---|
 | 6986 | 
 | 
|---|
 | 6987 |                 void step_push(xpath_node_set_raw& ns, const xml_attribute& a, const xml_node& parent, xpath_allocator* alloc)
 | 
|---|
 | 6988 |                 {
 | 
|---|
 | 6989 |                         if (!a) return;
 | 
|---|
 | 6990 | 
 | 
|---|
 | 6991 |                         const char_t* name = a.name();
 | 
|---|
 | 6992 | 
 | 
|---|
 | 6993 |                         // There are no attribute nodes corresponding to attributes that declare namespaces
 | 
|---|
 | 6994 |                         // That is, "xmlns:..." or "xmlns"
 | 
|---|
 | 6995 |                         if (starts_with(name, PUGIXML_TEXT("xmlns")) && (name[5] == 0 || name[5] == ':')) return;
 | 
|---|
 | 6996 |                         
 | 
|---|
 | 6997 |                         switch (_test)
 | 
|---|
 | 6998 |                         {
 | 
|---|
 | 6999 |                         case nodetest_name:
 | 
|---|
 | 7000 |                                 if (strequal(name, _data.nodetest)) ns.push_back(xpath_node(a, parent), alloc);
 | 
|---|
 | 7001 |                                 break;
 | 
|---|
 | 7002 |                                 
 | 
|---|
 | 7003 |                         case nodetest_type_node:
 | 
|---|
 | 7004 |                         case nodetest_all:
 | 
|---|
 | 7005 |                                 ns.push_back(xpath_node(a, parent), alloc);
 | 
|---|
 | 7006 |                                 break;
 | 
|---|
 | 7007 |                                 
 | 
|---|
 | 7008 |                         case nodetest_all_in_namespace:
 | 
|---|
 | 7009 |                                 if (starts_with(name, _data.nodetest))
 | 
|---|
 | 7010 |                                         ns.push_back(xpath_node(a, parent), alloc);
 | 
|---|
 | 7011 |                                 break;
 | 
|---|
 | 7012 |                         
 | 
|---|
 | 7013 |                         default:
 | 
|---|
 | 7014 |                                 ;
 | 
|---|
 | 7015 |                         }
 | 
|---|
 | 7016 |                 }
 | 
|---|
 | 7017 |                 
 | 
|---|
 | 7018 |                 void step_push(xpath_node_set_raw& ns, const xml_node& n, xpath_allocator* alloc)
 | 
|---|
 | 7019 |                 {
 | 
|---|
 | 7020 |                         if (!n) return;
 | 
|---|
 | 7021 | 
 | 
|---|
 | 7022 |                         switch (_test)
 | 
|---|
 | 7023 |                         {
 | 
|---|
 | 7024 |                         case nodetest_name:
 | 
|---|
 | 7025 |                                 if (n.type() == node_element && strequal(n.name(), _data.nodetest)) ns.push_back(n, alloc);
 | 
|---|
 | 7026 |                                 break;
 | 
|---|
 | 7027 |                                 
 | 
|---|
 | 7028 |                         case nodetest_type_node:
 | 
|---|
 | 7029 |                                 ns.push_back(n, alloc);
 | 
|---|
 | 7030 |                                 break;
 | 
|---|
 | 7031 |                                 
 | 
|---|
 | 7032 |                         case nodetest_type_comment:
 | 
|---|
 | 7033 |                                 if (n.type() == node_comment)
 | 
|---|
 | 7034 |                                         ns.push_back(n, alloc);
 | 
|---|
 | 7035 |                                 break;
 | 
|---|
 | 7036 |                                 
 | 
|---|
 | 7037 |                         case nodetest_type_text:
 | 
|---|
 | 7038 |                                 if (n.type() == node_pcdata || n.type() == node_cdata)
 | 
|---|
 | 7039 |                                         ns.push_back(n, alloc);
 | 
|---|
 | 7040 |                                 break;
 | 
|---|
 | 7041 |                                 
 | 
|---|
 | 7042 |                         case nodetest_type_pi:
 | 
|---|
 | 7043 |                                 if (n.type() == node_pi)
 | 
|---|
 | 7044 |                                         ns.push_back(n, alloc);
 | 
|---|
 | 7045 |                                 break;
 | 
|---|
 | 7046 |                                                                         
 | 
|---|
 | 7047 |                         case nodetest_pi:
 | 
|---|
 | 7048 |                                 if (n.type() == node_pi && strequal(n.name(), _data.nodetest))
 | 
|---|
 | 7049 |                                         ns.push_back(n, alloc);
 | 
|---|
 | 7050 |                                 break;
 | 
|---|
 | 7051 |                                 
 | 
|---|
 | 7052 |                         case nodetest_all:
 | 
|---|
 | 7053 |                                 if (n.type() == node_element)
 | 
|---|
 | 7054 |                                         ns.push_back(n, alloc);
 | 
|---|
 | 7055 |                                 break;
 | 
|---|
 | 7056 |                                 
 | 
|---|
 | 7057 |                         case nodetest_all_in_namespace:
 | 
|---|
 | 7058 |                                 if (n.type() == node_element && starts_with(n.name(), _data.nodetest))
 | 
|---|
 | 7059 |                                         ns.push_back(n, alloc);
 | 
|---|
 | 7060 |                                 break;
 | 
|---|
 | 7061 | 
 | 
|---|
 | 7062 |                         default:
 | 
|---|
 | 7063 |                                 assert(!"Unknown axis");
 | 
|---|
 | 7064 |                         } 
 | 
|---|
 | 7065 |                 }
 | 
|---|
 | 7066 | 
 | 
|---|
 | 7067 |                 template <class T> void step_fill(xpath_node_set_raw& ns, const xml_node& n, xpath_allocator* alloc, T)
 | 
|---|
 | 7068 |                 {
 | 
|---|
 | 7069 |                         const axis_t axis = T::axis;
 | 
|---|
 | 7070 | 
 | 
|---|
 | 7071 |                         switch (axis)
 | 
|---|
 | 7072 |                         {
 | 
|---|
 | 7073 |                         case axis_attribute:
 | 
|---|
 | 7074 |                         {
 | 
|---|
 | 7075 |                                 for (xml_attribute a = n.first_attribute(); a; a = a.next_attribute())
 | 
|---|
 | 7076 |                                         step_push(ns, a, n, alloc);
 | 
|---|
 | 7077 |                                 
 | 
|---|
 | 7078 |                                 break;
 | 
|---|
 | 7079 |                         }
 | 
|---|
 | 7080 |                         
 | 
|---|
 | 7081 |                         case axis_child:
 | 
|---|
 | 7082 |                         {
 | 
|---|
 | 7083 |                                 for (xml_node c = n.first_child(); c; c = c.next_sibling())
 | 
|---|
 | 7084 |                                         step_push(ns, c, alloc);
 | 
|---|
 | 7085 |                                         
 | 
|---|
 | 7086 |                                 break;
 | 
|---|
 | 7087 |                         }
 | 
|---|
 | 7088 |                         
 | 
|---|
 | 7089 |                         case axis_descendant:
 | 
|---|
 | 7090 |                         case axis_descendant_or_self:
 | 
|---|
 | 7091 |                         {
 | 
|---|
 | 7092 |                                 if (axis == axis_descendant_or_self)
 | 
|---|
 | 7093 |                                         step_push(ns, n, alloc);
 | 
|---|
 | 7094 |                                         
 | 
|---|
 | 7095 |                                 xml_node cur = n.first_child();
 | 
|---|
 | 7096 |                                 
 | 
|---|
 | 7097 |                                 while (cur && cur != n)
 | 
|---|
 | 7098 |                                 {
 | 
|---|
 | 7099 |                                         step_push(ns, cur, alloc);
 | 
|---|
 | 7100 |                                         
 | 
|---|
 | 7101 |                                         if (cur.first_child())
 | 
|---|
 | 7102 |                                                 cur = cur.first_child();
 | 
|---|
 | 7103 |                                         else if (cur.next_sibling())
 | 
|---|
 | 7104 |                                                 cur = cur.next_sibling();
 | 
|---|
 | 7105 |                                         else
 | 
|---|
 | 7106 |                                         {
 | 
|---|
 | 7107 |                                                 while (!cur.next_sibling() && cur != n)
 | 
|---|
 | 7108 |                                                         cur = cur.parent();
 | 
|---|
 | 7109 |                                         
 | 
|---|
 | 7110 |                                                 if (cur != n) cur = cur.next_sibling();
 | 
|---|
 | 7111 |                                         }
 | 
|---|
 | 7112 |                                 }
 | 
|---|
 | 7113 |                                 
 | 
|---|
 | 7114 |                                 break;
 | 
|---|
 | 7115 |                         }
 | 
|---|
 | 7116 |                         
 | 
|---|
 | 7117 |                         case axis_following_sibling:
 | 
|---|
 | 7118 |                         {
 | 
|---|
 | 7119 |                                 for (xml_node c = n.next_sibling(); c; c = c.next_sibling())
 | 
|---|
 | 7120 |                                         step_push(ns, c, alloc);
 | 
|---|
 | 7121 |                                 
 | 
|---|
 | 7122 |                                 break;
 | 
|---|
 | 7123 |                         }
 | 
|---|
 | 7124 |                         
 | 
|---|
 | 7125 |                         case axis_preceding_sibling:
 | 
|---|
 | 7126 |                         {
 | 
|---|
 | 7127 |                                 for (xml_node c = n.previous_sibling(); c; c = c.previous_sibling())
 | 
|---|
 | 7128 |                                         step_push(ns, c, alloc);
 | 
|---|
 | 7129 |                                 
 | 
|---|
 | 7130 |                                 break;
 | 
|---|
 | 7131 |                         }
 | 
|---|
 | 7132 |                         
 | 
|---|
 | 7133 |                         case axis_following:
 | 
|---|
 | 7134 |                         {
 | 
|---|
 | 7135 |                                 xml_node cur = n;
 | 
|---|
 | 7136 | 
 | 
|---|
 | 7137 |                                 // exit from this node so that we don't include descendants
 | 
|---|
 | 7138 |                                 while (cur && !cur.next_sibling()) cur = cur.parent();
 | 
|---|
 | 7139 |                                 cur = cur.next_sibling();
 | 
|---|
 | 7140 | 
 | 
|---|
 | 7141 |                                 for (;;)
 | 
|---|
 | 7142 |                                 {
 | 
|---|
 | 7143 |                                         step_push(ns, cur, alloc);
 | 
|---|
 | 7144 | 
 | 
|---|
 | 7145 |                                         if (cur.first_child())
 | 
|---|
 | 7146 |                                                 cur = cur.first_child();
 | 
|---|
 | 7147 |                                         else if (cur.next_sibling())
 | 
|---|
 | 7148 |                                                 cur = cur.next_sibling();
 | 
|---|
 | 7149 |                                         else
 | 
|---|
 | 7150 |                                         {
 | 
|---|
 | 7151 |                                                 while (cur && !cur.next_sibling()) cur = cur.parent();
 | 
|---|
 | 7152 |                                                 cur = cur.next_sibling();
 | 
|---|
 | 7153 | 
 | 
|---|
 | 7154 |                                                 if (!cur) break;
 | 
|---|
 | 7155 |                                         }
 | 
|---|
 | 7156 |                                 }
 | 
|---|
 | 7157 | 
 | 
|---|
 | 7158 |                                 break;
 | 
|---|
 | 7159 |                         }
 | 
|---|
 | 7160 | 
 | 
|---|
 | 7161 |                         case axis_preceding:
 | 
|---|
 | 7162 |                         {
 | 
|---|
 | 7163 |                                 xml_node cur = n;
 | 
|---|
 | 7164 | 
 | 
|---|
 | 7165 |                                 while (cur && !cur.previous_sibling()) cur = cur.parent();
 | 
|---|
 | 7166 |                                 cur = cur.previous_sibling();
 | 
|---|
 | 7167 | 
 | 
|---|
 | 7168 |                                 for (;;)
 | 
|---|
 | 7169 |                                 {
 | 
|---|
 | 7170 |                                         if (cur.last_child())
 | 
|---|
 | 7171 |                                                 cur = cur.last_child();
 | 
|---|
 | 7172 |                                         else
 | 
|---|
 | 7173 |                                         {
 | 
|---|
 | 7174 |                                                 // leaf node, can't be ancestor
 | 
|---|
 | 7175 |                                                 step_push(ns, cur, alloc);
 | 
|---|
 | 7176 | 
 | 
|---|
 | 7177 |                                                 if (cur.previous_sibling())
 | 
|---|
 | 7178 |                                                         cur = cur.previous_sibling();
 | 
|---|
 | 7179 |                                                 else
 | 
|---|
 | 7180 |                                                 {
 | 
|---|
 | 7181 |                                                         do 
 | 
|---|
 | 7182 |                                                         {
 | 
|---|
 | 7183 |                                                                 cur = cur.parent();
 | 
|---|
 | 7184 |                                                                 if (!cur) break;
 | 
|---|
 | 7185 | 
 | 
|---|
 | 7186 |                                                                 if (!node_is_ancestor(cur, n)) step_push(ns, cur, alloc);
 | 
|---|
 | 7187 |                                                         }
 | 
|---|
 | 7188 |                                                         while (!cur.previous_sibling());
 | 
|---|
 | 7189 | 
 | 
|---|
 | 7190 |                                                         cur = cur.previous_sibling();
 | 
|---|
 | 7191 | 
 | 
|---|
 | 7192 |                                                         if (!cur) break;
 | 
|---|
 | 7193 |                                                 }
 | 
|---|
 | 7194 |                                         }
 | 
|---|
 | 7195 |                                 }
 | 
|---|
 | 7196 | 
 | 
|---|
 | 7197 |                                 break;
 | 
|---|
 | 7198 |                         }
 | 
|---|
 | 7199 |                         
 | 
|---|
 | 7200 |                         case axis_ancestor:
 | 
|---|
 | 7201 |                         case axis_ancestor_or_self:
 | 
|---|
 | 7202 |                         {
 | 
|---|
 | 7203 |                                 if (axis == axis_ancestor_or_self)
 | 
|---|
 | 7204 |                                         step_push(ns, n, alloc);
 | 
|---|
 | 7205 | 
 | 
|---|
 | 7206 |                                 xml_node cur = n.parent();
 | 
|---|
 | 7207 |                                 
 | 
|---|
 | 7208 |                                 while (cur)
 | 
|---|
 | 7209 |                                 {
 | 
|---|
 | 7210 |                                         step_push(ns, cur, alloc);
 | 
|---|
 | 7211 |                                         
 | 
|---|
 | 7212 |                                         cur = cur.parent();
 | 
|---|
 | 7213 |                                 }
 | 
|---|
 | 7214 |                                 
 | 
|---|
 | 7215 |                                 break;
 | 
|---|
 | 7216 |                         }
 | 
|---|
 | 7217 | 
 | 
|---|
 | 7218 |                         case axis_self:
 | 
|---|
 | 7219 |                         {
 | 
|---|
 | 7220 |                                 step_push(ns, n, alloc);
 | 
|---|
 | 7221 | 
 | 
|---|
 | 7222 |                                 break;
 | 
|---|
 | 7223 |                         }
 | 
|---|
 | 7224 | 
 | 
|---|
 | 7225 |                         case axis_parent:
 | 
|---|
 | 7226 |                         {
 | 
|---|
 | 7227 |                                 if (n.parent()) step_push(ns, n.parent(), alloc);
 | 
|---|
 | 7228 | 
 | 
|---|
 | 7229 |                                 break;
 | 
|---|
 | 7230 |                         }
 | 
|---|
 | 7231 |                                 
 | 
|---|
 | 7232 |                         default:
 | 
|---|
 | 7233 |                                 assert(!"Unimplemented axis");
 | 
|---|
 | 7234 |                         }
 | 
|---|
 | 7235 |                 }
 | 
|---|
 | 7236 |                 
 | 
|---|
 | 7237 |                 template <class T> void step_fill(xpath_node_set_raw& ns, const xml_attribute& a, const xml_node& p, xpath_allocator* alloc, T v)
 | 
|---|
 | 7238 |                 {
 | 
|---|
 | 7239 |                         const axis_t axis = T::axis;
 | 
|---|
 | 7240 | 
 | 
|---|
 | 7241 |                         switch (axis)
 | 
|---|
 | 7242 |                         {
 | 
|---|
 | 7243 |                         case axis_ancestor:
 | 
|---|
 | 7244 |                         case axis_ancestor_or_self:
 | 
|---|
 | 7245 |                         {
 | 
|---|
 | 7246 |                                 if (axis == axis_ancestor_or_self && _test == nodetest_type_node) // reject attributes based on principal node type test
 | 
|---|
 | 7247 |                                         step_push(ns, a, p, alloc);
 | 
|---|
 | 7248 | 
 | 
|---|
 | 7249 |                                 xml_node cur = p;
 | 
|---|
 | 7250 |                                 
 | 
|---|
 | 7251 |                                 while (cur)
 | 
|---|
 | 7252 |                                 {
 | 
|---|
 | 7253 |                                         step_push(ns, cur, alloc);
 | 
|---|
 | 7254 |                                         
 | 
|---|
 | 7255 |                                         cur = cur.parent();
 | 
|---|
 | 7256 |                                 }
 | 
|---|
 | 7257 |                                 
 | 
|---|
 | 7258 |                                 break;
 | 
|---|
 | 7259 |                         }
 | 
|---|
 | 7260 | 
 | 
|---|
 | 7261 |                         case axis_descendant_or_self:
 | 
|---|
 | 7262 |                         case axis_self:
 | 
|---|
 | 7263 |                         {
 | 
|---|
 | 7264 |                                 if (_test == nodetest_type_node) // reject attributes based on principal node type test
 | 
|---|
 | 7265 |                                         step_push(ns, a, p, alloc);
 | 
|---|
 | 7266 | 
 | 
|---|
 | 7267 |                                 break;
 | 
|---|
 | 7268 |                         }
 | 
|---|
 | 7269 | 
 | 
|---|
 | 7270 |                         case axis_following:
 | 
|---|
 | 7271 |                         {
 | 
|---|
 | 7272 |                                 xml_node cur = p;
 | 
|---|
 | 7273 |                                 
 | 
|---|
 | 7274 |                                 for (;;)
 | 
|---|
 | 7275 |                                 {
 | 
|---|
 | 7276 |                                         if (cur.first_child())
 | 
|---|
 | 7277 |                                                 cur = cur.first_child();
 | 
|---|
 | 7278 |                                         else if (cur.next_sibling())
 | 
|---|
 | 7279 |                                                 cur = cur.next_sibling();
 | 
|---|
 | 7280 |                                         else
 | 
|---|
 | 7281 |                                         {
 | 
|---|
 | 7282 |                                                 while (cur && !cur.next_sibling()) cur = cur.parent();
 | 
|---|
 | 7283 |                                                 cur = cur.next_sibling();
 | 
|---|
 | 7284 |                                                 
 | 
|---|
 | 7285 |                                                 if (!cur) break;
 | 
|---|
 | 7286 |                                         }
 | 
|---|
 | 7287 | 
 | 
|---|
 | 7288 |                                         step_push(ns, cur, alloc);
 | 
|---|
 | 7289 |                                 }
 | 
|---|
 | 7290 | 
 | 
|---|
 | 7291 |                                 break;
 | 
|---|
 | 7292 |                         }
 | 
|---|
 | 7293 | 
 | 
|---|
 | 7294 |                         case axis_parent:
 | 
|---|
 | 7295 |                         {
 | 
|---|
 | 7296 |                                 step_push(ns, p, alloc);
 | 
|---|
 | 7297 | 
 | 
|---|
 | 7298 |                                 break;
 | 
|---|
 | 7299 |                         }
 | 
|---|
 | 7300 | 
 | 
|---|
 | 7301 |                         case axis_preceding:
 | 
|---|
 | 7302 |                         {
 | 
|---|
 | 7303 |                                 // preceding:: axis does not include attribute nodes and attribute ancestors (they are the same as parent's ancestors), so we can reuse node preceding
 | 
|---|
 | 7304 |                                 step_fill(ns, p, alloc, v);
 | 
|---|
 | 7305 |                                 break;
 | 
|---|
 | 7306 |                         }
 | 
|---|
 | 7307 |                         
 | 
|---|
 | 7308 |                         default:
 | 
|---|
 | 7309 |                                 assert(!"Unimplemented axis");
 | 
|---|
 | 7310 |                         }
 | 
|---|
 | 7311 |                 }
 | 
|---|
 | 7312 |                 
 | 
|---|
 | 7313 |                 template <class T> xpath_node_set_raw step_do(const xpath_context& c, const xpath_stack& stack, T v)
 | 
|---|
 | 7314 |                 {
 | 
|---|
 | 7315 |                         const axis_t axis = T::axis;
 | 
|---|
 | 7316 |                         bool attributes = (axis == axis_ancestor || axis == axis_ancestor_or_self || axis == axis_descendant_or_self || axis == axis_following || axis == axis_parent || axis == axis_preceding || axis == axis_self);
 | 
|---|
 | 7317 | 
 | 
|---|
 | 7318 |                         xpath_node_set_raw ns;
 | 
|---|
 | 7319 |                         ns.set_type((axis == axis_ancestor || axis == axis_ancestor_or_self || axis == axis_preceding || axis == axis_preceding_sibling) ? xpath_node_set::type_sorted_reverse : xpath_node_set::type_sorted);
 | 
|---|
 | 7320 | 
 | 
|---|
 | 7321 |                         if (_left)
 | 
|---|
 | 7322 |                         {
 | 
|---|
 | 7323 |                                 xpath_node_set_raw s = _left->eval_node_set(c, stack);
 | 
|---|
 | 7324 | 
 | 
|---|
 | 7325 |                                 // self axis preserves the original order
 | 
|---|
 | 7326 |                                 if (axis == axis_self) ns.set_type(s.type());
 | 
|---|
 | 7327 | 
 | 
|---|
 | 7328 |                                 for (const xpath_node* it = s.begin(); it != s.end(); ++it)
 | 
|---|
 | 7329 |                                 {
 | 
|---|
 | 7330 |                                         size_t size = ns.size();
 | 
|---|
 | 7331 | 
 | 
|---|
 | 7332 |                                         // in general, all axes generate elements in a particular order, but there is no order guarantee if axis is applied to two nodes
 | 
|---|
 | 7333 |                                         if (axis != axis_self && size != 0) ns.set_type(xpath_node_set::type_unsorted);
 | 
|---|
 | 7334 |                                         
 | 
|---|
 | 7335 |                                         if (it->node())
 | 
|---|
 | 7336 |                                                 step_fill(ns, it->node(), stack.result, v);
 | 
|---|
 | 7337 |                                         else if (attributes)
 | 
|---|
 | 7338 |                                                 step_fill(ns, it->attribute(), it->parent(), stack.result, v);
 | 
|---|
 | 7339 |                                                 
 | 
|---|
 | 7340 |                                         apply_predicates(ns, size, stack);
 | 
|---|
 | 7341 |                                 }
 | 
|---|
 | 7342 |                         }
 | 
|---|
 | 7343 |                         else
 | 
|---|
 | 7344 |                         {
 | 
|---|
 | 7345 |                                 if (c.n.node())
 | 
|---|
 | 7346 |                                         step_fill(ns, c.n.node(), stack.result, v);
 | 
|---|
 | 7347 |                                 else if (attributes)
 | 
|---|
 | 7348 |                                         step_fill(ns, c.n.attribute(), c.n.parent(), stack.result, v);
 | 
|---|
 | 7349 |                                 
 | 
|---|
 | 7350 |                                 apply_predicates(ns, 0, stack);
 | 
|---|
 | 7351 |                         }
 | 
|---|
 | 7352 | 
 | 
|---|
 | 7353 |                         // child, attribute and self axes always generate unique set of nodes
 | 
|---|
 | 7354 |                         // for other axis, if the set stayed sorted, it stayed unique because the traversal algorithms do not visit the same node twice
 | 
|---|
 | 7355 |                         if (axis != axis_child && axis != axis_attribute && axis != axis_self && ns.type() == xpath_node_set::type_unsorted)
 | 
|---|
 | 7356 |                                 ns.remove_duplicates();
 | 
|---|
 | 7357 | 
 | 
|---|
 | 7358 |                         return ns;
 | 
|---|
 | 7359 |                 }
 | 
|---|
 | 7360 |                 
 | 
|---|
 | 7361 |         public:
 | 
|---|
 | 7362 |                 xpath_ast_node(ast_type_t type, xpath_value_type rettype, const char_t* value):
 | 
|---|
 | 7363 |                         _type((char)type), _rettype((char)rettype), _axis(0), _test(0), _left(0), _right(0), _next(0)
 | 
|---|
 | 7364 |                 {
 | 
|---|
 | 7365 |                         assert(type == ast_string_constant);
 | 
|---|
 | 7366 |                         _data.string = value;
 | 
|---|
 | 7367 |                 }
 | 
|---|
 | 7368 | 
 | 
|---|
 | 7369 |                 xpath_ast_node(ast_type_t type, xpath_value_type rettype, double value):
 | 
|---|
 | 7370 |                         _type((char)type), _rettype((char)rettype), _axis(0), _test(0), _left(0), _right(0), _next(0)
 | 
|---|
 | 7371 |                 {
 | 
|---|
 | 7372 |                         assert(type == ast_number_constant);
 | 
|---|
 | 7373 |                         _data.number = value;
 | 
|---|
 | 7374 |                 }
 | 
|---|
 | 7375 |                 
 | 
|---|
 | 7376 |                 xpath_ast_node(ast_type_t type, xpath_value_type rettype, xpath_variable* value):
 | 
|---|
 | 7377 |                         _type((char)type), _rettype((char)rettype), _axis(0), _test(0), _left(0), _right(0), _next(0)
 | 
|---|
 | 7378 |                 {
 | 
|---|
 | 7379 |                         assert(type == ast_variable);
 | 
|---|
 | 7380 |                         _data.variable = value;
 | 
|---|
 | 7381 |                 }
 | 
|---|
 | 7382 |                 
 | 
|---|
 | 7383 |                 xpath_ast_node(ast_type_t type, xpath_value_type rettype, xpath_ast_node* left = 0, xpath_ast_node* right = 0):
 | 
|---|
 | 7384 |                         _type((char)type), _rettype((char)rettype), _axis(0), _test(0), _left(left), _right(right), _next(0)
 | 
|---|
 | 7385 |                 {
 | 
|---|
 | 7386 |                 }
 | 
|---|
 | 7387 | 
 | 
|---|
 | 7388 |                 xpath_ast_node(ast_type_t type, xpath_ast_node* left, axis_t axis, nodetest_t test, const char_t* contents):
 | 
|---|
 | 7389 |                         _type((char)type), _rettype(xpath_type_node_set), _axis((char)axis), _test((char)test), _left(left), _right(0), _next(0)
 | 
|---|
 | 7390 |                 {
 | 
|---|
 | 7391 |                         _data.nodetest = contents;
 | 
|---|
 | 7392 |                 }
 | 
|---|
 | 7393 | 
 | 
|---|
 | 7394 |                 void set_next(xpath_ast_node* value)
 | 
|---|
 | 7395 |                 {
 | 
|---|
 | 7396 |                         _next = value;
 | 
|---|
 | 7397 |                 }
 | 
|---|
 | 7398 | 
 | 
|---|
 | 7399 |                 void set_right(xpath_ast_node* value)
 | 
|---|
 | 7400 |                 {
 | 
|---|
 | 7401 |                         _right = value;
 | 
|---|
 | 7402 |                 }
 | 
|---|
 | 7403 | 
 | 
|---|
 | 7404 |                 bool eval_boolean(const xpath_context& c, const xpath_stack& stack)
 | 
|---|
 | 7405 |                 {
 | 
|---|
 | 7406 |                         switch (_type)
 | 
|---|
 | 7407 |                         {
 | 
|---|
 | 7408 |                         case ast_op_or:
 | 
|---|
 | 7409 |                                 return _left->eval_boolean(c, stack) || _right->eval_boolean(c, stack);
 | 
|---|
 | 7410 |                                 
 | 
|---|
 | 7411 |                         case ast_op_and:
 | 
|---|
 | 7412 |                                 return _left->eval_boolean(c, stack) && _right->eval_boolean(c, stack);
 | 
|---|
 | 7413 |                                 
 | 
|---|
 | 7414 |                         case ast_op_equal:
 | 
|---|
 | 7415 |                                 return compare_eq(_left, _right, c, stack, equal_to());
 | 
|---|
 | 7416 | 
 | 
|---|
 | 7417 |                         case ast_op_not_equal:
 | 
|---|
 | 7418 |                                 return compare_eq(_left, _right, c, stack, not_equal_to());
 | 
|---|
 | 7419 |         
 | 
|---|
 | 7420 |                         case ast_op_less:
 | 
|---|
 | 7421 |                                 return compare_rel(_left, _right, c, stack, less());
 | 
|---|
 | 7422 |                         
 | 
|---|
 | 7423 |                         case ast_op_greater:
 | 
|---|
 | 7424 |                                 return compare_rel(_right, _left, c, stack, less());
 | 
|---|
 | 7425 | 
 | 
|---|
 | 7426 |                         case ast_op_less_or_equal:
 | 
|---|
 | 7427 |                                 return compare_rel(_left, _right, c, stack, less_equal());
 | 
|---|
 | 7428 |                         
 | 
|---|
 | 7429 |                         case ast_op_greater_or_equal:
 | 
|---|
 | 7430 |                                 return compare_rel(_right, _left, c, stack, less_equal());
 | 
|---|
 | 7431 | 
 | 
|---|
 | 7432 |                         case ast_func_starts_with:
 | 
|---|
 | 7433 |                         {
 | 
|---|
 | 7434 |                                 xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 7435 | 
 | 
|---|
 | 7436 |                                 xpath_string lr = _left->eval_string(c, stack);
 | 
|---|
 | 7437 |                                 xpath_string rr = _right->eval_string(c, stack);
 | 
|---|
 | 7438 | 
 | 
|---|
 | 7439 |                                 return starts_with(lr.c_str(), rr.c_str());
 | 
|---|
 | 7440 |                         }
 | 
|---|
 | 7441 | 
 | 
|---|
 | 7442 |                         case ast_func_contains:
 | 
|---|
 | 7443 |                         {
 | 
|---|
 | 7444 |                                 xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 7445 | 
 | 
|---|
 | 7446 |                                 xpath_string lr = _left->eval_string(c, stack);
 | 
|---|
 | 7447 |                                 xpath_string rr = _right->eval_string(c, stack);
 | 
|---|
 | 7448 | 
 | 
|---|
 | 7449 |                                 return find_substring(lr.c_str(), rr.c_str()) != 0;
 | 
|---|
 | 7450 |                         }
 | 
|---|
 | 7451 | 
 | 
|---|
 | 7452 |                         case ast_func_boolean:
 | 
|---|
 | 7453 |                                 return _left->eval_boolean(c, stack);
 | 
|---|
 | 7454 |                                 
 | 
|---|
 | 7455 |                         case ast_func_not:
 | 
|---|
 | 7456 |                                 return !_left->eval_boolean(c, stack);
 | 
|---|
 | 7457 |                                 
 | 
|---|
 | 7458 |                         case ast_func_true:
 | 
|---|
 | 7459 |                                 return true;
 | 
|---|
 | 7460 |                                 
 | 
|---|
 | 7461 |                         case ast_func_false:
 | 
|---|
 | 7462 |                                 return false;
 | 
|---|
 | 7463 | 
 | 
|---|
 | 7464 |                         case ast_func_lang:
 | 
|---|
 | 7465 |                         {
 | 
|---|
 | 7466 |                                 if (c.n.attribute()) return false;
 | 
|---|
 | 7467 |                                 
 | 
|---|
 | 7468 |                                 xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 7469 | 
 | 
|---|
 | 7470 |                                 xpath_string lang = _left->eval_string(c, stack);
 | 
|---|
 | 7471 |                                 
 | 
|---|
 | 7472 |                                 for (xml_node n = c.n.node(); n; n = n.parent())
 | 
|---|
 | 7473 |                                 {
 | 
|---|
 | 7474 |                                         xml_attribute a = n.attribute(PUGIXML_TEXT("xml:lang"));
 | 
|---|
 | 7475 |                                         
 | 
|---|
 | 7476 |                                         if (a)
 | 
|---|
 | 7477 |                                         {
 | 
|---|
 | 7478 |                                                 const char_t* value = a.value();
 | 
|---|
 | 7479 |                                                 
 | 
|---|
 | 7480 |                                                 // strnicmp / strncasecmp is not portable
 | 
|---|
 | 7481 |                                                 for (const char_t* lit = lang.c_str(); *lit; ++lit)
 | 
|---|
 | 7482 |                                                 {
 | 
|---|
 | 7483 |                                                         if (tolower_ascii(*lit) != tolower_ascii(*value)) return false;
 | 
|---|
 | 7484 |                                                         ++value;
 | 
|---|
 | 7485 |                                                 }
 | 
|---|
 | 7486 |                                                 
 | 
|---|
 | 7487 |                                                 return *value == 0 || *value == '-';
 | 
|---|
 | 7488 |                                         }
 | 
|---|
 | 7489 |                                 }
 | 
|---|
 | 7490 |                                 
 | 
|---|
 | 7491 |                                 return false;
 | 
|---|
 | 7492 |                         }
 | 
|---|
 | 7493 | 
 | 
|---|
 | 7494 |                         case ast_variable:
 | 
|---|
 | 7495 |                         {
 | 
|---|
 | 7496 |                                 assert(_rettype == _data.variable->type());
 | 
|---|
 | 7497 | 
 | 
|---|
 | 7498 |                                 if (_rettype == xpath_type_boolean)
 | 
|---|
 | 7499 |                                         return _data.variable->get_boolean();
 | 
|---|
 | 7500 | 
 | 
|---|
 | 7501 |                                 // fallthrough to type conversion
 | 
|---|
 | 7502 |                         }
 | 
|---|
 | 7503 | 
 | 
|---|
 | 7504 |                         default:
 | 
|---|
 | 7505 |                         {
 | 
|---|
 | 7506 |                                 switch (_rettype)
 | 
|---|
 | 7507 |                                 {
 | 
|---|
 | 7508 |                                 case xpath_type_number:
 | 
|---|
 | 7509 |                                         return convert_number_to_boolean(eval_number(c, stack));
 | 
|---|
 | 7510 |                                         
 | 
|---|
 | 7511 |                                 case xpath_type_string:
 | 
|---|
 | 7512 |                                 {
 | 
|---|
 | 7513 |                                         xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 7514 | 
 | 
|---|
 | 7515 |                                         return !eval_string(c, stack).empty();
 | 
|---|
 | 7516 |                                 }
 | 
|---|
 | 7517 |                                         
 | 
|---|
 | 7518 |                                 case xpath_type_node_set:                               
 | 
|---|
 | 7519 |                                 {
 | 
|---|
 | 7520 |                                         xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 7521 | 
 | 
|---|
 | 7522 |                                         return !eval_node_set(c, stack).empty();
 | 
|---|
 | 7523 |                                 }
 | 
|---|
 | 7524 | 
 | 
|---|
 | 7525 |                                 default:
 | 
|---|
 | 7526 |                                         assert(!"Wrong expression for return type boolean");
 | 
|---|
 | 7527 |                                         return false;
 | 
|---|
 | 7528 |                                 }
 | 
|---|
 | 7529 |                         }
 | 
|---|
 | 7530 |                         }
 | 
|---|
 | 7531 |                 }
 | 
|---|
 | 7532 | 
 | 
|---|
 | 7533 |                 double eval_number(const xpath_context& c, const xpath_stack& stack)
 | 
|---|
 | 7534 |                 {
 | 
|---|
 | 7535 |                         switch (_type)
 | 
|---|
 | 7536 |                         {
 | 
|---|
 | 7537 |                         case ast_op_add:
 | 
|---|
 | 7538 |                                 return _left->eval_number(c, stack) + _right->eval_number(c, stack);
 | 
|---|
 | 7539 |                                 
 | 
|---|
 | 7540 |                         case ast_op_subtract:
 | 
|---|
 | 7541 |                                 return _left->eval_number(c, stack) - _right->eval_number(c, stack);
 | 
|---|
 | 7542 | 
 | 
|---|
 | 7543 |                         case ast_op_multiply:
 | 
|---|
 | 7544 |                                 return _left->eval_number(c, stack) * _right->eval_number(c, stack);
 | 
|---|
 | 7545 | 
 | 
|---|
 | 7546 |                         case ast_op_divide:
 | 
|---|
 | 7547 |                                 return _left->eval_number(c, stack) / _right->eval_number(c, stack);
 | 
|---|
 | 7548 | 
 | 
|---|
 | 7549 |                         case ast_op_mod:
 | 
|---|
 | 7550 |                                 return fmod(_left->eval_number(c, stack), _right->eval_number(c, stack));
 | 
|---|
 | 7551 | 
 | 
|---|
 | 7552 |                         case ast_op_negate:
 | 
|---|
 | 7553 |                                 return -_left->eval_number(c, stack);
 | 
|---|
 | 7554 | 
 | 
|---|
 | 7555 |                         case ast_number_constant:
 | 
|---|
 | 7556 |                                 return _data.number;
 | 
|---|
 | 7557 | 
 | 
|---|
 | 7558 |                         case ast_func_last:
 | 
|---|
 | 7559 |                                 return (double)c.size;
 | 
|---|
 | 7560 |                         
 | 
|---|
 | 7561 |                         case ast_func_position:
 | 
|---|
 | 7562 |                                 return (double)c.position;
 | 
|---|
 | 7563 | 
 | 
|---|
 | 7564 |                         case ast_func_count:
 | 
|---|
 | 7565 |                         {
 | 
|---|
 | 7566 |                                 xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 7567 | 
 | 
|---|
 | 7568 |                                 return (double)_left->eval_node_set(c, stack).size();
 | 
|---|
 | 7569 |                         }
 | 
|---|
 | 7570 |                         
 | 
|---|
 | 7571 |                         case ast_func_string_length_0:
 | 
|---|
 | 7572 |                         {
 | 
|---|
 | 7573 |                                 xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 7574 | 
 | 
|---|
 | 7575 |                                 return (double)string_value(c.n, stack.result).length();
 | 
|---|
 | 7576 |                         }
 | 
|---|
 | 7577 |                         
 | 
|---|
 | 7578 |                         case ast_func_string_length_1:
 | 
|---|
 | 7579 |                         {
 | 
|---|
 | 7580 |                                 xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 7581 | 
 | 
|---|
 | 7582 |                                 return (double)_left->eval_string(c, stack).length();
 | 
|---|
 | 7583 |                         }
 | 
|---|
 | 7584 |                         
 | 
|---|
 | 7585 |                         case ast_func_number_0:
 | 
|---|
 | 7586 |                         {
 | 
|---|
 | 7587 |                                 xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 7588 | 
 | 
|---|
 | 7589 |                                 return convert_string_to_number(string_value(c.n, stack.result).c_str());
 | 
|---|
 | 7590 |                         }
 | 
|---|
 | 7591 |                         
 | 
|---|
 | 7592 |                         case ast_func_number_1:
 | 
|---|
 | 7593 |                                 return _left->eval_number(c, stack);
 | 
|---|
 | 7594 | 
 | 
|---|
 | 7595 |                         case ast_func_sum:
 | 
|---|
 | 7596 |                         {
 | 
|---|
 | 7597 |                                 xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 7598 | 
 | 
|---|
 | 7599 |                                 double r = 0;
 | 
|---|
 | 7600 |                                 
 | 
|---|
 | 7601 |                                 xpath_node_set_raw ns = _left->eval_node_set(c, stack);
 | 
|---|
 | 7602 |                                 
 | 
|---|
 | 7603 |                                 for (const xpath_node* it = ns.begin(); it != ns.end(); ++it)
 | 
|---|
 | 7604 |                                 {
 | 
|---|
 | 7605 |                                         xpath_allocator_capture cri(stack.result);
 | 
|---|
 | 7606 | 
 | 
|---|
 | 7607 |                                         r += convert_string_to_number(string_value(*it, stack.result).c_str());
 | 
|---|
 | 7608 |                                 }
 | 
|---|
 | 7609 |                         
 | 
|---|
 | 7610 |                                 return r;
 | 
|---|
 | 7611 |                         }
 | 
|---|
 | 7612 | 
 | 
|---|
 | 7613 |                         case ast_func_floor:
 | 
|---|
 | 7614 |                         {
 | 
|---|
 | 7615 |                                 double r = _left->eval_number(c, stack);
 | 
|---|
 | 7616 |                                 
 | 
|---|
 | 7617 |                                 return r == r ? floor(r) : r;
 | 
|---|
 | 7618 |                         }
 | 
|---|
 | 7619 | 
 | 
|---|
 | 7620 |                         case ast_func_ceiling:
 | 
|---|
 | 7621 |                         {
 | 
|---|
 | 7622 |                                 double r = _left->eval_number(c, stack);
 | 
|---|
 | 7623 |                                 
 | 
|---|
 | 7624 |                                 return r == r ? ceil(r) : r;
 | 
|---|
 | 7625 |                         }
 | 
|---|
 | 7626 | 
 | 
|---|
 | 7627 |                         case ast_func_round:
 | 
|---|
 | 7628 |                                 return round_nearest_nzero(_left->eval_number(c, stack));
 | 
|---|
 | 7629 |                         
 | 
|---|
 | 7630 |                         case ast_variable:
 | 
|---|
 | 7631 |                         {
 | 
|---|
 | 7632 |                                 assert(_rettype == _data.variable->type());
 | 
|---|
 | 7633 | 
 | 
|---|
 | 7634 |                                 if (_rettype == xpath_type_number)
 | 
|---|
 | 7635 |                                         return _data.variable->get_number();
 | 
|---|
 | 7636 | 
 | 
|---|
 | 7637 |                                 // fallthrough to type conversion
 | 
|---|
 | 7638 |                         }
 | 
|---|
 | 7639 | 
 | 
|---|
 | 7640 |                         default:
 | 
|---|
 | 7641 |                         {
 | 
|---|
 | 7642 |                                 switch (_rettype)
 | 
|---|
 | 7643 |                                 {
 | 
|---|
 | 7644 |                                 case xpath_type_boolean:
 | 
|---|
 | 7645 |                                         return eval_boolean(c, stack) ? 1 : 0;
 | 
|---|
 | 7646 |                                         
 | 
|---|
 | 7647 |                                 case xpath_type_string:
 | 
|---|
 | 7648 |                                 {
 | 
|---|
 | 7649 |                                         xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 7650 | 
 | 
|---|
 | 7651 |                                         return convert_string_to_number(eval_string(c, stack).c_str());
 | 
|---|
 | 7652 |                                 }
 | 
|---|
 | 7653 |                                         
 | 
|---|
 | 7654 |                                 case xpath_type_node_set:
 | 
|---|
 | 7655 |                                 {
 | 
|---|
 | 7656 |                                         xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 7657 | 
 | 
|---|
 | 7658 |                                         return convert_string_to_number(eval_string(c, stack).c_str());
 | 
|---|
 | 7659 |                                 }
 | 
|---|
 | 7660 |                                         
 | 
|---|
 | 7661 |                                 default:
 | 
|---|
 | 7662 |                                         assert(!"Wrong expression for return type number");
 | 
|---|
 | 7663 |                                         return 0;
 | 
|---|
 | 7664 |                                 }
 | 
|---|
 | 7665 |                                 
 | 
|---|
 | 7666 |                         }
 | 
|---|
 | 7667 |                         }
 | 
|---|
 | 7668 |                 }
 | 
|---|
 | 7669 |                 
 | 
|---|
 | 7670 |                 xpath_string eval_string_concat(const xpath_context& c, const xpath_stack& stack)
 | 
|---|
 | 7671 |                 {
 | 
|---|
 | 7672 |                         assert(_type == ast_func_concat);
 | 
|---|
 | 7673 | 
 | 
|---|
 | 7674 |                         xpath_allocator_capture ct(stack.temp);
 | 
|---|
 | 7675 | 
 | 
|---|
 | 7676 |                         // count the string number
 | 
|---|
 | 7677 |                         size_t count = 1;
 | 
|---|
 | 7678 |                         for (xpath_ast_node* nc = _right; nc; nc = nc->_next) count++;
 | 
|---|
 | 7679 | 
 | 
|---|
 | 7680 |                         // gather all strings
 | 
|---|
 | 7681 |                         xpath_string static_buffer[4];
 | 
|---|
 | 7682 |                         xpath_string* buffer = static_buffer;
 | 
|---|
 | 7683 | 
 | 
|---|
 | 7684 |                         // allocate on-heap for large concats
 | 
|---|
 | 7685 |                         if (count > sizeof(static_buffer) / sizeof(static_buffer[0]))
 | 
|---|
 | 7686 |                         {
 | 
|---|
 | 7687 |                                 buffer = static_cast<xpath_string*>(stack.temp->allocate(count * sizeof(xpath_string)));
 | 
|---|
 | 7688 |                                 assert(buffer);
 | 
|---|
 | 7689 |                         }
 | 
|---|
 | 7690 | 
 | 
|---|
 | 7691 |                         // evaluate all strings to temporary stack
 | 
|---|
 | 7692 |                         xpath_stack swapped_stack = {stack.temp, stack.result};
 | 
|---|
 | 7693 | 
 | 
|---|
 | 7694 |                         buffer[0] = _left->eval_string(c, swapped_stack);
 | 
|---|
 | 7695 | 
 | 
|---|
 | 7696 |                         size_t pos = 1;
 | 
|---|
 | 7697 |                         for (xpath_ast_node* n = _right; n; n = n->_next, ++pos) buffer[pos] = n->eval_string(c, swapped_stack);
 | 
|---|
 | 7698 |                         assert(pos == count);
 | 
|---|
 | 7699 | 
 | 
|---|
 | 7700 |                         // get total length
 | 
|---|
 | 7701 |                         size_t length = 0;
 | 
|---|
 | 7702 |                         for (size_t i = 0; i < count; ++i) length += buffer[i].length();
 | 
|---|
 | 7703 | 
 | 
|---|
 | 7704 |                         // create final string
 | 
|---|
 | 7705 |                         char_t* result = static_cast<char_t*>(stack.result->allocate((length + 1) * sizeof(char_t)));
 | 
|---|
 | 7706 |                         assert(result);
 | 
|---|
 | 7707 | 
 | 
|---|
 | 7708 |                         char_t* ri = result;
 | 
|---|
 | 7709 | 
 | 
|---|
 | 7710 |                         for (size_t j = 0; j < count; ++j)
 | 
|---|
 | 7711 |                                 for (const char_t* bi = buffer[j].c_str(); *bi; ++bi)
 | 
|---|
 | 7712 |                                         *ri++ = *bi;
 | 
|---|
 | 7713 | 
 | 
|---|
 | 7714 |                         *ri = 0;
 | 
|---|
 | 7715 | 
 | 
|---|
 | 7716 |                         return xpath_string(result, true);
 | 
|---|
 | 7717 |                 }
 | 
|---|
 | 7718 | 
 | 
|---|
 | 7719 |                 xpath_string eval_string(const xpath_context& c, const xpath_stack& stack)
 | 
|---|
 | 7720 |                 {
 | 
|---|
 | 7721 |                         switch (_type)
 | 
|---|
 | 7722 |                         {
 | 
|---|
 | 7723 |                         case ast_string_constant:
 | 
|---|
 | 7724 |                                 return xpath_string_const(_data.string);
 | 
|---|
 | 7725 |                         
 | 
|---|
 | 7726 |                         case ast_func_local_name_0:
 | 
|---|
 | 7727 |                         {
 | 
|---|
 | 7728 |                                 xpath_node na = c.n;
 | 
|---|
 | 7729 |                                 
 | 
|---|
 | 7730 |                                 return xpath_string_const(local_name(na));
 | 
|---|
 | 7731 |                         }
 | 
|---|
 | 7732 | 
 | 
|---|
 | 7733 |                         case ast_func_local_name_1:
 | 
|---|
 | 7734 |                         {
 | 
|---|
 | 7735 |                                 xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 7736 | 
 | 
|---|
 | 7737 |                                 xpath_node_set_raw ns = _left->eval_node_set(c, stack);
 | 
|---|
 | 7738 |                                 xpath_node na = ns.first();
 | 
|---|
 | 7739 |                                 
 | 
|---|
 | 7740 |                                 return xpath_string_const(local_name(na));
 | 
|---|
 | 7741 |                         }
 | 
|---|
 | 7742 | 
 | 
|---|
 | 7743 |                         case ast_func_name_0:
 | 
|---|
 | 7744 |                         {
 | 
|---|
 | 7745 |                                 xpath_node na = c.n;
 | 
|---|
 | 7746 |                                 
 | 
|---|
 | 7747 |                                 return xpath_string_const(qualified_name(na));
 | 
|---|
 | 7748 |                         }
 | 
|---|
 | 7749 | 
 | 
|---|
 | 7750 |                         case ast_func_name_1:
 | 
|---|
 | 7751 |                         {
 | 
|---|
 | 7752 |                                 xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 7753 | 
 | 
|---|
 | 7754 |                                 xpath_node_set_raw ns = _left->eval_node_set(c, stack);
 | 
|---|
 | 7755 |                                 xpath_node na = ns.first();
 | 
|---|
 | 7756 |                                 
 | 
|---|
 | 7757 |                                 return xpath_string_const(qualified_name(na));
 | 
|---|
 | 7758 |                         }
 | 
|---|
 | 7759 | 
 | 
|---|
 | 7760 |                         case ast_func_namespace_uri_0:
 | 
|---|
 | 7761 |                         {
 | 
|---|
 | 7762 |                                 xpath_node na = c.n;
 | 
|---|
 | 7763 |                                 
 | 
|---|
 | 7764 |                                 return xpath_string_const(namespace_uri(na));
 | 
|---|
 | 7765 |                         }
 | 
|---|
 | 7766 | 
 | 
|---|
 | 7767 |                         case ast_func_namespace_uri_1:
 | 
|---|
 | 7768 |                         {
 | 
|---|
 | 7769 |                                 xpath_allocator_capture cr(stack.result);
 | 
|---|
 | 7770 | 
 | 
|---|
 | 7771 |                                 xpath_node_set_raw ns = _left->eval_node_set(c, stack);
 | 
|---|
 | 7772 |                                 xpath_node na = ns.first();
 | 
|---|
 | 7773 |                                 
 | 
|---|
 | 7774 |                                 return xpath_string_const(namespace_uri(na));
 | 
|---|
 | 7775 |                         }
 | 
|---|
 | 7776 | 
 | 
|---|
 | 7777 |                         case ast_func_string_0:
 | 
|---|
 | 7778 |                                 return string_value(c.n, stack.result);
 | 
|---|
 | 7779 | 
 | 
|---|
 | 7780 |                         case ast_func_string_1:
 | 
|---|
 | 7781 |                                 return _left->eval_string(c, stack);
 | 
|---|
 | 7782 | 
 | 
|---|
 | 7783 |                         case ast_func_concat:
 | 
|---|
 | 7784 |                                 return eval_string_concat(c, stack);
 | 
|---|
 | 7785 | 
 | 
|---|
 | 7786 |                         case ast_func_substring_before:
 | 
|---|
 | 7787 |                         {
 | 
|---|
 | 7788 |                                 xpath_allocator_capture cr(stack.temp);
 | 
|---|
 | 7789 | 
 | 
|---|
 | 7790 |                                 xpath_stack swapped_stack = {stack.temp, stack.result};
 | 
|---|
 | 7791 | 
 | 
|---|
 | 7792 |                                 xpath_string s = _left->eval_string(c, swapped_stack);
 | 
|---|
 | 7793 |                                 xpath_string p = _right->eval_string(c, swapped_stack);
 | 
|---|
 | 7794 | 
 | 
|---|
 | 7795 |                                 const char_t* pos = find_substring(s.c_str(), p.c_str());
 | 
|---|
 | 7796 |                                 
 | 
|---|
 | 7797 |                                 return pos ? xpath_string(s.c_str(), pos, stack.result) : xpath_string();
 | 
|---|
 | 7798 |                         }
 | 
|---|
 | 7799 |                         
 | 
|---|
 | 7800 |                         case ast_func_substring_after:
 | 
|---|
 | 7801 |                         {
 | 
|---|
 | 7802 |                                 xpath_allocator_capture cr(stack.temp);
 | 
|---|
 | 7803 | 
 | 
|---|
 | 7804 |                                 xpath_stack swapped_stack = {stack.temp, stack.result};
 | 
|---|
 | 7805 | 
 | 
|---|
 | 7806 |                                 xpath_string s = _left->eval_string(c, swapped_stack);
 | 
|---|
 | 7807 |                                 xpath_string p = _right->eval_string(c, swapped_stack);
 | 
|---|
 | 7808 |                                 
 | 
|---|
 | 7809 |                                 const char_t* pos = find_substring(s.c_str(), p.c_str());
 | 
|---|
 | 7810 |                                 if (!pos) return xpath_string();
 | 
|---|
 | 7811 | 
 | 
|---|
 | 7812 |                                 const char_t* result = pos + p.length();
 | 
|---|
 | 7813 | 
 | 
|---|
 | 7814 |                                 return s.uses_heap() ? xpath_string(result, stack.result) : xpath_string_const(result);
 | 
|---|
 | 7815 |                         }
 | 
|---|
 | 7816 | 
 | 
|---|
 | 7817 |                         case ast_func_substring_2:
 | 
|---|
 | 7818 |                         {
 | 
|---|
 | 7819 |                                 xpath_allocator_capture cr(stack.temp);
 | 
|---|
 | 7820 | 
 | 
|---|
 | 7821 |                                 xpath_stack swapped_stack = {stack.temp, stack.result};
 | 
|---|
 | 7822 | 
 | 
|---|
 | 7823 |                                 xpath_string s = _left->eval_string(c, swapped_stack);
 | 
|---|
 | 7824 |                                 size_t s_length = s.length();
 | 
|---|
 | 7825 | 
 | 
|---|
 | 7826 |                                 double first = round_nearest(_right->eval_number(c, stack));
 | 
|---|
 | 7827 |                                 
 | 
|---|
 | 7828 |                                 if (is_nan(first)) return xpath_string(); // NaN
 | 
|---|
 | 7829 |                                 else if (first >= s_length + 1) return xpath_string();
 | 
|---|
 | 7830 |                                 
 | 
|---|
 | 7831 |                                 size_t pos = first < 1 ? 1 : (size_t)first;
 | 
|---|
 | 7832 |                                 assert(1 <= pos && pos <= s_length + 1);
 | 
|---|
 | 7833 | 
 | 
|---|
 | 7834 |                                 const char_t* rbegin = s.c_str() + (pos - 1);
 | 
|---|
 | 7835 |                                 
 | 
|---|
 | 7836 |                                 return s.uses_heap() ? xpath_string(rbegin, stack.result) : xpath_string_const(rbegin);
 | 
|---|
 | 7837 |                         }
 | 
|---|
 | 7838 |                         
 | 
|---|
 | 7839 |                         case ast_func_substring_3:
 | 
|---|
 | 7840 |                         {
 | 
|---|
 | 7841 |                                 xpath_allocator_capture cr(stack.temp);
 | 
|---|
 | 7842 | 
 | 
|---|
 | 7843 |                                 xpath_stack swapped_stack = {stack.temp, stack.result};
 | 
|---|
 | 7844 | 
 | 
|---|
 | 7845 |                                 xpath_string s = _left->eval_string(c, swapped_stack);
 | 
|---|
 | 7846 |                                 size_t s_length = s.length();
 | 
|---|
 | 7847 | 
 | 
|---|
 | 7848 |                                 double first = round_nearest(_right->eval_number(c, stack));
 | 
|---|
 | 7849 |                                 double last = first + round_nearest(_right->_next->eval_number(c, stack));
 | 
|---|
 | 7850 |                                 
 | 
|---|
 | 7851 |                                 if (is_nan(first) || is_nan(last)) return xpath_string();
 | 
|---|
 | 7852 |                                 else if (first >= s_length + 1) return xpath_string();
 | 
|---|
 | 7853 |                                 else if (first >= last) return xpath_string();
 | 
|---|
 | 7854 |                                 else if (last < 1) return xpath_string();
 | 
|---|
 | 7855 |                                 
 | 
|---|
 | 7856 |                                 size_t pos = first < 1 ? 1 : (size_t)first;
 | 
|---|
 | 7857 |                                 size_t end = last >= s_length + 1 ? s_length + 1 : (size_t)last;
 | 
|---|
 | 7858 | 
 | 
|---|
 | 7859 |                                 assert(1 <= pos && pos <= end && end <= s_length + 1);
 | 
|---|
 | 7860 |                                 const char_t* rbegin = s.c_str() + (pos - 1);
 | 
|---|
 | 7861 |                                 const char_t* rend = s.c_str() + (end - 1);
 | 
|---|
 | 7862 | 
 | 
|---|
 | 7863 |                                 return (end == s_length + 1 && !s.uses_heap()) ? xpath_string_const(rbegin) : xpath_string(rbegin, rend, stack.result);
 | 
|---|
 | 7864 |                         }
 | 
|---|
 | 7865 | 
 | 
|---|
 | 7866 |                         case ast_func_normalize_space_0:
 | 
|---|
 | 7867 |                         {
 | 
|---|
 | 7868 |                                 xpath_string s = string_value(c.n, stack.result);
 | 
|---|
 | 7869 | 
 | 
|---|
 | 7870 |                                 normalize_space(s.data(stack.result));
 | 
|---|
 | 7871 | 
 | 
|---|
 | 7872 |                                 return s;
 | 
|---|
 | 7873 |                         }
 | 
|---|
 | 7874 | 
 | 
|---|
 | 7875 |                         case ast_func_normalize_space_1:
 | 
|---|
 | 7876 |                         {
 | 
|---|
 | 7877 |                                 xpath_string s = _left->eval_string(c, stack);
 | 
|---|
 | 7878 | 
 | 
|---|
 | 7879 |                                 normalize_space(s.data(stack.result));
 | 
|---|
 | 7880 |                         
 | 
|---|
 | 7881 |                                 return s;
 | 
|---|
 | 7882 |                         }
 | 
|---|
 | 7883 | 
 | 
|---|
 | 7884 |                         case ast_func_translate:
 | 
|---|
 | 7885 |                         {
 | 
|---|
 | 7886 |                                 xpath_allocator_capture cr(stack.temp);
 | 
|---|
 | 7887 | 
 | 
|---|
 | 7888 |                                 xpath_stack swapped_stack = {stack.temp, stack.result};
 | 
|---|
 | 7889 | 
 | 
|---|
 | 7890 |                                 xpath_string s = _left->eval_string(c, stack);
 | 
|---|
 | 7891 |                                 xpath_string from = _right->eval_string(c, swapped_stack);
 | 
|---|
 | 7892 |                                 xpath_string to = _right->_next->eval_string(c, swapped_stack);
 | 
|---|
 | 7893 | 
 | 
|---|
 | 7894 |                                 translate(s.data(stack.result), from.c_str(), to.c_str());
 | 
|---|
 | 7895 | 
 | 
|---|
 | 7896 |                                 return s;
 | 
|---|
 | 7897 |                         }
 | 
|---|
 | 7898 | 
 | 
|---|
 | 7899 |                         case ast_variable:
 | 
|---|
 | 7900 |                         {
 | 
|---|
 | 7901 |                                 assert(_rettype == _data.variable->type());
 | 
|---|
 | 7902 | 
 | 
|---|
 | 7903 |                                 if (_rettype == xpath_type_string)
 | 
|---|
 | 7904 |                                         return xpath_string_const(_data.variable->get_string());
 | 
|---|
 | 7905 | 
 | 
|---|
 | 7906 |                                 // fallthrough to type conversion
 | 
|---|
 | 7907 |                         }
 | 
|---|
 | 7908 | 
 | 
|---|
 | 7909 |                         default:
 | 
|---|
 | 7910 |                         {
 | 
|---|
 | 7911 |                                 switch (_rettype)
 | 
|---|
 | 7912 |                                 {
 | 
|---|
 | 7913 |                                 case xpath_type_boolean:
 | 
|---|
 | 7914 |                                         return xpath_string_const(eval_boolean(c, stack) ? PUGIXML_TEXT("true") : PUGIXML_TEXT("false"));
 | 
|---|
 | 7915 |                                         
 | 
|---|
 | 7916 |                                 case xpath_type_number:
 | 
|---|
 | 7917 |                                         return convert_number_to_string(eval_number(c, stack), stack.result);
 | 
|---|
 | 7918 |                                         
 | 
|---|
 | 7919 |                                 case xpath_type_node_set:
 | 
|---|
 | 7920 |                                 {
 | 
|---|
 | 7921 |                                         xpath_allocator_capture cr(stack.temp);
 | 
|---|
 | 7922 | 
 | 
|---|
 | 7923 |                                         xpath_stack swapped_stack = {stack.temp, stack.result};
 | 
|---|
 | 7924 | 
 | 
|---|
 | 7925 |                                         xpath_node_set_raw ns = eval_node_set(c, swapped_stack);
 | 
|---|
 | 7926 |                                         return ns.empty() ? xpath_string() : string_value(ns.first(), stack.result);
 | 
|---|
 | 7927 |                                 }
 | 
|---|
 | 7928 |                                 
 | 
|---|
 | 7929 |                                 default:
 | 
|---|
 | 7930 |                                         assert(!"Wrong expression for return type string");
 | 
|---|
 | 7931 |                                         return xpath_string();
 | 
|---|
 | 7932 |                                 }
 | 
|---|
 | 7933 |                         }
 | 
|---|
 | 7934 |                         }
 | 
|---|
 | 7935 |                 }
 | 
|---|
 | 7936 | 
 | 
|---|
 | 7937 |                 xpath_node_set_raw eval_node_set(const xpath_context& c, const xpath_stack& stack)
 | 
|---|
 | 7938 |                 {
 | 
|---|
 | 7939 |                         switch (_type)
 | 
|---|
 | 7940 |                         {
 | 
|---|
 | 7941 |                         case ast_op_union:
 | 
|---|
 | 7942 |                         {
 | 
|---|
 | 7943 |                                 xpath_allocator_capture cr(stack.temp);
 | 
|---|
 | 7944 | 
 | 
|---|
 | 7945 |                                 xpath_stack swapped_stack = {stack.temp, stack.result};
 | 
|---|
 | 7946 | 
 | 
|---|
 | 7947 |                                 xpath_node_set_raw ls = _left->eval_node_set(c, swapped_stack);
 | 
|---|
 | 7948 |                                 xpath_node_set_raw rs = _right->eval_node_set(c, stack);
 | 
|---|
 | 7949 |                                 
 | 
|---|
 | 7950 |                                 // we can optimize merging two sorted sets, but this is a very rare operation, so don't bother
 | 
|---|
 | 7951 |                         rs.set_type(xpath_node_set::type_unsorted);
 | 
|---|
 | 7952 | 
 | 
|---|
 | 7953 |                                 rs.append(ls.begin(), ls.end(), stack.result);
 | 
|---|
 | 7954 |                                 rs.remove_duplicates();
 | 
|---|
 | 7955 |                                 
 | 
|---|
 | 7956 |                                 return rs;
 | 
|---|
 | 7957 |                         }
 | 
|---|
 | 7958 | 
 | 
|---|
 | 7959 |                         case ast_filter:
 | 
|---|
 | 7960 |                         case ast_filter_posinv:
 | 
|---|
 | 7961 |                         {
 | 
|---|
 | 7962 |                                 xpath_node_set_raw set = _left->eval_node_set(c, stack);
 | 
|---|
 | 7963 | 
 | 
|---|
 | 7964 |                                 // either expression is a number or it contains position() call; sort by document order
 | 
|---|
 | 7965 |                                 if (_type == ast_filter) set.sort_do();
 | 
|---|
 | 7966 | 
 | 
|---|
 | 7967 |                                 apply_predicate(set, 0, _right, stack);
 | 
|---|
 | 7968 |                         
 | 
|---|
 | 7969 |                                 return set;
 | 
|---|
 | 7970 |                         }
 | 
|---|
 | 7971 |                         
 | 
|---|
 | 7972 |                         case ast_func_id:
 | 
|---|
 | 7973 |                                 return xpath_node_set_raw();
 | 
|---|
 | 7974 |                         
 | 
|---|
 | 7975 |                         case ast_step:
 | 
|---|
 | 7976 |                         {
 | 
|---|
 | 7977 |                                 switch (_axis)
 | 
|---|
 | 7978 |                                 {
 | 
|---|
 | 7979 |                                 case axis_ancestor:
 | 
|---|
 | 7980 |                                         return step_do(c, stack, axis_to_type<axis_ancestor>());
 | 
|---|
 | 7981 |                                         
 | 
|---|
 | 7982 |                                 case axis_ancestor_or_self:
 | 
|---|
 | 7983 |                                         return step_do(c, stack, axis_to_type<axis_ancestor_or_self>());
 | 
|---|
 | 7984 | 
 | 
|---|
 | 7985 |                                 case axis_attribute:
 | 
|---|
 | 7986 |                                         return step_do(c, stack, axis_to_type<axis_attribute>());
 | 
|---|
 | 7987 | 
 | 
|---|
 | 7988 |                                 case axis_child:
 | 
|---|
 | 7989 |                                         return step_do(c, stack, axis_to_type<axis_child>());
 | 
|---|
 | 7990 |                                 
 | 
|---|
 | 7991 |                                 case axis_descendant:
 | 
|---|
 | 7992 |                                         return step_do(c, stack, axis_to_type<axis_descendant>());
 | 
|---|
 | 7993 | 
 | 
|---|
 | 7994 |                                 case axis_descendant_or_self:
 | 
|---|
 | 7995 |                                         return step_do(c, stack, axis_to_type<axis_descendant_or_self>());
 | 
|---|
 | 7996 | 
 | 
|---|
 | 7997 |                                 case axis_following:
 | 
|---|
 | 7998 |                                         return step_do(c, stack, axis_to_type<axis_following>());
 | 
|---|
 | 7999 |                                 
 | 
|---|
 | 8000 |                                 case axis_following_sibling:
 | 
|---|
 | 8001 |                                         return step_do(c, stack, axis_to_type<axis_following_sibling>());
 | 
|---|
 | 8002 |                                 
 | 
|---|
 | 8003 |                                 case axis_namespace:
 | 
|---|
 | 8004 |                                         // namespaced axis is not supported
 | 
|---|
 | 8005 |                                         return xpath_node_set_raw();
 | 
|---|
 | 8006 |                                 
 | 
|---|
 | 8007 |                                 case axis_parent:
 | 
|---|
 | 8008 |                                         return step_do(c, stack, axis_to_type<axis_parent>());
 | 
|---|
 | 8009 |                                 
 | 
|---|
 | 8010 |                                 case axis_preceding:
 | 
|---|
 | 8011 |                                         return step_do(c, stack, axis_to_type<axis_preceding>());
 | 
|---|
 | 8012 | 
 | 
|---|
 | 8013 |                                 case axis_preceding_sibling:
 | 
|---|
 | 8014 |                                         return step_do(c, stack, axis_to_type<axis_preceding_sibling>());
 | 
|---|
 | 8015 |                                 
 | 
|---|
 | 8016 |                                 case axis_self:
 | 
|---|
 | 8017 |                                         return step_do(c, stack, axis_to_type<axis_self>());
 | 
|---|
 | 8018 |                                 }
 | 
|---|
 | 8019 |                         }
 | 
|---|
 | 8020 | 
 | 
|---|
 | 8021 |                         case ast_step_root:
 | 
|---|
 | 8022 |                         {
 | 
|---|
 | 8023 |                                 assert(!_right); // root step can't have any predicates
 | 
|---|
 | 8024 | 
 | 
|---|
 | 8025 |                                 xpath_node_set_raw ns;
 | 
|---|
 | 8026 | 
 | 
|---|
 | 8027 |                                 ns.set_type(xpath_node_set::type_sorted);
 | 
|---|
 | 8028 | 
 | 
|---|
 | 8029 |                                 if (c.n.node()) ns.push_back(c.n.node().root(), stack.result);
 | 
|---|
 | 8030 |                                 else if (c.n.attribute()) ns.push_back(c.n.parent().root(), stack.result);
 | 
|---|
 | 8031 | 
 | 
|---|
 | 8032 |                                 return ns;
 | 
|---|
 | 8033 |                         }
 | 
|---|
 | 8034 | 
 | 
|---|
 | 8035 |                         case ast_variable:
 | 
|---|
 | 8036 |                         {
 | 
|---|
 | 8037 |                                 assert(_rettype == _data.variable->type());
 | 
|---|
 | 8038 | 
 | 
|---|
 | 8039 |                                 if (_rettype == xpath_type_node_set)
 | 
|---|
 | 8040 |                                 {
 | 
|---|
 | 8041 |                                         const xpath_node_set& s = _data.variable->get_node_set();
 | 
|---|
 | 8042 | 
 | 
|---|
 | 8043 |                                         xpath_node_set_raw ns;
 | 
|---|
 | 8044 | 
 | 
|---|
 | 8045 |                                         ns.set_type(s.type());
 | 
|---|
 | 8046 |                                         ns.append(s.begin(), s.end(), stack.result);
 | 
|---|
 | 8047 | 
 | 
|---|
 | 8048 |                                         return ns;
 | 
|---|
 | 8049 |                                 }
 | 
|---|
 | 8050 | 
 | 
|---|
 | 8051 |                                 // fallthrough to type conversion
 | 
|---|
 | 8052 |                         }
 | 
|---|
 | 8053 | 
 | 
|---|
 | 8054 |                         default:
 | 
|---|
 | 8055 |                                 assert(!"Wrong expression for return type node set");
 | 
|---|
 | 8056 |                                 return xpath_node_set_raw();
 | 
|---|
 | 8057 |                         }
 | 
|---|
 | 8058 |                 }
 | 
|---|
 | 8059 |                 
 | 
|---|
 | 8060 |                 bool is_posinv()
 | 
|---|
 | 8061 |                 {
 | 
|---|
 | 8062 |                         switch (_type)
 | 
|---|
 | 8063 |                         {
 | 
|---|
 | 8064 |                         case ast_func_position:
 | 
|---|
 | 8065 |                                 return false;
 | 
|---|
 | 8066 | 
 | 
|---|
 | 8067 |                         case ast_string_constant:
 | 
|---|
 | 8068 |                         case ast_number_constant:
 | 
|---|
 | 8069 |                         case ast_variable:
 | 
|---|
 | 8070 |                                 return true;
 | 
|---|
 | 8071 | 
 | 
|---|
 | 8072 |                         case ast_step:
 | 
|---|
 | 8073 |                         case ast_step_root:
 | 
|---|
 | 8074 |                                 return true;
 | 
|---|
 | 8075 | 
 | 
|---|
 | 8076 |                         case ast_predicate:
 | 
|---|
 | 8077 |                         case ast_filter:
 | 
|---|
 | 8078 |                         case ast_filter_posinv:
 | 
|---|
 | 8079 |                                 return true;
 | 
|---|
 | 8080 | 
 | 
|---|
 | 8081 |                         default:
 | 
|---|
 | 8082 |                                 if (_left && !_left->is_posinv()) return false;
 | 
|---|
 | 8083 |                                 
 | 
|---|
 | 8084 |                                 for (xpath_ast_node* n = _right; n; n = n->_next)
 | 
|---|
 | 8085 |                                         if (!n->is_posinv()) return false;
 | 
|---|
 | 8086 |                                         
 | 
|---|
 | 8087 |                                 return true;
 | 
|---|
 | 8088 |                         }
 | 
|---|
 | 8089 |                 }
 | 
|---|
 | 8090 | 
 | 
|---|
 | 8091 |                 xpath_value_type rettype() const
 | 
|---|
 | 8092 |                 {
 | 
|---|
 | 8093 |                         return static_cast<xpath_value_type>(_rettype);
 | 
|---|
 | 8094 |                 }
 | 
|---|
 | 8095 |         };
 | 
|---|
 | 8096 | 
 | 
|---|
 | 8097 |         struct xpath_parser
 | 
|---|
 | 8098 |         {
 | 
|---|
 | 8099 |             xpath_allocator* _alloc;
 | 
|---|
 | 8100 |             xpath_lexer _lexer;
 | 
|---|
 | 8101 | 
 | 
|---|
 | 8102 |                 const char_t* _query;
 | 
|---|
 | 8103 |                 xpath_variable_set* _variables;
 | 
|---|
 | 8104 | 
 | 
|---|
 | 8105 |                 xpath_parse_result* _result;
 | 
|---|
 | 8106 | 
 | 
|---|
 | 8107 |         #ifdef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 8108 |                 jmp_buf _error_handler;
 | 
|---|
 | 8109 |         #endif
 | 
|---|
 | 8110 | 
 | 
|---|
 | 8111 |                 void throw_error(const char* message)
 | 
|---|
 | 8112 |                 {
 | 
|---|
 | 8113 |                         _result->error = message;
 | 
|---|
 | 8114 |                         _result->offset = _lexer.current_pos() - _query;
 | 
|---|
 | 8115 | 
 | 
|---|
 | 8116 |                 #ifdef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 8117 |                         longjmp(_error_handler, 1);
 | 
|---|
 | 8118 |                 #else
 | 
|---|
 | 8119 |                         throw xpath_exception(*_result);
 | 
|---|
 | 8120 |                 #endif
 | 
|---|
 | 8121 |                 }
 | 
|---|
 | 8122 | 
 | 
|---|
 | 8123 |                 void throw_error_oom()
 | 
|---|
 | 8124 |         {
 | 
|---|
 | 8125 |         #ifdef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 8126 |             throw_error("Out of memory");
 | 
|---|
 | 8127 |         #else
 | 
|---|
 | 8128 |             throw std::bad_alloc();
 | 
|---|
 | 8129 |         #endif
 | 
|---|
 | 8130 |         }
 | 
|---|
 | 8131 | 
 | 
|---|
 | 8132 |                 void* alloc_node()
 | 
|---|
 | 8133 |                 {
 | 
|---|
 | 8134 |                         void* result = _alloc->allocate_nothrow(sizeof(xpath_ast_node));
 | 
|---|
 | 8135 | 
 | 
|---|
 | 8136 |                         if (!result) throw_error_oom();
 | 
|---|
 | 8137 | 
 | 
|---|
 | 8138 |                         return result;
 | 
|---|
 | 8139 |                 }
 | 
|---|
 | 8140 | 
 | 
|---|
 | 8141 |                 const char_t* alloc_string(const xpath_lexer_string& value)
 | 
|---|
 | 8142 |                 {
 | 
|---|
 | 8143 |                         if (value.begin)
 | 
|---|
 | 8144 |                         {
 | 
|---|
 | 8145 |                                 size_t length = static_cast<size_t>(value.end - value.begin);
 | 
|---|
 | 8146 | 
 | 
|---|
 | 8147 |                                 char_t* c = static_cast<char_t*>(_alloc->allocate_nothrow((length + 1) * sizeof(char_t)));
 | 
|---|
 | 8148 |                                 if (!c) throw_error_oom();
 | 
|---|
 | 8149 | 
 | 
|---|
 | 8150 |                                 memcpy(c, value.begin, length * sizeof(char_t));
 | 
|---|
 | 8151 |                                 c[length] = 0;
 | 
|---|
 | 8152 | 
 | 
|---|
 | 8153 |                                 return c;
 | 
|---|
 | 8154 |                         }
 | 
|---|
 | 8155 |                         else return 0;
 | 
|---|
 | 8156 |                 }
 | 
|---|
 | 8157 | 
 | 
|---|
 | 8158 |                 xpath_ast_node* parse_function_helper(ast_type_t type0, ast_type_t type1, size_t argc, xpath_ast_node* args[2])
 | 
|---|
 | 8159 |                 {
 | 
|---|
 | 8160 |                         assert(argc <= 1);
 | 
|---|
 | 8161 | 
 | 
|---|
 | 8162 |                         if (argc == 1 && args[0]->rettype() != xpath_type_node_set) throw_error("Function has to be applied to node set");
 | 
|---|
 | 8163 | 
 | 
|---|
 | 8164 |                         return new (alloc_node()) xpath_ast_node(argc == 0 ? type0 : type1, xpath_type_string, args[0]);
 | 
|---|
 | 8165 |                 }
 | 
|---|
 | 8166 | 
 | 
|---|
 | 8167 |                 xpath_ast_node* parse_function(const xpath_lexer_string& name, size_t argc, xpath_ast_node* args[2])
 | 
|---|
 | 8168 |                 {
 | 
|---|
 | 8169 |                         switch (name.begin[0])
 | 
|---|
 | 8170 |                         {
 | 
|---|
 | 8171 |                         case 'b':
 | 
|---|
 | 8172 |                                 if (name == PUGIXML_TEXT("boolean") && argc == 1)
 | 
|---|
 | 8173 |                                         return new (alloc_node()) xpath_ast_node(ast_func_boolean, xpath_type_boolean, args[0]);
 | 
|---|
 | 8174 |                                         
 | 
|---|
 | 8175 |                                 break;
 | 
|---|
 | 8176 |                         
 | 
|---|
 | 8177 |                         case 'c':
 | 
|---|
 | 8178 |                                 if (name == PUGIXML_TEXT("count") && argc == 1)
 | 
|---|
 | 8179 |                                 {
 | 
|---|
 | 8180 |                                         if (args[0]->rettype() != xpath_type_node_set) throw_error("Function has to be applied to node set");
 | 
|---|
 | 8181 |                                         return new (alloc_node()) xpath_ast_node(ast_func_count, xpath_type_number, args[0]);
 | 
|---|
 | 8182 |                                 }
 | 
|---|
 | 8183 |                                 else if (name == PUGIXML_TEXT("contains") && argc == 2)
 | 
|---|
 | 8184 |                                         return new (alloc_node()) xpath_ast_node(ast_func_contains, xpath_type_string, args[0], args[1]);
 | 
|---|
 | 8185 |                                 else if (name == PUGIXML_TEXT("concat") && argc >= 2)
 | 
|---|
 | 8186 |                                         return new (alloc_node()) xpath_ast_node(ast_func_concat, xpath_type_string, args[0], args[1]);
 | 
|---|
 | 8187 |                                 else if (name == PUGIXML_TEXT("ceiling") && argc == 1)
 | 
|---|
 | 8188 |                                         return new (alloc_node()) xpath_ast_node(ast_func_ceiling, xpath_type_number, args[0]);
 | 
|---|
 | 8189 |                                         
 | 
|---|
 | 8190 |                                 break;
 | 
|---|
 | 8191 |                         
 | 
|---|
 | 8192 |                         case 'f':
 | 
|---|
 | 8193 |                                 if (name == PUGIXML_TEXT("false") && argc == 0)
 | 
|---|
 | 8194 |                                         return new (alloc_node()) xpath_ast_node(ast_func_false, xpath_type_boolean);
 | 
|---|
 | 8195 |                                 else if (name == PUGIXML_TEXT("floor") && argc == 1)
 | 
|---|
 | 8196 |                                         return new (alloc_node()) xpath_ast_node(ast_func_floor, xpath_type_number, args[0]);
 | 
|---|
 | 8197 |                                         
 | 
|---|
 | 8198 |                                 break;
 | 
|---|
 | 8199 |                         
 | 
|---|
 | 8200 |                         case 'i':
 | 
|---|
 | 8201 |                                 if (name == PUGIXML_TEXT("id") && argc == 1)
 | 
|---|
 | 8202 |                                         return new (alloc_node()) xpath_ast_node(ast_func_id, xpath_type_node_set, args[0]);
 | 
|---|
 | 8203 |                                         
 | 
|---|
 | 8204 |                                 break;
 | 
|---|
 | 8205 |                         
 | 
|---|
 | 8206 |                         case 'l':
 | 
|---|
 | 8207 |                                 if (name == PUGIXML_TEXT("last") && argc == 0)
 | 
|---|
 | 8208 |                                         return new (alloc_node()) xpath_ast_node(ast_func_last, xpath_type_number);
 | 
|---|
 | 8209 |                                 else if (name == PUGIXML_TEXT("lang") && argc == 1)
 | 
|---|
 | 8210 |                                         return new (alloc_node()) xpath_ast_node(ast_func_lang, xpath_type_boolean, args[0]);
 | 
|---|
 | 8211 |                                 else if (name == PUGIXML_TEXT("local-name") && argc <= 1)
 | 
|---|
 | 8212 |                                         return parse_function_helper(ast_func_local_name_0, ast_func_local_name_1, argc, args);
 | 
|---|
 | 8213 |                         
 | 
|---|
 | 8214 |                                 break;
 | 
|---|
 | 8215 |                         
 | 
|---|
 | 8216 |                         case 'n':
 | 
|---|
 | 8217 |                                 if (name == PUGIXML_TEXT("name") && argc <= 1)
 | 
|---|
 | 8218 |                                         return parse_function_helper(ast_func_name_0, ast_func_name_1, argc, args);
 | 
|---|
 | 8219 |                                 else if (name == PUGIXML_TEXT("namespace-uri") && argc <= 1)
 | 
|---|
 | 8220 |                                         return parse_function_helper(ast_func_namespace_uri_0, ast_func_namespace_uri_1, argc, args);
 | 
|---|
 | 8221 |                                 else if (name == PUGIXML_TEXT("normalize-space") && argc <= 1)
 | 
|---|
 | 8222 |                                         return new (alloc_node()) xpath_ast_node(argc == 0 ? ast_func_normalize_space_0 : ast_func_normalize_space_1, xpath_type_string, args[0], args[1]);
 | 
|---|
 | 8223 |                                 else if (name == PUGIXML_TEXT("not") && argc == 1)
 | 
|---|
 | 8224 |                                         return new (alloc_node()) xpath_ast_node(ast_func_not, xpath_type_boolean, args[0]);
 | 
|---|
 | 8225 |                                 else if (name == PUGIXML_TEXT("number") && argc <= 1)
 | 
|---|
 | 8226 |                                         return new (alloc_node()) xpath_ast_node(argc == 0 ? ast_func_number_0 : ast_func_number_1, xpath_type_number, args[0]);
 | 
|---|
 | 8227 |                         
 | 
|---|
 | 8228 |                                 break;
 | 
|---|
 | 8229 |                         
 | 
|---|
 | 8230 |                         case 'p':
 | 
|---|
 | 8231 |                                 if (name == PUGIXML_TEXT("position") && argc == 0)
 | 
|---|
 | 8232 |                                         return new (alloc_node()) xpath_ast_node(ast_func_position, xpath_type_number);
 | 
|---|
 | 8233 |                                 
 | 
|---|
 | 8234 |                                 break;
 | 
|---|
 | 8235 |                         
 | 
|---|
 | 8236 |                         case 'r':
 | 
|---|
 | 8237 |                                 if (name == PUGIXML_TEXT("round") && argc == 1)
 | 
|---|
 | 8238 |                                         return new (alloc_node()) xpath_ast_node(ast_func_round, xpath_type_number, args[0]);
 | 
|---|
 | 8239 | 
 | 
|---|
 | 8240 |                                 break;
 | 
|---|
 | 8241 |                         
 | 
|---|
 | 8242 |                         case 's':
 | 
|---|
 | 8243 |                                 if (name == PUGIXML_TEXT("string") && argc <= 1)
 | 
|---|
 | 8244 |                                         return new (alloc_node()) xpath_ast_node(argc == 0 ? ast_func_string_0 : ast_func_string_1, xpath_type_string, args[0]);
 | 
|---|
 | 8245 |                                 else if (name == PUGIXML_TEXT("string-length") && argc <= 1)
 | 
|---|
 | 8246 |                                         return new (alloc_node()) xpath_ast_node(argc == 0 ? ast_func_string_length_0 : ast_func_string_length_1, xpath_type_string, args[0]);
 | 
|---|
 | 8247 |                                 else if (name == PUGIXML_TEXT("starts-with") && argc == 2)
 | 
|---|
 | 8248 |                                         return new (alloc_node()) xpath_ast_node(ast_func_starts_with, xpath_type_boolean, args[0], args[1]);
 | 
|---|
 | 8249 |                                 else if (name == PUGIXML_TEXT("substring-before") && argc == 2)
 | 
|---|
 | 8250 |                                         return new (alloc_node()) xpath_ast_node(ast_func_substring_before, xpath_type_string, args[0], args[1]);
 | 
|---|
 | 8251 |                                 else if (name == PUGIXML_TEXT("substring-after") && argc == 2)
 | 
|---|
 | 8252 |                                         return new (alloc_node()) xpath_ast_node(ast_func_substring_after, xpath_type_string, args[0], args[1]);
 | 
|---|
 | 8253 |                                 else if (name == PUGIXML_TEXT("substring") && (argc == 2 || argc == 3))
 | 
|---|
 | 8254 |                                         return new (alloc_node()) xpath_ast_node(argc == 2 ? ast_func_substring_2 : ast_func_substring_3, xpath_type_string, args[0], args[1]);
 | 
|---|
 | 8255 |                                 else if (name == PUGIXML_TEXT("sum") && argc == 1)
 | 
|---|
 | 8256 |                                 {
 | 
|---|
 | 8257 |                                         if (args[0]->rettype() != xpath_type_node_set) throw_error("Function has to be applied to node set");
 | 
|---|
 | 8258 |                                         return new (alloc_node()) xpath_ast_node(ast_func_sum, xpath_type_number, args[0]);
 | 
|---|
 | 8259 |                                 }
 | 
|---|
 | 8260 | 
 | 
|---|
 | 8261 |                                 break;
 | 
|---|
 | 8262 |                         
 | 
|---|
 | 8263 |                         case 't':
 | 
|---|
 | 8264 |                                 if (name == PUGIXML_TEXT("translate") && argc == 3)
 | 
|---|
 | 8265 |                                         return new (alloc_node()) xpath_ast_node(ast_func_translate, xpath_type_string, args[0], args[1]);
 | 
|---|
 | 8266 |                                 else if (name == PUGIXML_TEXT("true") && argc == 0)
 | 
|---|
 | 8267 |                                         return new (alloc_node()) xpath_ast_node(ast_func_true, xpath_type_boolean);
 | 
|---|
 | 8268 |                                         
 | 
|---|
 | 8269 |                                 break;
 | 
|---|
 | 8270 |                         }
 | 
|---|
 | 8271 | 
 | 
|---|
 | 8272 |                         throw_error("Unrecognized function or wrong parameter count");
 | 
|---|
 | 8273 | 
 | 
|---|
 | 8274 |                         return 0;
 | 
|---|
 | 8275 |                 }
 | 
|---|
 | 8276 | 
 | 
|---|
 | 8277 |                 axis_t parse_axis_name(const xpath_lexer_string& name, bool& specified)
 | 
|---|
 | 8278 |                 {
 | 
|---|
 | 8279 |                         specified = true;
 | 
|---|
 | 8280 | 
 | 
|---|
 | 8281 |                         switch (name.begin[0])
 | 
|---|
 | 8282 |                         {
 | 
|---|
 | 8283 |                         case 'a':
 | 
|---|
 | 8284 |                                 if (name == PUGIXML_TEXT("ancestor"))
 | 
|---|
 | 8285 |                                         return axis_ancestor;
 | 
|---|
 | 8286 |                                 else if (name == PUGIXML_TEXT("ancestor-or-self"))
 | 
|---|
 | 8287 |                                         return axis_ancestor_or_self;
 | 
|---|
 | 8288 |                                 else if (name == PUGIXML_TEXT("attribute"))
 | 
|---|
 | 8289 |                                         return axis_attribute;
 | 
|---|
 | 8290 |                                 
 | 
|---|
 | 8291 |                                 break;
 | 
|---|
 | 8292 |                         
 | 
|---|
 | 8293 |                         case 'c':
 | 
|---|
 | 8294 |                                 if (name == PUGIXML_TEXT("child"))
 | 
|---|
 | 8295 |                                         return axis_child;
 | 
|---|
 | 8296 |                                 
 | 
|---|
 | 8297 |                                 break;
 | 
|---|
 | 8298 |                         
 | 
|---|
 | 8299 |                         case 'd':
 | 
|---|
 | 8300 |                                 if (name == PUGIXML_TEXT("descendant"))
 | 
|---|
 | 8301 |                                         return axis_descendant;
 | 
|---|
 | 8302 |                                 else if (name == PUGIXML_TEXT("descendant-or-self"))
 | 
|---|
 | 8303 |                                         return axis_descendant_or_self;
 | 
|---|
 | 8304 |                                 
 | 
|---|
 | 8305 |                                 break;
 | 
|---|
 | 8306 |                         
 | 
|---|
 | 8307 |                         case 'f':
 | 
|---|
 | 8308 |                                 if (name == PUGIXML_TEXT("following"))
 | 
|---|
 | 8309 |                                         return axis_following;
 | 
|---|
 | 8310 |                                 else if (name == PUGIXML_TEXT("following-sibling"))
 | 
|---|
 | 8311 |                                         return axis_following_sibling;
 | 
|---|
 | 8312 |                                 
 | 
|---|
 | 8313 |                                 break;
 | 
|---|
 | 8314 |                         
 | 
|---|
 | 8315 |                         case 'n':
 | 
|---|
 | 8316 |                                 if (name == PUGIXML_TEXT("namespace"))
 | 
|---|
 | 8317 |                                         return axis_namespace;
 | 
|---|
 | 8318 |                                 
 | 
|---|
 | 8319 |                                 break;
 | 
|---|
 | 8320 |                         
 | 
|---|
 | 8321 |                         case 'p':
 | 
|---|
 | 8322 |                                 if (name == PUGIXML_TEXT("parent"))
 | 
|---|
 | 8323 |                                         return axis_parent;
 | 
|---|
 | 8324 |                                 else if (name == PUGIXML_TEXT("preceding"))
 | 
|---|
 | 8325 |                                         return axis_preceding;
 | 
|---|
 | 8326 |                                 else if (name == PUGIXML_TEXT("preceding-sibling"))
 | 
|---|
 | 8327 |                                         return axis_preceding_sibling;
 | 
|---|
 | 8328 |                                 
 | 
|---|
 | 8329 |                                 break;
 | 
|---|
 | 8330 |                         
 | 
|---|
 | 8331 |                         case 's':
 | 
|---|
 | 8332 |                                 if (name == PUGIXML_TEXT("self"))
 | 
|---|
 | 8333 |                                         return axis_self;
 | 
|---|
 | 8334 |                                 
 | 
|---|
 | 8335 |                                 break;
 | 
|---|
 | 8336 |                         }
 | 
|---|
 | 8337 | 
 | 
|---|
 | 8338 |                         specified = false;
 | 
|---|
 | 8339 |                         return axis_child;
 | 
|---|
 | 8340 |                 }
 | 
|---|
 | 8341 | 
 | 
|---|
 | 8342 |                 nodetest_t parse_node_test_type(const xpath_lexer_string& name)
 | 
|---|
 | 8343 |                 {
 | 
|---|
 | 8344 |                         switch (name.begin[0])
 | 
|---|
 | 8345 |                         {
 | 
|---|
 | 8346 |                         case 'c':
 | 
|---|
 | 8347 |                                 if (name == PUGIXML_TEXT("comment"))
 | 
|---|
 | 8348 |                                         return nodetest_type_comment;
 | 
|---|
 | 8349 | 
 | 
|---|
 | 8350 |                                 break;
 | 
|---|
 | 8351 | 
 | 
|---|
 | 8352 |                         case 'n':
 | 
|---|
 | 8353 |                                 if (name == PUGIXML_TEXT("node"))
 | 
|---|
 | 8354 |                                         return nodetest_type_node;
 | 
|---|
 | 8355 | 
 | 
|---|
 | 8356 |                                 break;
 | 
|---|
 | 8357 | 
 | 
|---|
 | 8358 |                         case 'p':
 | 
|---|
 | 8359 |                                 if (name == PUGIXML_TEXT("processing-instruction"))
 | 
|---|
 | 8360 |                                         return nodetest_type_pi;
 | 
|---|
 | 8361 | 
 | 
|---|
 | 8362 |                                 break;
 | 
|---|
 | 8363 | 
 | 
|---|
 | 8364 |                         case 't':
 | 
|---|
 | 8365 |                                 if (name == PUGIXML_TEXT("text"))
 | 
|---|
 | 8366 |                                         return nodetest_type_text;
 | 
|---|
 | 8367 | 
 | 
|---|
 | 8368 |                                 break;
 | 
|---|
 | 8369 |                         }
 | 
|---|
 | 8370 | 
 | 
|---|
 | 8371 |                         return nodetest_none;
 | 
|---|
 | 8372 |                 }
 | 
|---|
 | 8373 | 
 | 
|---|
 | 8374 |             // PrimaryExpr ::= VariableReference | '(' Expr ')' | Literal | Number | FunctionCall
 | 
|---|
 | 8375 |             xpath_ast_node* parse_primary_expression()
 | 
|---|
 | 8376 |             {
 | 
|---|
 | 8377 |                 switch (_lexer.current())
 | 
|---|
 | 8378 |                 {
 | 
|---|
 | 8379 |                 case lex_var_ref:
 | 
|---|
 | 8380 |                 {
 | 
|---|
 | 8381 |                                 xpath_lexer_string name = _lexer.contents();
 | 
|---|
 | 8382 | 
 | 
|---|
 | 8383 |                                 if (!_variables)
 | 
|---|
 | 8384 |                                         throw_error("Unknown variable: variable set is not provided");
 | 
|---|
 | 8385 | 
 | 
|---|
 | 8386 |                                 xpath_variable* var = get_variable(_variables, name.begin, name.end);
 | 
|---|
 | 8387 | 
 | 
|---|
 | 8388 |                                 if (!var)
 | 
|---|
 | 8389 |                                         throw_error("Unknown variable: variable set does not contain the given name");
 | 
|---|
 | 8390 | 
 | 
|---|
 | 8391 |                                 _lexer.next();
 | 
|---|
 | 8392 | 
 | 
|---|
 | 8393 |                         return new (alloc_node()) xpath_ast_node(ast_variable, var->type(), var);
 | 
|---|
 | 8394 |                         }
 | 
|---|
 | 8395 | 
 | 
|---|
 | 8396 |                         case lex_open_brace:
 | 
|---|
 | 8397 |                         {
 | 
|---|
 | 8398 |                                 _lexer.next();
 | 
|---|
 | 8399 | 
 | 
|---|
 | 8400 |                                 xpath_ast_node* n = parse_expression();
 | 
|---|
 | 8401 | 
 | 
|---|
 | 8402 |                                 if (_lexer.current() != lex_close_brace)
 | 
|---|
 | 8403 |                                         throw_error("Unmatched braces");
 | 
|---|
 | 8404 | 
 | 
|---|
 | 8405 |                                 _lexer.next();
 | 
|---|
 | 8406 | 
 | 
|---|
 | 8407 |                                 return n;
 | 
|---|
 | 8408 |                         }
 | 
|---|
 | 8409 | 
 | 
|---|
 | 8410 |                         case lex_quoted_string:
 | 
|---|
 | 8411 |                         {
 | 
|---|
 | 8412 |                                 const char_t* value = alloc_string(_lexer.contents());
 | 
|---|
 | 8413 | 
 | 
|---|
 | 8414 |                                 xpath_ast_node* n = new (alloc_node()) xpath_ast_node(ast_string_constant, xpath_type_string, value);
 | 
|---|
 | 8415 |                                 _lexer.next();
 | 
|---|
 | 8416 | 
 | 
|---|
 | 8417 |                                 return n;
 | 
|---|
 | 8418 |                         }
 | 
|---|
 | 8419 | 
 | 
|---|
 | 8420 |                         case lex_number:
 | 
|---|
 | 8421 |                         {
 | 
|---|
 | 8422 |                                 double value = 0;
 | 
|---|
 | 8423 | 
 | 
|---|
 | 8424 |                                 if (!convert_string_to_number(_lexer.contents().begin, _lexer.contents().end, &value))
 | 
|---|
 | 8425 |                                         throw_error_oom();
 | 
|---|
 | 8426 | 
 | 
|---|
 | 8427 |                                 xpath_ast_node* n = new (alloc_node()) xpath_ast_node(ast_number_constant, xpath_type_number, value);
 | 
|---|
 | 8428 |                                 _lexer.next();
 | 
|---|
 | 8429 | 
 | 
|---|
 | 8430 |                                 return n;
 | 
|---|
 | 8431 |                         }
 | 
|---|
 | 8432 | 
 | 
|---|
 | 8433 |                         case lex_string:
 | 
|---|
 | 8434 |                         {
 | 
|---|
 | 8435 |                                 xpath_ast_node* args[2] = {0};
 | 
|---|
 | 8436 |                                 size_t argc = 0;
 | 
|---|
 | 8437 |                                 
 | 
|---|
 | 8438 |                                 xpath_lexer_string function = _lexer.contents();
 | 
|---|
 | 8439 |                                 _lexer.next();
 | 
|---|
 | 8440 |                                 
 | 
|---|
 | 8441 |                                 xpath_ast_node* last_arg = 0;
 | 
|---|
 | 8442 |                                 
 | 
|---|
 | 8443 |                                 if (_lexer.current() != lex_open_brace)
 | 
|---|
 | 8444 |                                         throw_error("Unrecognized function call");
 | 
|---|
 | 8445 |                                 _lexer.next();
 | 
|---|
 | 8446 | 
 | 
|---|
 | 8447 |                                 if (_lexer.current() != lex_close_brace)
 | 
|---|
 | 8448 |                                         args[argc++] = parse_expression();
 | 
|---|
 | 8449 | 
 | 
|---|
 | 8450 |                                 while (_lexer.current() != lex_close_brace)
 | 
|---|
 | 8451 |                                 {
 | 
|---|
 | 8452 |                                         if (_lexer.current() != lex_comma)
 | 
|---|
 | 8453 |                                                 throw_error("No comma between function arguments");
 | 
|---|
 | 8454 |                                         _lexer.next();
 | 
|---|
 | 8455 |                                         
 | 
|---|
 | 8456 |                                         xpath_ast_node* n = parse_expression();
 | 
|---|
 | 8457 |                                         
 | 
|---|
 | 8458 |                                         if (argc < 2) args[argc] = n;
 | 
|---|
 | 8459 |                                         else last_arg->set_next(n);
 | 
|---|
 | 8460 | 
 | 
|---|
 | 8461 |                                         argc++;
 | 
|---|
 | 8462 |                                         last_arg = n;
 | 
|---|
 | 8463 |                                 }
 | 
|---|
 | 8464 |                                 
 | 
|---|
 | 8465 |                                 _lexer.next();
 | 
|---|
 | 8466 | 
 | 
|---|
 | 8467 |                                 return parse_function(function, argc, args);
 | 
|---|
 | 8468 |                         }
 | 
|---|
 | 8469 | 
 | 
|---|
 | 8470 |                 default:
 | 
|---|
 | 8471 |                         throw_error("Unrecognizable primary expression");
 | 
|---|
 | 8472 | 
 | 
|---|
 | 8473 |                         return 0;
 | 
|---|
 | 8474 |                 }
 | 
|---|
 | 8475 |             }
 | 
|---|
 | 8476 |             
 | 
|---|
 | 8477 |             // FilterExpr ::= PrimaryExpr | FilterExpr Predicate
 | 
|---|
 | 8478 |             // Predicate ::= '[' PredicateExpr ']'
 | 
|---|
 | 8479 |             // PredicateExpr ::= Expr
 | 
|---|
 | 8480 |             xpath_ast_node* parse_filter_expression()
 | 
|---|
 | 8481 |             {
 | 
|---|
 | 8482 |                 xpath_ast_node* n = parse_primary_expression();
 | 
|---|
 | 8483 | 
 | 
|---|
 | 8484 |                 while (_lexer.current() == lex_open_square_brace)
 | 
|---|
 | 8485 |                 {
 | 
|---|
 | 8486 |                         _lexer.next();
 | 
|---|
 | 8487 | 
 | 
|---|
 | 8488 |                                 xpath_ast_node* expr = parse_expression();
 | 
|---|
 | 8489 | 
 | 
|---|
 | 8490 |                                 if (n->rettype() != xpath_type_node_set) throw_error("Predicate has to be applied to node set");
 | 
|---|
 | 8491 | 
 | 
|---|
 | 8492 |                                 bool posinv = expr->rettype() != xpath_type_number && expr->is_posinv();
 | 
|---|
 | 8493 | 
 | 
|---|
 | 8494 |                         n = new (alloc_node()) xpath_ast_node(posinv ? ast_filter_posinv : ast_filter, xpath_type_node_set, n, expr);
 | 
|---|
 | 8495 | 
 | 
|---|
 | 8496 |                         if (_lexer.current() != lex_close_square_brace)
 | 
|---|
 | 8497 |                                 throw_error("Unmatched square brace");
 | 
|---|
 | 8498 |                 
 | 
|---|
 | 8499 |                         _lexer.next();
 | 
|---|
 | 8500 |                 }
 | 
|---|
 | 8501 |                 
 | 
|---|
 | 8502 |                 return n;
 | 
|---|
 | 8503 |             }
 | 
|---|
 | 8504 |             
 | 
|---|
 | 8505 |             // Step ::= AxisSpecifier NodeTest Predicate* | AbbreviatedStep
 | 
|---|
 | 8506 |             // AxisSpecifier ::= AxisName '::' | '@'?
 | 
|---|
 | 8507 |             // NodeTest ::= NameTest | NodeType '(' ')' | 'processing-instruction' '(' Literal ')'
 | 
|---|
 | 8508 |             // NameTest ::= '*' | NCName ':' '*' | QName
 | 
|---|
 | 8509 |             // AbbreviatedStep ::= '.' | '..'
 | 
|---|
 | 8510 |             xpath_ast_node* parse_step(xpath_ast_node* set)
 | 
|---|
 | 8511 |             {
 | 
|---|
 | 8512 |                         if (set && set->rettype() != xpath_type_node_set)
 | 
|---|
 | 8513 |                                 throw_error("Step has to be applied to node set");
 | 
|---|
 | 8514 | 
 | 
|---|
 | 8515 |                         bool axis_specified = false;
 | 
|---|
 | 8516 |                         axis_t axis = axis_child; // implied child axis
 | 
|---|
 | 8517 | 
 | 
|---|
 | 8518 |                         if (_lexer.current() == lex_axis_attribute)
 | 
|---|
 | 8519 |                         {
 | 
|---|
 | 8520 |                                 axis = axis_attribute;
 | 
|---|
 | 8521 |                                 axis_specified = true;
 | 
|---|
 | 8522 |                                 
 | 
|---|
 | 8523 |                                 _lexer.next();
 | 
|---|
 | 8524 |                         }
 | 
|---|
 | 8525 |                         else if (_lexer.current() == lex_dot)
 | 
|---|
 | 8526 |                         {
 | 
|---|
 | 8527 |                                 _lexer.next();
 | 
|---|
 | 8528 |                                 
 | 
|---|
 | 8529 |                                 return new (alloc_node()) xpath_ast_node(ast_step, set, axis_self, nodetest_type_node, 0);
 | 
|---|
 | 8530 |                         }
 | 
|---|
 | 8531 |                         else if (_lexer.current() == lex_double_dot)
 | 
|---|
 | 8532 |                         {
 | 
|---|
 | 8533 |                                 _lexer.next();
 | 
|---|
 | 8534 |                                 
 | 
|---|
 | 8535 |                                 return new (alloc_node()) xpath_ast_node(ast_step, set, axis_parent, nodetest_type_node, 0);
 | 
|---|
 | 8536 |                         }
 | 
|---|
 | 8537 |             
 | 
|---|
 | 8538 |                         nodetest_t nt_type = nodetest_none;
 | 
|---|
 | 8539 |                         xpath_lexer_string nt_name;
 | 
|---|
 | 8540 |                         
 | 
|---|
 | 8541 |                         if (_lexer.current() == lex_string)
 | 
|---|
 | 8542 |                         {
 | 
|---|
 | 8543 |                                 // node name test
 | 
|---|
 | 8544 |                                 nt_name = _lexer.contents();
 | 
|---|
 | 8545 |                                 _lexer.next();
 | 
|---|
 | 8546 | 
 | 
|---|
 | 8547 |                                 // was it an axis name?
 | 
|---|
 | 8548 |                                 if (_lexer.current() == lex_double_colon)
 | 
|---|
 | 8549 |                                 {
 | 
|---|
 | 8550 |                                         // parse axis name
 | 
|---|
 | 8551 |                                         if (axis_specified) throw_error("Two axis specifiers in one step");
 | 
|---|
 | 8552 | 
 | 
|---|
 | 8553 |                                         axis = parse_axis_name(nt_name, axis_specified);
 | 
|---|
 | 8554 | 
 | 
|---|
 | 8555 |                                         if (!axis_specified) throw_error("Unknown axis");
 | 
|---|
 | 8556 | 
 | 
|---|
 | 8557 |                                         // read actual node test
 | 
|---|
 | 8558 |                                         _lexer.next();
 | 
|---|
 | 8559 | 
 | 
|---|
 | 8560 |                                         if (_lexer.current() == lex_multiply)
 | 
|---|
 | 8561 |                                         {
 | 
|---|
 | 8562 |                                                 nt_type = nodetest_all;
 | 
|---|
 | 8563 |                                                 nt_name = xpath_lexer_string();
 | 
|---|
 | 8564 |                                                 _lexer.next();
 | 
|---|
 | 8565 |                                         }
 | 
|---|
 | 8566 |                                         else if (_lexer.current() == lex_string)
 | 
|---|
 | 8567 |                                         {
 | 
|---|
 | 8568 |                                                 nt_name = _lexer.contents();
 | 
|---|
 | 8569 |                                                 _lexer.next();
 | 
|---|
 | 8570 |                                         }
 | 
|---|
 | 8571 |                                         else throw_error("Unrecognized node test");
 | 
|---|
 | 8572 |                                 }
 | 
|---|
 | 8573 |                                 
 | 
|---|
 | 8574 |                                 if (nt_type == nodetest_none)
 | 
|---|
 | 8575 |                                 {
 | 
|---|
 | 8576 |                                         // node type test or processing-instruction
 | 
|---|
 | 8577 |                                         if (_lexer.current() == lex_open_brace)
 | 
|---|
 | 8578 |                                         {
 | 
|---|
 | 8579 |                                                 _lexer.next();
 | 
|---|
 | 8580 |                                                 
 | 
|---|
 | 8581 |                                                 if (_lexer.current() == lex_close_brace)
 | 
|---|
 | 8582 |                                                 {
 | 
|---|
 | 8583 |                                                         _lexer.next();
 | 
|---|
 | 8584 | 
 | 
|---|
 | 8585 |                                                         nt_type = parse_node_test_type(nt_name);
 | 
|---|
 | 8586 | 
 | 
|---|
 | 8587 |                                                         if (nt_type == nodetest_none) throw_error("Unrecognized node type");
 | 
|---|
 | 8588 |                                                         
 | 
|---|
 | 8589 |                                                         nt_name = xpath_lexer_string();
 | 
|---|
 | 8590 |                                                 }
 | 
|---|
 | 8591 |                                                 else if (nt_name == PUGIXML_TEXT("processing-instruction"))
 | 
|---|
 | 8592 |                                                 {
 | 
|---|
 | 8593 |                                                         if (_lexer.current() != lex_quoted_string)
 | 
|---|
 | 8594 |                                                                 throw_error("Only literals are allowed as arguments to processing-instruction()");
 | 
|---|
 | 8595 |                                                 
 | 
|---|
 | 8596 |                                                         nt_type = nodetest_pi;
 | 
|---|
 | 8597 |                                                         nt_name = _lexer.contents();
 | 
|---|
 | 8598 |                                                         _lexer.next();
 | 
|---|
 | 8599 |                                                         
 | 
|---|
 | 8600 |                                                         if (_lexer.current() != lex_close_brace)
 | 
|---|
 | 8601 |                                                                 throw_error("Unmatched brace near processing-instruction()");
 | 
|---|
 | 8602 |                                                         _lexer.next();
 | 
|---|
 | 8603 |                                                 }
 | 
|---|
 | 8604 |                                                 else
 | 
|---|
 | 8605 |                                                         throw_error("Unmatched brace near node type test");
 | 
|---|
 | 8606 | 
 | 
|---|
 | 8607 |                                         }
 | 
|---|
 | 8608 |                                         // QName or NCName:*
 | 
|---|
 | 8609 |                                         else
 | 
|---|
 | 8610 |                                         {
 | 
|---|
 | 8611 |                                                 if (nt_name.end - nt_name.begin > 2 && nt_name.end[-2] == ':' && nt_name.end[-1] == '*') // NCName:*
 | 
|---|
 | 8612 |                                                 {
 | 
|---|
 | 8613 |                                                         nt_name.end--; // erase *
 | 
|---|
 | 8614 |                                                         
 | 
|---|
 | 8615 |                                                         nt_type = nodetest_all_in_namespace;
 | 
|---|
 | 8616 |                                                 }
 | 
|---|
 | 8617 |                                                 else nt_type = nodetest_name;
 | 
|---|
 | 8618 |                                         }
 | 
|---|
 | 8619 |                                 }
 | 
|---|
 | 8620 |                         }
 | 
|---|
 | 8621 |                         else if (_lexer.current() == lex_multiply)
 | 
|---|
 | 8622 |                         {
 | 
|---|
 | 8623 |                                 nt_type = nodetest_all;
 | 
|---|
 | 8624 |                                 _lexer.next();
 | 
|---|
 | 8625 |                         }
 | 
|---|
 | 8626 |                         else throw_error("Unrecognized node test");
 | 
|---|
 | 8627 |                         
 | 
|---|
 | 8628 |                         xpath_ast_node* n = new (alloc_node()) xpath_ast_node(ast_step, set, axis, nt_type, alloc_string(nt_name));
 | 
|---|
 | 8629 |                         
 | 
|---|
 | 8630 |                         xpath_ast_node* last = 0;
 | 
|---|
 | 8631 |                         
 | 
|---|
 | 8632 |                         while (_lexer.current() == lex_open_square_brace)
 | 
|---|
 | 8633 |                         {
 | 
|---|
 | 8634 |                                 _lexer.next();
 | 
|---|
 | 8635 |                                 
 | 
|---|
 | 8636 |                                 xpath_ast_node* expr = parse_expression();
 | 
|---|
 | 8637 | 
 | 
|---|
 | 8638 |                                 xpath_ast_node* pred = new (alloc_node()) xpath_ast_node(ast_predicate, xpath_type_node_set, expr);
 | 
|---|
 | 8639 |                                 
 | 
|---|
 | 8640 |                                 if (_lexer.current() != lex_close_square_brace)
 | 
|---|
 | 8641 |                                 throw_error("Unmatched square brace");
 | 
|---|
 | 8642 |                                 _lexer.next();
 | 
|---|
 | 8643 |                                 
 | 
|---|
 | 8644 |                                 if (last) last->set_next(pred);
 | 
|---|
 | 8645 |                                 else n->set_right(pred);
 | 
|---|
 | 8646 |                                 
 | 
|---|
 | 8647 |                                 last = pred;
 | 
|---|
 | 8648 |                         }
 | 
|---|
 | 8649 |                         
 | 
|---|
 | 8650 |                         return n;
 | 
|---|
 | 8651 |             }
 | 
|---|
 | 8652 |             
 | 
|---|
 | 8653 |             // RelativeLocationPath ::= Step | RelativeLocationPath '/' Step | RelativeLocationPath '//' Step
 | 
|---|
 | 8654 |             xpath_ast_node* parse_relative_location_path(xpath_ast_node* set)
 | 
|---|
 | 8655 |             {
 | 
|---|
 | 8656 |                         xpath_ast_node* n = parse_step(set);
 | 
|---|
 | 8657 |                         
 | 
|---|
 | 8658 |                         while (_lexer.current() == lex_slash || _lexer.current() == lex_double_slash)
 | 
|---|
 | 8659 |                         {
 | 
|---|
 | 8660 |                                 lexeme_t l = _lexer.current();
 | 
|---|
 | 8661 |                                 _lexer.next();
 | 
|---|
 | 8662 | 
 | 
|---|
 | 8663 |                                 if (l == lex_double_slash)
 | 
|---|
 | 8664 |                                         n = new (alloc_node()) xpath_ast_node(ast_step, n, axis_descendant_or_self, nodetest_type_node, 0);
 | 
|---|
 | 8665 |                                 
 | 
|---|
 | 8666 |                                 n = parse_step(n);
 | 
|---|
 | 8667 |                         }
 | 
|---|
 | 8668 |                         
 | 
|---|
 | 8669 |                         return n;
 | 
|---|
 | 8670 |             }
 | 
|---|
 | 8671 |             
 | 
|---|
 | 8672 |             // LocationPath ::= RelativeLocationPath | AbsoluteLocationPath
 | 
|---|
 | 8673 |             // AbsoluteLocationPath ::= '/' RelativeLocationPath? | '//' RelativeLocationPath
 | 
|---|
 | 8674 |             xpath_ast_node* parse_location_path()
 | 
|---|
 | 8675 |             {
 | 
|---|
 | 8676 |                         if (_lexer.current() == lex_slash)
 | 
|---|
 | 8677 |                         {
 | 
|---|
 | 8678 |                                 _lexer.next();
 | 
|---|
 | 8679 |                                 
 | 
|---|
 | 8680 |                                 xpath_ast_node* n = new (alloc_node()) xpath_ast_node(ast_step_root, xpath_type_node_set);
 | 
|---|
 | 8681 | 
 | 
|---|
 | 8682 |                                 // relative location path can start from axis_attribute, dot, double_dot, multiply and string lexemes; any other lexeme means standalone root path
 | 
|---|
 | 8683 |                                 lexeme_t l = _lexer.current();
 | 
|---|
 | 8684 | 
 | 
|---|
 | 8685 |                                 if (l == lex_string || l == lex_axis_attribute || l == lex_dot || l == lex_double_dot || l == lex_multiply)
 | 
|---|
 | 8686 |                                         return parse_relative_location_path(n);
 | 
|---|
 | 8687 |                                 else
 | 
|---|
 | 8688 |                                         return n;
 | 
|---|
 | 8689 |                         }
 | 
|---|
 | 8690 |                         else if (_lexer.current() == lex_double_slash)
 | 
|---|
 | 8691 |                         {
 | 
|---|
 | 8692 |                                 _lexer.next();
 | 
|---|
 | 8693 |                                 
 | 
|---|
 | 8694 |                                 xpath_ast_node* n = new (alloc_node()) xpath_ast_node(ast_step_root, xpath_type_node_set);
 | 
|---|
 | 8695 |                                 n = new (alloc_node()) xpath_ast_node(ast_step, n, axis_descendant_or_self, nodetest_type_node, 0);
 | 
|---|
 | 8696 |                                 
 | 
|---|
 | 8697 |                                 return parse_relative_location_path(n);
 | 
|---|
 | 8698 |                         }
 | 
|---|
 | 8699 | 
 | 
|---|
 | 8700 |                         // else clause moved outside of if because of bogus warning 'control may reach end of non-void function being inlined' in gcc 4.0.1
 | 
|---|
 | 8701 |                         return parse_relative_location_path(0);
 | 
|---|
 | 8702 |             }
 | 
|---|
 | 8703 |             
 | 
|---|
 | 8704 |             // PathExpr ::= LocationPath
 | 
|---|
 | 8705 |             //                          | FilterExpr
 | 
|---|
 | 8706 |             //                          | FilterExpr '/' RelativeLocationPath
 | 
|---|
 | 8707 |             //                          | FilterExpr '//' RelativeLocationPath
 | 
|---|
 | 8708 |             xpath_ast_node* parse_path_expression()
 | 
|---|
 | 8709 |             {
 | 
|---|
 | 8710 |                         // Clarification.
 | 
|---|
 | 8711 |                         // PathExpr begins with either LocationPath or FilterExpr.
 | 
|---|
 | 8712 |                         // FilterExpr begins with PrimaryExpr
 | 
|---|
 | 8713 |                         // PrimaryExpr begins with '$' in case of it being a variable reference,
 | 
|---|
 | 8714 |                         // '(' in case of it being an expression, string literal, number constant or
 | 
|---|
 | 8715 |                         // function call.
 | 
|---|
 | 8716 | 
 | 
|---|
 | 8717 |                         if (_lexer.current() == lex_var_ref || _lexer.current() == lex_open_brace || 
 | 
|---|
 | 8718 |                                 _lexer.current() == lex_quoted_string || _lexer.current() == lex_number ||
 | 
|---|
 | 8719 |                                 _lexer.current() == lex_string)
 | 
|---|
 | 8720 |                 {
 | 
|---|
 | 8721 |                         if (_lexer.current() == lex_string)
 | 
|---|
 | 8722 |                         {
 | 
|---|
 | 8723 |                                 // This is either a function call, or not - if not, we shall proceed with location path
 | 
|---|
 | 8724 |                                 const char_t* state = _lexer.state();
 | 
|---|
 | 8725 |                                 
 | 
|---|
 | 8726 |                                         while (IS_CHARTYPE(*state, ct_space)) ++state;
 | 
|---|
 | 8727 |                                 
 | 
|---|
 | 8728 |                                 if (*state != '(') return parse_location_path();
 | 
|---|
 | 8729 | 
 | 
|---|
 | 8730 |                                         // This looks like a function call; however this still can be a node-test. Check it.
 | 
|---|
 | 8731 |                                         if (parse_node_test_type(_lexer.contents()) != nodetest_none) return parse_location_path();
 | 
|---|
 | 8732 |                         }
 | 
|---|
 | 8733 |                         
 | 
|---|
 | 8734 |                         xpath_ast_node* n = parse_filter_expression();
 | 
|---|
 | 8735 | 
 | 
|---|
 | 8736 |                         if (_lexer.current() == lex_slash || _lexer.current() == lex_double_slash)
 | 
|---|
 | 8737 |                         {
 | 
|---|
 | 8738 |                                         lexeme_t l = _lexer.current();
 | 
|---|
 | 8739 |                                 _lexer.next();
 | 
|---|
 | 8740 |                                 
 | 
|---|
 | 8741 |                                         if (l == lex_double_slash)
 | 
|---|
 | 8742 |                                         {
 | 
|---|
 | 8743 |                                                 if (n->rettype() != xpath_type_node_set) throw_error("Step has to be applied to node set");
 | 
|---|
 | 8744 | 
 | 
|---|
 | 8745 |                                                 n = new (alloc_node()) xpath_ast_node(ast_step, n, axis_descendant_or_self, nodetest_type_node, 0);
 | 
|---|
 | 8746 |                                         }
 | 
|---|
 | 8747 |         
 | 
|---|
 | 8748 |                                 // select from location path
 | 
|---|
 | 8749 |                                 return parse_relative_location_path(n);
 | 
|---|
 | 8750 |                         }
 | 
|---|
 | 8751 | 
 | 
|---|
 | 8752 |                         return n;
 | 
|---|
 | 8753 |                 }
 | 
|---|
 | 8754 |                 else return parse_location_path();
 | 
|---|
 | 8755 |             }
 | 
|---|
 | 8756 | 
 | 
|---|
 | 8757 |             // UnionExpr ::= PathExpr | UnionExpr '|' PathExpr
 | 
|---|
 | 8758 |             xpath_ast_node* parse_union_expression()
 | 
|---|
 | 8759 |             {
 | 
|---|
 | 8760 |                 xpath_ast_node* n = parse_path_expression();
 | 
|---|
 | 8761 | 
 | 
|---|
 | 8762 |                 while (_lexer.current() == lex_union)
 | 
|---|
 | 8763 |                 {
 | 
|---|
 | 8764 |                         _lexer.next();
 | 
|---|
 | 8765 | 
 | 
|---|
 | 8766 |                                 xpath_ast_node* expr = parse_union_expression();
 | 
|---|
 | 8767 | 
 | 
|---|
 | 8768 |                                 if (n->rettype() != xpath_type_node_set || expr->rettype() != xpath_type_node_set)
 | 
|---|
 | 8769 |                                         throw_error("Union operator has to be applied to node sets");
 | 
|---|
 | 8770 | 
 | 
|---|
 | 8771 |                         n = new (alloc_node()) xpath_ast_node(ast_op_union, xpath_type_node_set, n, expr);
 | 
|---|
 | 8772 |                 }
 | 
|---|
 | 8773 | 
 | 
|---|
 | 8774 |                 return n;
 | 
|---|
 | 8775 |             }
 | 
|---|
 | 8776 | 
 | 
|---|
 | 8777 |             // UnaryExpr ::= UnionExpr | '-' UnaryExpr
 | 
|---|
 | 8778 |             xpath_ast_node* parse_unary_expression()
 | 
|---|
 | 8779 |             {
 | 
|---|
 | 8780 |                 if (_lexer.current() == lex_minus)
 | 
|---|
 | 8781 |                 {
 | 
|---|
 | 8782 |                         _lexer.next();
 | 
|---|
 | 8783 | 
 | 
|---|
 | 8784 |                                 xpath_ast_node* expr = parse_unary_expression();
 | 
|---|
 | 8785 | 
 | 
|---|
 | 8786 |                         return new (alloc_node()) xpath_ast_node(ast_op_negate, xpath_type_number, expr);
 | 
|---|
 | 8787 |                 }
 | 
|---|
 | 8788 |                 else return parse_union_expression();
 | 
|---|
 | 8789 |             }
 | 
|---|
 | 8790 |             
 | 
|---|
 | 8791 |             // MultiplicativeExpr ::= UnaryExpr
 | 
|---|
 | 8792 |             //                                            | MultiplicativeExpr '*' UnaryExpr
 | 
|---|
 | 8793 |             //                                            | MultiplicativeExpr 'div' UnaryExpr
 | 
|---|
 | 8794 |             //                                            | MultiplicativeExpr 'mod' UnaryExpr
 | 
|---|
 | 8795 |             xpath_ast_node* parse_multiplicative_expression()
 | 
|---|
 | 8796 |             {
 | 
|---|
 | 8797 |                 xpath_ast_node* n = parse_unary_expression();
 | 
|---|
 | 8798 | 
 | 
|---|
 | 8799 |                 while (_lexer.current() == lex_multiply || (_lexer.current() == lex_string &&
 | 
|---|
 | 8800 |                            (_lexer.contents() == PUGIXML_TEXT("mod") || _lexer.contents() == PUGIXML_TEXT("div"))))
 | 
|---|
 | 8801 |                 {
 | 
|---|
 | 8802 |                         ast_type_t op = _lexer.current() == lex_multiply ? ast_op_multiply :
 | 
|---|
 | 8803 |                                 _lexer.contents().begin[0] == 'd' ? ast_op_divide : ast_op_mod;
 | 
|---|
 | 8804 |                         _lexer.next();
 | 
|---|
 | 8805 | 
 | 
|---|
 | 8806 |                                 xpath_ast_node* expr = parse_unary_expression();
 | 
|---|
 | 8807 | 
 | 
|---|
 | 8808 |                         n = new (alloc_node()) xpath_ast_node(op, xpath_type_number, n, expr);
 | 
|---|
 | 8809 |                 }
 | 
|---|
 | 8810 | 
 | 
|---|
 | 8811 |                 return n;
 | 
|---|
 | 8812 |             }
 | 
|---|
 | 8813 | 
 | 
|---|
 | 8814 |             // AdditiveExpr ::= MultiplicativeExpr
 | 
|---|
 | 8815 |             //                                  | AdditiveExpr '+' MultiplicativeExpr
 | 
|---|
 | 8816 |             //                                  | AdditiveExpr '-' MultiplicativeExpr
 | 
|---|
 | 8817 |             xpath_ast_node* parse_additive_expression()
 | 
|---|
 | 8818 |             {
 | 
|---|
 | 8819 |                 xpath_ast_node* n = parse_multiplicative_expression();
 | 
|---|
 | 8820 | 
 | 
|---|
 | 8821 |                 while (_lexer.current() == lex_plus || _lexer.current() == lex_minus)
 | 
|---|
 | 8822 |                 {
 | 
|---|
 | 8823 |                         lexeme_t l = _lexer.current();
 | 
|---|
 | 8824 | 
 | 
|---|
 | 8825 |                         _lexer.next();
 | 
|---|
 | 8826 | 
 | 
|---|
 | 8827 |                                 xpath_ast_node* expr = parse_multiplicative_expression();
 | 
|---|
 | 8828 | 
 | 
|---|
 | 8829 |                         n = new (alloc_node()) xpath_ast_node(l == lex_plus ? ast_op_add : ast_op_subtract, xpath_type_number, n, expr);
 | 
|---|
 | 8830 |                 }
 | 
|---|
 | 8831 | 
 | 
|---|
 | 8832 |                 return n;
 | 
|---|
 | 8833 |             }
 | 
|---|
 | 8834 | 
 | 
|---|
 | 8835 |             // RelationalExpr ::= AdditiveExpr
 | 
|---|
 | 8836 |             //                                    | RelationalExpr '<' AdditiveExpr
 | 
|---|
 | 8837 |             //                                    | RelationalExpr '>' AdditiveExpr
 | 
|---|
 | 8838 |             //                                    | RelationalExpr '<=' AdditiveExpr
 | 
|---|
 | 8839 |             //                                    | RelationalExpr '>=' AdditiveExpr
 | 
|---|
 | 8840 |             xpath_ast_node* parse_relational_expression()
 | 
|---|
 | 8841 |             {
 | 
|---|
 | 8842 |                 xpath_ast_node* n = parse_additive_expression();
 | 
|---|
 | 8843 | 
 | 
|---|
 | 8844 |                 while (_lexer.current() == lex_less || _lexer.current() == lex_less_or_equal || 
 | 
|---|
 | 8845 |                            _lexer.current() == lex_greater || _lexer.current() == lex_greater_or_equal)
 | 
|---|
 | 8846 |                 {
 | 
|---|
 | 8847 |                         lexeme_t l = _lexer.current();
 | 
|---|
 | 8848 |                         _lexer.next();
 | 
|---|
 | 8849 | 
 | 
|---|
 | 8850 |                                 xpath_ast_node* expr = parse_additive_expression();
 | 
|---|
 | 8851 | 
 | 
|---|
 | 8852 |                         n = new (alloc_node()) xpath_ast_node(l == lex_less ? ast_op_less : l == lex_greater ? ast_op_greater :
 | 
|---|
 | 8853 |                                                         l == lex_less_or_equal ? ast_op_less_or_equal : ast_op_greater_or_equal, xpath_type_boolean, n, expr);
 | 
|---|
 | 8854 |                 }
 | 
|---|
 | 8855 | 
 | 
|---|
 | 8856 |                 return n;
 | 
|---|
 | 8857 |             }
 | 
|---|
 | 8858 |             
 | 
|---|
 | 8859 |             // EqualityExpr ::= RelationalExpr
 | 
|---|
 | 8860 |             //                                  | EqualityExpr '=' RelationalExpr
 | 
|---|
 | 8861 |             //                                  | EqualityExpr '!=' RelationalExpr
 | 
|---|
 | 8862 |             xpath_ast_node* parse_equality_expression()
 | 
|---|
 | 8863 |             {
 | 
|---|
 | 8864 |                 xpath_ast_node* n = parse_relational_expression();
 | 
|---|
 | 8865 | 
 | 
|---|
 | 8866 |                 while (_lexer.current() == lex_equal || _lexer.current() == lex_not_equal)
 | 
|---|
 | 8867 |                 {
 | 
|---|
 | 8868 |                         lexeme_t l = _lexer.current();
 | 
|---|
 | 8869 | 
 | 
|---|
 | 8870 |                         _lexer.next();
 | 
|---|
 | 8871 | 
 | 
|---|
 | 8872 |                                 xpath_ast_node* expr = parse_relational_expression();
 | 
|---|
 | 8873 | 
 | 
|---|
 | 8874 |                         n = new (alloc_node()) xpath_ast_node(l == lex_equal ? ast_op_equal : ast_op_not_equal, xpath_type_boolean, n, expr);
 | 
|---|
 | 8875 |                 }
 | 
|---|
 | 8876 | 
 | 
|---|
 | 8877 |                 return n;
 | 
|---|
 | 8878 |             }
 | 
|---|
 | 8879 |             
 | 
|---|
 | 8880 |             // AndExpr ::= EqualityExpr | AndExpr 'and' EqualityExpr
 | 
|---|
 | 8881 |             xpath_ast_node* parse_and_expression()
 | 
|---|
 | 8882 |             {
 | 
|---|
 | 8883 |                 xpath_ast_node* n = parse_equality_expression();
 | 
|---|
 | 8884 | 
 | 
|---|
 | 8885 |                 while (_lexer.current() == lex_string && _lexer.contents() == PUGIXML_TEXT("and"))
 | 
|---|
 | 8886 |                 {
 | 
|---|
 | 8887 |                         _lexer.next();
 | 
|---|
 | 8888 | 
 | 
|---|
 | 8889 |                                 xpath_ast_node* expr = parse_equality_expression();
 | 
|---|
 | 8890 | 
 | 
|---|
 | 8891 |                         n = new (alloc_node()) xpath_ast_node(ast_op_and, xpath_type_boolean, n, expr);
 | 
|---|
 | 8892 |                 }
 | 
|---|
 | 8893 | 
 | 
|---|
 | 8894 |                 return n;
 | 
|---|
 | 8895 |             }
 | 
|---|
 | 8896 | 
 | 
|---|
 | 8897 |             // OrExpr ::= AndExpr | OrExpr 'or' AndExpr
 | 
|---|
 | 8898 |             xpath_ast_node* parse_or_expression()
 | 
|---|
 | 8899 |             {
 | 
|---|
 | 8900 |                 xpath_ast_node* n = parse_and_expression();
 | 
|---|
 | 8901 | 
 | 
|---|
 | 8902 |                 while (_lexer.current() == lex_string && _lexer.contents() == PUGIXML_TEXT("or"))
 | 
|---|
 | 8903 |                 {
 | 
|---|
 | 8904 |                         _lexer.next();
 | 
|---|
 | 8905 | 
 | 
|---|
 | 8906 |                                 xpath_ast_node* expr = parse_and_expression();
 | 
|---|
 | 8907 | 
 | 
|---|
 | 8908 |                         n = new (alloc_node()) xpath_ast_node(ast_op_or, xpath_type_boolean, n, expr);
 | 
|---|
 | 8909 |                 }
 | 
|---|
 | 8910 | 
 | 
|---|
 | 8911 |                 return n;
 | 
|---|
 | 8912 |             }
 | 
|---|
 | 8913 |                 
 | 
|---|
 | 8914 |                 // Expr ::= OrExpr
 | 
|---|
 | 8915 |                 xpath_ast_node* parse_expression()
 | 
|---|
 | 8916 |                 {
 | 
|---|
 | 8917 |                         return parse_or_expression();
 | 
|---|
 | 8918 |                 }
 | 
|---|
 | 8919 | 
 | 
|---|
 | 8920 |                 xpath_parser(const char_t* query, xpath_variable_set* variables, xpath_allocator* alloc, xpath_parse_result* result): _alloc(alloc), _lexer(query), _query(query), _variables(variables), _result(result)
 | 
|---|
 | 8921 |                 {
 | 
|---|
 | 8922 |                 }
 | 
|---|
 | 8923 | 
 | 
|---|
 | 8924 |                 xpath_ast_node* parse()
 | 
|---|
 | 8925 |                 {
 | 
|---|
 | 8926 |                         xpath_ast_node* result = parse_expression();
 | 
|---|
 | 8927 |                         
 | 
|---|
 | 8928 |                         if (_lexer.current() != lex_eof)
 | 
|---|
 | 8929 |                         {
 | 
|---|
 | 8930 |                                 // there are still unparsed tokens left, error
 | 
|---|
 | 8931 |                                 throw_error("Incorrect query");
 | 
|---|
 | 8932 |                         }
 | 
|---|
 | 8933 |                         
 | 
|---|
 | 8934 |                         return result;
 | 
|---|
 | 8935 |                 }
 | 
|---|
 | 8936 | 
 | 
|---|
 | 8937 |                 static xpath_ast_node* parse(const char_t* query, xpath_variable_set* variables, xpath_allocator* alloc, xpath_parse_result* result)
 | 
|---|
 | 8938 |                 {
 | 
|---|
 | 8939 |                         xpath_parser parser(query, variables, alloc, result);
 | 
|---|
 | 8940 | 
 | 
|---|
 | 8941 |                 #ifdef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 8942 |                         int error = setjmp(parser._error_handler);
 | 
|---|
 | 8943 | 
 | 
|---|
 | 8944 |                         return (error == 0) ? parser.parse() : 0;
 | 
|---|
 | 8945 |                 #else
 | 
|---|
 | 8946 |                         return parser.parse();
 | 
|---|
 | 8947 |                 #endif
 | 
|---|
 | 8948 |                 }
 | 
|---|
 | 8949 |         };
 | 
|---|
 | 8950 | 
 | 
|---|
 | 8951 |     struct xpath_query_impl
 | 
|---|
 | 8952 |     {
 | 
|---|
 | 8953 |                 static xpath_query_impl* create()
 | 
|---|
 | 8954 |                 {
 | 
|---|
 | 8955 |                         void* memory = global_allocate(sizeof(xpath_query_impl));
 | 
|---|
 | 8956 | 
 | 
|---|
 | 8957 |             return new (memory) xpath_query_impl();
 | 
|---|
 | 8958 |                 }
 | 
|---|
 | 8959 | 
 | 
|---|
 | 8960 |                 static void destroy(void* ptr)
 | 
|---|
 | 8961 |                 {
 | 
|---|
 | 8962 |                         if (!ptr) return;
 | 
|---|
 | 8963 |                         
 | 
|---|
 | 8964 |                         // free all allocated pages
 | 
|---|
 | 8965 |                         static_cast<xpath_query_impl*>(ptr)->alloc.release();
 | 
|---|
 | 8966 | 
 | 
|---|
 | 8967 |                         // free allocator memory (with the first page)
 | 
|---|
 | 8968 |                         global_deallocate(ptr);
 | 
|---|
 | 8969 |                 }
 | 
|---|
 | 8970 | 
 | 
|---|
 | 8971 |         xpath_query_impl(): root(0), alloc(&block)
 | 
|---|
 | 8972 |         {
 | 
|---|
 | 8973 |             block.next = 0;
 | 
|---|
 | 8974 |         }
 | 
|---|
 | 8975 | 
 | 
|---|
 | 8976 |         xpath_ast_node* root;
 | 
|---|
 | 8977 |         xpath_allocator alloc;
 | 
|---|
 | 8978 |         xpath_memory_block block;
 | 
|---|
 | 8979 |     };
 | 
|---|
 | 8980 | 
 | 
|---|
 | 8981 |         xpath_string evaluate_string_impl(xpath_query_impl* impl, const xpath_node& n, xpath_stack_data& sd)
 | 
|---|
 | 8982 |         {
 | 
|---|
 | 8983 |                 if (!impl) return xpath_string();
 | 
|---|
 | 8984 | 
 | 
|---|
 | 8985 |         #ifdef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 8986 |                 if (setjmp(sd.error_handler)) return xpath_string();
 | 
|---|
 | 8987 |         #endif
 | 
|---|
 | 8988 | 
 | 
|---|
 | 8989 |                 xpath_context c(n, 1, 1);
 | 
|---|
 | 8990 | 
 | 
|---|
 | 8991 |                 return impl->root->eval_string(c, sd.stack);
 | 
|---|
 | 8992 |         }
 | 
|---|
 | 8993 | }
 | 
|---|
 | 8994 | 
 | 
|---|
 | 8995 | namespace pugi
 | 
|---|
 | 8996 | {
 | 
|---|
 | 8997 | #ifndef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 8998 |         xpath_exception::xpath_exception(const xpath_parse_result& result): _result(result)
 | 
|---|
 | 8999 |         {
 | 
|---|
 | 9000 |                 assert(result.error);
 | 
|---|
 | 9001 |         }
 | 
|---|
 | 9002 |         
 | 
|---|
 | 9003 |         const char* xpath_exception::what() const throw()
 | 
|---|
 | 9004 |         {
 | 
|---|
 | 9005 |                 return _result.error;
 | 
|---|
 | 9006 |         }
 | 
|---|
 | 9007 | 
 | 
|---|
 | 9008 |         const xpath_parse_result& xpath_exception::result() const
 | 
|---|
 | 9009 |         {
 | 
|---|
 | 9010 |                 return _result;
 | 
|---|
 | 9011 |         }
 | 
|---|
 | 9012 | #endif
 | 
|---|
 | 9013 |         
 | 
|---|
 | 9014 |         xpath_node::xpath_node()
 | 
|---|
 | 9015 |         {
 | 
|---|
 | 9016 |         }
 | 
|---|
 | 9017 |                 
 | 
|---|
 | 9018 |         xpath_node::xpath_node(const xml_node& node): _node(node)
 | 
|---|
 | 9019 |         {
 | 
|---|
 | 9020 |         }
 | 
|---|
 | 9021 |                 
 | 
|---|
 | 9022 |         xpath_node::xpath_node(const xml_attribute& attribute, const xml_node& parent): _node(attribute ? parent : xml_node()), _attribute(attribute)
 | 
|---|
 | 9023 |         {
 | 
|---|
 | 9024 |         }
 | 
|---|
 | 9025 | 
 | 
|---|
 | 9026 |         xml_node xpath_node::node() const
 | 
|---|
 | 9027 |         {
 | 
|---|
 | 9028 |                 return _attribute ? xml_node() : _node;
 | 
|---|
 | 9029 |         }
 | 
|---|
 | 9030 |                 
 | 
|---|
 | 9031 |         xml_attribute xpath_node::attribute() const
 | 
|---|
 | 9032 |         {
 | 
|---|
 | 9033 |                 return _attribute;
 | 
|---|
 | 9034 |         }
 | 
|---|
 | 9035 |         
 | 
|---|
 | 9036 |         xml_node xpath_node::parent() const
 | 
|---|
 | 9037 |         {
 | 
|---|
 | 9038 |                 return _attribute ? _node : _node.parent();
 | 
|---|
 | 9039 |         }
 | 
|---|
 | 9040 | 
 | 
|---|
 | 9041 |         xpath_node::operator xpath_node::unspecified_bool_type() const
 | 
|---|
 | 9042 |         {
 | 
|---|
 | 9043 |                 return (_node || _attribute) ? &xpath_node::_node : 0;
 | 
|---|
 | 9044 |         }
 | 
|---|
 | 9045 |         
 | 
|---|
 | 9046 |         bool xpath_node::operator!() const
 | 
|---|
 | 9047 |         {
 | 
|---|
 | 9048 |                 return !(_node || _attribute);
 | 
|---|
 | 9049 |         }
 | 
|---|
 | 9050 | 
 | 
|---|
 | 9051 |         bool xpath_node::operator==(const xpath_node& n) const
 | 
|---|
 | 9052 |         {
 | 
|---|
 | 9053 |                 return _node == n._node && _attribute == n._attribute;
 | 
|---|
 | 9054 |         }
 | 
|---|
 | 9055 |         
 | 
|---|
 | 9056 |         bool xpath_node::operator!=(const xpath_node& n) const
 | 
|---|
 | 9057 |         {
 | 
|---|
 | 9058 |                 return _node != n._node || _attribute != n._attribute;
 | 
|---|
 | 9059 |         }
 | 
|---|
 | 9060 | 
 | 
|---|
 | 9061 | #ifdef __BORLANDC__
 | 
|---|
 | 9062 |         bool operator&&(const xpath_node& lhs, bool rhs)
 | 
|---|
 | 9063 |         {
 | 
|---|
 | 9064 |                 return (bool)lhs && rhs;
 | 
|---|
 | 9065 |         }
 | 
|---|
 | 9066 | 
 | 
|---|
 | 9067 |         bool operator||(const xpath_node& lhs, bool rhs)
 | 
|---|
 | 9068 |         {
 | 
|---|
 | 9069 |                 return (bool)lhs || rhs;
 | 
|---|
 | 9070 |         }
 | 
|---|
 | 9071 | #endif
 | 
|---|
 | 9072 | 
 | 
|---|
 | 9073 |         void xpath_node_set::_assign(const_iterator begin, const_iterator end)
 | 
|---|
 | 9074 |         {
 | 
|---|
 | 9075 |                 assert(begin <= end);
 | 
|---|
 | 9076 | 
 | 
|---|
 | 9077 |                 size_t size = static_cast<size_t>(end - begin);
 | 
|---|
 | 9078 | 
 | 
|---|
 | 9079 |                 if (size <= 1)
 | 
|---|
 | 9080 |                 {
 | 
|---|
 | 9081 |                         // deallocate old buffer
 | 
|---|
 | 9082 |                         if (_begin != &_storage) global_deallocate(_begin);
 | 
|---|
 | 9083 | 
 | 
|---|
 | 9084 |                         // use internal buffer
 | 
|---|
 | 9085 |                         if (begin != end) _storage = *begin;
 | 
|---|
 | 9086 | 
 | 
|---|
 | 9087 |                         _begin = &_storage;
 | 
|---|
 | 9088 |                         _end = &_storage + size;
 | 
|---|
 | 9089 |                 }
 | 
|---|
 | 9090 |                 else
 | 
|---|
 | 9091 |                 {
 | 
|---|
 | 9092 |                         // make heap copy
 | 
|---|
 | 9093 |                         xpath_node* storage = static_cast<xpath_node*>(global_allocate(size * sizeof(xpath_node)));
 | 
|---|
 | 9094 | 
 | 
|---|
 | 9095 |                         if (!storage)
 | 
|---|
 | 9096 |                         {
 | 
|---|
 | 9097 |                         #ifdef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 9098 |                                 return;
 | 
|---|
 | 9099 |                         #else
 | 
|---|
 | 9100 |                                 throw std::bad_alloc();
 | 
|---|
 | 9101 |                         #endif
 | 
|---|
 | 9102 |                         }
 | 
|---|
 | 9103 | 
 | 
|---|
 | 9104 |                         memcpy(storage, begin, size * sizeof(xpath_node));
 | 
|---|
 | 9105 |                         
 | 
|---|
 | 9106 |                         // deallocate old buffer
 | 
|---|
 | 9107 |                         if (_begin != &_storage) global_deallocate(_begin);
 | 
|---|
 | 9108 | 
 | 
|---|
 | 9109 |                         // finalize
 | 
|---|
 | 9110 |                         _begin = storage;
 | 
|---|
 | 9111 |                         _end = storage + size;
 | 
|---|
 | 9112 |                 }
 | 
|---|
 | 9113 |         }
 | 
|---|
 | 9114 | 
 | 
|---|
 | 9115 |         xpath_node_set::xpath_node_set(): _type(type_unsorted), _begin(&_storage), _end(&_storage)
 | 
|---|
 | 9116 |         {
 | 
|---|
 | 9117 |         }
 | 
|---|
 | 9118 | 
 | 
|---|
 | 9119 |         xpath_node_set::xpath_node_set(const_iterator begin, const_iterator end, type_t type): _type(type), _begin(&_storage), _end(&_storage)
 | 
|---|
 | 9120 |         {
 | 
|---|
 | 9121 |                 _assign(begin, end);
 | 
|---|
 | 9122 |         }
 | 
|---|
 | 9123 | 
 | 
|---|
 | 9124 |         xpath_node_set::~xpath_node_set()
 | 
|---|
 | 9125 |         {
 | 
|---|
 | 9126 |                 if (_begin != &_storage) global_deallocate(_begin);
 | 
|---|
 | 9127 |         }
 | 
|---|
 | 9128 |                 
 | 
|---|
 | 9129 |         xpath_node_set::xpath_node_set(const xpath_node_set& ns): _type(ns._type), _begin(&_storage), _end(&_storage)
 | 
|---|
 | 9130 |         {
 | 
|---|
 | 9131 |                 _assign(ns._begin, ns._end);
 | 
|---|
 | 9132 |         }
 | 
|---|
 | 9133 |         
 | 
|---|
 | 9134 |         xpath_node_set& xpath_node_set::operator=(const xpath_node_set& ns)
 | 
|---|
 | 9135 |         {
 | 
|---|
 | 9136 |                 if (this == &ns) return *this;
 | 
|---|
 | 9137 |                 
 | 
|---|
 | 9138 |                 _type = ns._type;
 | 
|---|
 | 9139 |                 _assign(ns._begin, ns._end);
 | 
|---|
 | 9140 | 
 | 
|---|
 | 9141 |                 return *this;
 | 
|---|
 | 9142 |         }
 | 
|---|
 | 9143 | 
 | 
|---|
 | 9144 |         xpath_node_set::type_t xpath_node_set::type() const
 | 
|---|
 | 9145 |         {
 | 
|---|
 | 9146 |                 return _type;
 | 
|---|
 | 9147 |         }
 | 
|---|
 | 9148 |                 
 | 
|---|
 | 9149 |         size_t xpath_node_set::size() const
 | 
|---|
 | 9150 |         {
 | 
|---|
 | 9151 |                 return _end - _begin;
 | 
|---|
 | 9152 |         }
 | 
|---|
 | 9153 |                 
 | 
|---|
 | 9154 |         bool xpath_node_set::empty() const
 | 
|---|
 | 9155 |         {
 | 
|---|
 | 9156 |                 return _begin == _end;
 | 
|---|
 | 9157 |         }
 | 
|---|
 | 9158 |                 
 | 
|---|
 | 9159 |         const xpath_node& xpath_node_set::operator[](size_t index) const
 | 
|---|
 | 9160 |         {
 | 
|---|
 | 9161 |                 assert(index < size());
 | 
|---|
 | 9162 |                 return _begin[index];
 | 
|---|
 | 9163 |         }
 | 
|---|
 | 9164 | 
 | 
|---|
 | 9165 |         xpath_node_set::const_iterator xpath_node_set::begin() const
 | 
|---|
 | 9166 |         {
 | 
|---|
 | 9167 |                 return _begin;
 | 
|---|
 | 9168 |         }
 | 
|---|
 | 9169 |                 
 | 
|---|
 | 9170 |         xpath_node_set::const_iterator xpath_node_set::end() const
 | 
|---|
 | 9171 |         {
 | 
|---|
 | 9172 |                 return _end;
 | 
|---|
 | 9173 |         }
 | 
|---|
 | 9174 |         
 | 
|---|
 | 9175 |         void xpath_node_set::sort(bool reverse)
 | 
|---|
 | 9176 |         {
 | 
|---|
 | 9177 |                 _type = xpath_sort(_begin, _end, _type, reverse);
 | 
|---|
 | 9178 |         }
 | 
|---|
 | 9179 | 
 | 
|---|
 | 9180 |         xpath_node xpath_node_set::first() const
 | 
|---|
 | 9181 |         {
 | 
|---|
 | 9182 |                 return xpath_first(_begin, _end, _type);
 | 
|---|
 | 9183 |         }
 | 
|---|
 | 9184 | 
 | 
|---|
 | 9185 |     xpath_parse_result::xpath_parse_result(): error("Internal error"), offset(0)
 | 
|---|
 | 9186 |     {
 | 
|---|
 | 9187 |     }
 | 
|---|
 | 9188 | 
 | 
|---|
 | 9189 |     xpath_parse_result::operator bool() const
 | 
|---|
 | 9190 |     {
 | 
|---|
 | 9191 |         return error == 0;
 | 
|---|
 | 9192 |     }
 | 
|---|
 | 9193 |         const char* xpath_parse_result::description() const
 | 
|---|
 | 9194 |         {
 | 
|---|
 | 9195 |                 return error ? error : "No error";
 | 
|---|
 | 9196 |         }
 | 
|---|
 | 9197 | 
 | 
|---|
 | 9198 |         xpath_variable::xpath_variable()
 | 
|---|
 | 9199 |     {
 | 
|---|
 | 9200 |     }
 | 
|---|
 | 9201 | 
 | 
|---|
 | 9202 |         const char_t* xpath_variable::name() const
 | 
|---|
 | 9203 |         {
 | 
|---|
 | 9204 |                 switch (_type)
 | 
|---|
 | 9205 |                 {
 | 
|---|
 | 9206 |                 case xpath_type_node_set:
 | 
|---|
 | 9207 |                         return static_cast<const xpath_variable_node_set*>(this)->name;
 | 
|---|
 | 9208 | 
 | 
|---|
 | 9209 |                 case xpath_type_number:
 | 
|---|
 | 9210 |                         return static_cast<const xpath_variable_number*>(this)->name;
 | 
|---|
 | 9211 | 
 | 
|---|
 | 9212 |                 case xpath_type_string:
 | 
|---|
 | 9213 |                         return static_cast<const xpath_variable_string*>(this)->name;
 | 
|---|
 | 9214 | 
 | 
|---|
 | 9215 |                 case xpath_type_boolean:
 | 
|---|
 | 9216 |                         return static_cast<const xpath_variable_boolean*>(this)->name;
 | 
|---|
 | 9217 | 
 | 
|---|
 | 9218 |                 default:
 | 
|---|
 | 9219 |                         assert(!"Invalid variable type");
 | 
|---|
 | 9220 |                         return 0;
 | 
|---|
 | 9221 |                 }
 | 
|---|
 | 9222 |         }
 | 
|---|
 | 9223 | 
 | 
|---|
 | 9224 |         xpath_value_type xpath_variable::type() const
 | 
|---|
 | 9225 |         {
 | 
|---|
 | 9226 |                 return _type;
 | 
|---|
 | 9227 |         }
 | 
|---|
 | 9228 | 
 | 
|---|
 | 9229 |         bool xpath_variable::get_boolean() const
 | 
|---|
 | 9230 |         {
 | 
|---|
 | 9231 |                 return (_type == xpath_type_boolean) ? static_cast<const xpath_variable_boolean*>(this)->value : false;
 | 
|---|
 | 9232 |         }
 | 
|---|
 | 9233 | 
 | 
|---|
 | 9234 |         double xpath_variable::get_number() const
 | 
|---|
 | 9235 |         {
 | 
|---|
 | 9236 |                 return (_type == xpath_type_number) ? static_cast<const xpath_variable_number*>(this)->value : gen_nan();
 | 
|---|
 | 9237 |         }
 | 
|---|
 | 9238 | 
 | 
|---|
 | 9239 |         const char_t* xpath_variable::get_string() const
 | 
|---|
 | 9240 |         {
 | 
|---|
 | 9241 |                 const char_t* value = (_type == xpath_type_string) ? static_cast<const xpath_variable_string*>(this)->value : 0;
 | 
|---|
 | 9242 |                 return value ? value : PUGIXML_TEXT("");
 | 
|---|
 | 9243 |         }
 | 
|---|
 | 9244 | 
 | 
|---|
 | 9245 |         const xpath_node_set& xpath_variable::get_node_set() const
 | 
|---|
 | 9246 |         {
 | 
|---|
 | 9247 |                 return (_type == xpath_type_node_set) ? static_cast<const xpath_variable_node_set*>(this)->value : dummy_node_set;
 | 
|---|
 | 9248 |         }
 | 
|---|
 | 9249 | 
 | 
|---|
 | 9250 |         bool xpath_variable::set(bool value)
 | 
|---|
 | 9251 |         {
 | 
|---|
 | 9252 |                 if (_type != xpath_type_boolean) return false;
 | 
|---|
 | 9253 | 
 | 
|---|
 | 9254 |                 static_cast<xpath_variable_boolean*>(this)->value = value;
 | 
|---|
 | 9255 |                 return true;
 | 
|---|
 | 9256 |         }
 | 
|---|
 | 9257 | 
 | 
|---|
 | 9258 |         bool xpath_variable::set(double value)
 | 
|---|
 | 9259 |         {
 | 
|---|
 | 9260 |                 if (_type != xpath_type_number) return false;
 | 
|---|
 | 9261 | 
 | 
|---|
 | 9262 |                 static_cast<xpath_variable_number*>(this)->value = value;
 | 
|---|
 | 9263 |                 return true;
 | 
|---|
 | 9264 |         }
 | 
|---|
 | 9265 | 
 | 
|---|
 | 9266 |         bool xpath_variable::set(const char_t* value)
 | 
|---|
 | 9267 |         {
 | 
|---|
 | 9268 |                 if (_type != xpath_type_string) return false;
 | 
|---|
 | 9269 | 
 | 
|---|
 | 9270 |                 xpath_variable_string* var = static_cast<xpath_variable_string*>(this);
 | 
|---|
 | 9271 | 
 | 
|---|
 | 9272 |                 // duplicate string
 | 
|---|
 | 9273 |                 size_t size = (strlength(value) + 1) * sizeof(char_t);
 | 
|---|
 | 9274 | 
 | 
|---|
 | 9275 |                 char_t* copy = static_cast<char_t*>(global_allocate(size));
 | 
|---|
 | 9276 |                 if (!copy) return false;
 | 
|---|
 | 9277 | 
 | 
|---|
 | 9278 |                 memcpy(copy, value, size);
 | 
|---|
 | 9279 | 
 | 
|---|
 | 9280 |                 // replace old string
 | 
|---|
 | 9281 |                 if (var->value) global_deallocate(var->value);
 | 
|---|
 | 9282 |                 var->value = copy;
 | 
|---|
 | 9283 | 
 | 
|---|
 | 9284 |                 return true;
 | 
|---|
 | 9285 |         }
 | 
|---|
 | 9286 | 
 | 
|---|
 | 9287 |         bool xpath_variable::set(const xpath_node_set& value)
 | 
|---|
 | 9288 |         {
 | 
|---|
 | 9289 |                 if (_type != xpath_type_node_set) return false;
 | 
|---|
 | 9290 | 
 | 
|---|
 | 9291 |                 static_cast<xpath_variable_node_set*>(this)->value = value;
 | 
|---|
 | 9292 |                 return true;
 | 
|---|
 | 9293 |         }
 | 
|---|
 | 9294 | 
 | 
|---|
 | 9295 |         xpath_variable_set::xpath_variable_set()
 | 
|---|
 | 9296 |         {
 | 
|---|
 | 9297 |                 for (size_t i = 0; i < sizeof(_data) / sizeof(_data[0]); ++i) _data[i] = 0;
 | 
|---|
 | 9298 |         }
 | 
|---|
 | 9299 | 
 | 
|---|
 | 9300 |         xpath_variable_set::~xpath_variable_set()
 | 
|---|
 | 9301 |         {
 | 
|---|
 | 9302 |                 for (size_t i = 0; i < sizeof(_data) / sizeof(_data[0]); ++i)
 | 
|---|
 | 9303 |                 {
 | 
|---|
 | 9304 |                         xpath_variable* var = _data[i];
 | 
|---|
 | 9305 | 
 | 
|---|
 | 9306 |                         while (var)
 | 
|---|
 | 9307 |                         {
 | 
|---|
 | 9308 |                                 xpath_variable* next = var->_next;
 | 
|---|
 | 9309 | 
 | 
|---|
 | 9310 |                                 delete_xpath_variable(var->_type, var);
 | 
|---|
 | 9311 | 
 | 
|---|
 | 9312 |                                 var = next;
 | 
|---|
 | 9313 |                         }
 | 
|---|
 | 9314 |                 }
 | 
|---|
 | 9315 |         }
 | 
|---|
 | 9316 | 
 | 
|---|
 | 9317 |         xpath_variable* xpath_variable_set::find(const char_t* name) const
 | 
|---|
 | 9318 |         {
 | 
|---|
 | 9319 |                 const size_t hash_size = sizeof(_data) / sizeof(_data[0]);
 | 
|---|
 | 9320 |                 size_t hash = hash_string(name) % hash_size;
 | 
|---|
 | 9321 | 
 | 
|---|
 | 9322 |                 // look for existing variable
 | 
|---|
 | 9323 |                 for (xpath_variable* var = _data[hash]; var; var = var->_next)
 | 
|---|
 | 9324 |                         if (strequal(var->name(), name))
 | 
|---|
 | 9325 |                                 return var;
 | 
|---|
 | 9326 | 
 | 
|---|
 | 9327 |                 return 0;
 | 
|---|
 | 9328 |         }
 | 
|---|
 | 9329 | 
 | 
|---|
 | 9330 |         xpath_variable* xpath_variable_set::add(const char_t* name, xpath_value_type type)
 | 
|---|
 | 9331 |         {
 | 
|---|
 | 9332 |                 const size_t hash_size = sizeof(_data) / sizeof(_data[0]);
 | 
|---|
 | 9333 |                 size_t hash = hash_string(name) % hash_size;
 | 
|---|
 | 9334 | 
 | 
|---|
 | 9335 |                 // look for existing variable
 | 
|---|
 | 9336 |                 for (xpath_variable* var = _data[hash]; var; var = var->_next)
 | 
|---|
 | 9337 |                         if (strequal(var->name(), name))
 | 
|---|
 | 9338 |                                 return var->type() == type ? var : 0;
 | 
|---|
 | 9339 | 
 | 
|---|
 | 9340 |                 // add new variable
 | 
|---|
 | 9341 |                 xpath_variable* result = new_xpath_variable(type, name);
 | 
|---|
 | 9342 | 
 | 
|---|
 | 9343 |                 if (result)
 | 
|---|
 | 9344 |                 {
 | 
|---|
 | 9345 |                         result->_type = type;
 | 
|---|
 | 9346 |                         result->_next = _data[hash];
 | 
|---|
 | 9347 | 
 | 
|---|
 | 9348 |                         _data[hash] = result;
 | 
|---|
 | 9349 |                 }
 | 
|---|
 | 9350 | 
 | 
|---|
 | 9351 |                 return result;
 | 
|---|
 | 9352 |         }
 | 
|---|
 | 9353 | 
 | 
|---|
 | 9354 |         bool xpath_variable_set::set(const char_t* name, bool value)
 | 
|---|
 | 9355 |         {
 | 
|---|
 | 9356 |                 xpath_variable* var = add(name, xpath_type_boolean);
 | 
|---|
 | 9357 |                 return var ? var->set(value) : false;
 | 
|---|
 | 9358 |         }
 | 
|---|
 | 9359 | 
 | 
|---|
 | 9360 |         bool xpath_variable_set::set(const char_t* name, double value)
 | 
|---|
 | 9361 |         {
 | 
|---|
 | 9362 |                 xpath_variable* var = add(name, xpath_type_number);
 | 
|---|
 | 9363 |                 return var ? var->set(value) : false;
 | 
|---|
 | 9364 |         }
 | 
|---|
 | 9365 | 
 | 
|---|
 | 9366 |         bool xpath_variable_set::set(const char_t* name, const char_t* value)
 | 
|---|
 | 9367 |         {
 | 
|---|
 | 9368 |                 xpath_variable* var = add(name, xpath_type_string);
 | 
|---|
 | 9369 |                 return var ? var->set(value) : false;
 | 
|---|
 | 9370 |         }
 | 
|---|
 | 9371 | 
 | 
|---|
 | 9372 |         bool xpath_variable_set::set(const char_t* name, const xpath_node_set& value)
 | 
|---|
 | 9373 |         {
 | 
|---|
 | 9374 |                 xpath_variable* var = add(name, xpath_type_node_set);
 | 
|---|
 | 9375 |                 return var ? var->set(value) : false;
 | 
|---|
 | 9376 |         }
 | 
|---|
 | 9377 | 
 | 
|---|
 | 9378 |         xpath_variable* xpath_variable_set::get(const char_t* name)
 | 
|---|
 | 9379 |         {
 | 
|---|
 | 9380 |                 return find(name);
 | 
|---|
 | 9381 |         }
 | 
|---|
 | 9382 | 
 | 
|---|
 | 9383 |         const xpath_variable* xpath_variable_set::get(const char_t* name) const
 | 
|---|
 | 9384 |         {
 | 
|---|
 | 9385 |                 return find(name);
 | 
|---|
 | 9386 |         }
 | 
|---|
 | 9387 | 
 | 
|---|
 | 9388 |         xpath_query::xpath_query(const char_t* query, xpath_variable_set* variables): _impl(0)
 | 
|---|
 | 9389 |         {
 | 
|---|
 | 9390 |                 xpath_query_impl* impl = xpath_query_impl::create();
 | 
|---|
 | 9391 | 
 | 
|---|
 | 9392 |                 if (!impl)
 | 
|---|
 | 9393 |                 {
 | 
|---|
 | 9394 |                 #ifdef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 9395 |                         _result.error = "Out of memory";
 | 
|---|
 | 9396 |         #else
 | 
|---|
 | 9397 |                         throw std::bad_alloc();
 | 
|---|
 | 9398 |                 #endif
 | 
|---|
 | 9399 |                 }
 | 
|---|
 | 9400 |                 else
 | 
|---|
 | 9401 |                 {
 | 
|---|
 | 9402 |                         buffer_holder impl_holder(impl, xpath_query_impl::destroy);
 | 
|---|
 | 9403 | 
 | 
|---|
 | 9404 |                         impl->root = xpath_parser::parse(query, variables, &impl->alloc, &_result);
 | 
|---|
 | 9405 | 
 | 
|---|
 | 9406 |                         if (impl->root)
 | 
|---|
 | 9407 |                         {
 | 
|---|
 | 9408 |                 _impl = static_cast<xpath_query_impl*>(impl_holder.release());
 | 
|---|
 | 9409 |                                 _result.error = 0;
 | 
|---|
 | 9410 |                         }
 | 
|---|
 | 9411 |                 }
 | 
|---|
 | 9412 |         }
 | 
|---|
 | 9413 | 
 | 
|---|
 | 9414 |         xpath_query::~xpath_query()
 | 
|---|
 | 9415 |         {
 | 
|---|
 | 9416 |                 xpath_query_impl::destroy(_impl);
 | 
|---|
 | 9417 |         }
 | 
|---|
 | 9418 | 
 | 
|---|
 | 9419 |         xpath_value_type xpath_query::return_type() const
 | 
|---|
 | 9420 |         {
 | 
|---|
 | 9421 |                 if (!_impl) return xpath_type_none;
 | 
|---|
 | 9422 | 
 | 
|---|
 | 9423 |                 return static_cast<xpath_query_impl*>(_impl)->root->rettype();
 | 
|---|
 | 9424 |         }
 | 
|---|
 | 9425 | 
 | 
|---|
 | 9426 |         bool xpath_query::evaluate_boolean(const xpath_node& n) const
 | 
|---|
 | 9427 |         {
 | 
|---|
 | 9428 |                 if (!_impl) return false;
 | 
|---|
 | 9429 |                 
 | 
|---|
 | 9430 |                 xpath_context c(n, 1, 1);
 | 
|---|
 | 9431 |                 xpath_stack_data sd;
 | 
|---|
 | 9432 | 
 | 
|---|
 | 9433 |         #ifdef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 9434 |                 if (setjmp(sd.error_handler)) return false;
 | 
|---|
 | 9435 |         #endif
 | 
|---|
 | 9436 |                 
 | 
|---|
 | 9437 |                 return static_cast<xpath_query_impl*>(_impl)->root->eval_boolean(c, sd.stack);
 | 
|---|
 | 9438 |         }
 | 
|---|
 | 9439 |         
 | 
|---|
 | 9440 |         double xpath_query::evaluate_number(const xpath_node& n) const
 | 
|---|
 | 9441 |         {
 | 
|---|
 | 9442 |                 if (!_impl) return gen_nan();
 | 
|---|
 | 9443 |                 
 | 
|---|
 | 9444 |                 xpath_context c(n, 1, 1);
 | 
|---|
 | 9445 |                 xpath_stack_data sd;
 | 
|---|
 | 9446 | 
 | 
|---|
 | 9447 |         #ifdef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 9448 |                 if (setjmp(sd.error_handler)) return gen_nan();
 | 
|---|
 | 9449 |         #endif
 | 
|---|
 | 9450 | 
 | 
|---|
 | 9451 |                 return static_cast<xpath_query_impl*>(_impl)->root->eval_number(c, sd.stack);
 | 
|---|
 | 9452 |         }
 | 
|---|
 | 9453 | 
 | 
|---|
 | 9454 | #ifndef PUGIXML_NO_STL
 | 
|---|
 | 9455 |         string_t xpath_query::evaluate_string(const xpath_node& n) const
 | 
|---|
 | 9456 |         {
 | 
|---|
 | 9457 |                 xpath_stack_data sd;
 | 
|---|
 | 9458 | 
 | 
|---|
 | 9459 |                 return evaluate_string_impl(static_cast<xpath_query_impl*>(_impl), n, sd).c_str();
 | 
|---|
 | 9460 |         }
 | 
|---|
 | 9461 | #endif
 | 
|---|
 | 9462 | 
 | 
|---|
 | 9463 |         size_t xpath_query::evaluate_string(char_t* buffer, size_t capacity, const xpath_node& n) const
 | 
|---|
 | 9464 |         {
 | 
|---|
 | 9465 |                 xpath_stack_data sd;
 | 
|---|
 | 9466 | 
 | 
|---|
 | 9467 |                 xpath_string r = evaluate_string_impl(static_cast<xpath_query_impl*>(_impl), n, sd);
 | 
|---|
 | 9468 | 
 | 
|---|
 | 9469 |                 size_t full_size = r.length() + 1;
 | 
|---|
 | 9470 |                 
 | 
|---|
 | 9471 |                 if (capacity > 0)
 | 
|---|
 | 9472 |         {
 | 
|---|
 | 9473 |             size_t size = (full_size < capacity) ? full_size : capacity;
 | 
|---|
 | 9474 |             assert(size > 0);
 | 
|---|
 | 9475 | 
 | 
|---|
 | 9476 |             memcpy(buffer, r.c_str(), (size - 1) * sizeof(char_t));
 | 
|---|
 | 9477 |             buffer[size - 1] = 0;
 | 
|---|
 | 9478 |         }
 | 
|---|
 | 9479 |                 
 | 
|---|
 | 9480 |                 return full_size;
 | 
|---|
 | 9481 |         }
 | 
|---|
 | 9482 | 
 | 
|---|
 | 9483 |         xpath_node_set xpath_query::evaluate_node_set(const xpath_node& n) const
 | 
|---|
 | 9484 |         {
 | 
|---|
 | 9485 |                 if (!_impl) return xpath_node_set();
 | 
|---|
 | 9486 | 
 | 
|---|
 | 9487 |         xpath_ast_node* root = static_cast<xpath_query_impl*>(_impl)->root;
 | 
|---|
 | 9488 | 
 | 
|---|
 | 9489 |                 if (root->rettype() != xpath_type_node_set)
 | 
|---|
 | 9490 |                 {
 | 
|---|
 | 9491 |                 #ifdef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 9492 |                         return xpath_node_set();
 | 
|---|
 | 9493 |                 #else
 | 
|---|
 | 9494 |                         xpath_parse_result result;
 | 
|---|
 | 9495 |                         result.error = "Expression does not evaluate to node set";
 | 
|---|
 | 9496 | 
 | 
|---|
 | 9497 |                         throw xpath_exception(result);
 | 
|---|
 | 9498 |                 #endif
 | 
|---|
 | 9499 |                 }
 | 
|---|
 | 9500 |                 
 | 
|---|
 | 9501 |                 xpath_context c(n, 1, 1);
 | 
|---|
 | 9502 |                 xpath_stack_data sd;
 | 
|---|
 | 9503 | 
 | 
|---|
 | 9504 |         #ifdef PUGIXML_NO_EXCEPTIONS
 | 
|---|
 | 9505 |                 if (setjmp(sd.error_handler)) return xpath_node_set();
 | 
|---|
 | 9506 |         #endif
 | 
|---|
 | 9507 | 
 | 
|---|
 | 9508 |                 xpath_node_set_raw r = root->eval_node_set(c, sd.stack);
 | 
|---|
 | 9509 | 
 | 
|---|
 | 9510 |                 return xpath_node_set(r.begin(), r.end(), r.type());
 | 
|---|
 | 9511 |         }
 | 
|---|
 | 9512 | 
 | 
|---|
 | 9513 |         const xpath_parse_result& xpath_query::result() const
 | 
|---|
 | 9514 |         {
 | 
|---|
 | 9515 |                 return _result;
 | 
|---|
 | 9516 |         }
 | 
|---|
 | 9517 | 
 | 
|---|
 | 9518 |         xpath_query::operator xpath_query::unspecified_bool_type() const
 | 
|---|
 | 9519 |         {
 | 
|---|
 | 9520 |                 return _impl ? &xpath_query::_impl : 0;
 | 
|---|
 | 9521 |         }
 | 
|---|
 | 9522 | 
 | 
|---|
 | 9523 |         bool xpath_query::operator!() const
 | 
|---|
 | 9524 |         {
 | 
|---|
 | 9525 |                 return !_impl;
 | 
|---|
 | 9526 |         }
 | 
|---|
 | 9527 | 
 | 
|---|
 | 9528 |         xpath_node xml_node::select_single_node(const char_t* query, xpath_variable_set* variables) const
 | 
|---|
 | 9529 |         {
 | 
|---|
 | 9530 |                 xpath_query q(query, variables);
 | 
|---|
 | 9531 |                 return select_single_node(q);
 | 
|---|
 | 9532 |         }
 | 
|---|
 | 9533 | 
 | 
|---|
 | 9534 |         xpath_node xml_node::select_single_node(const xpath_query& query) const
 | 
|---|
 | 9535 |         {
 | 
|---|
 | 9536 |                 xpath_node_set s = query.evaluate_node_set(*this);
 | 
|---|
 | 9537 |                 return s.empty() ? xpath_node() : s.first();
 | 
|---|
 | 9538 |         }
 | 
|---|
 | 9539 | 
 | 
|---|
 | 9540 |         xpath_node_set xml_node::select_nodes(const char_t* query, xpath_variable_set* variables) const
 | 
|---|
 | 9541 |         {
 | 
|---|
 | 9542 |                 xpath_query q(query, variables);
 | 
|---|
 | 9543 |                 return select_nodes(q);
 | 
|---|
 | 9544 |         }
 | 
|---|
 | 9545 | 
 | 
|---|
 | 9546 |         xpath_node_set xml_node::select_nodes(const xpath_query& query) const
 | 
|---|
 | 9547 |         {
 | 
|---|
 | 9548 |                 return query.evaluate_node_set(*this);
 | 
|---|
 | 9549 |         }
 | 
|---|
 | 9550 | }
 | 
|---|
 | 9551 | 
 | 
|---|
 | 9552 | #endif
 | 
|---|
 | 9553 | 
 | 
|---|
 | 9554 | /**
 | 
|---|
 | 9555 |  * Copyright (c) 2006-2010 Arseny Kapoulkine
 | 
|---|
 | 9556 |  *
 | 
|---|
 | 9557 |  * Permission is hereby granted, free of charge, to any person
 | 
|---|
 | 9558 |  * obtaining a copy of this software and associated documentation
 | 
|---|
 | 9559 |  * files (the "Software"), to deal in the Software without
 | 
|---|
 | 9560 |  * restriction, including without limitation the rights to use,
 | 
|---|
 | 9561 |  * copy, modify, merge, publish, distribute, sublicense, and/or sell
 | 
|---|
 | 9562 |  * copies of the Software, and to permit persons to whom the
 | 
|---|
 | 9563 |  * Software is furnished to do so, subject to the following
 | 
|---|
 | 9564 |  * conditions:
 | 
|---|
 | 9565 |  *
 | 
|---|
 | 9566 |  * The above copyright notice and this permission notice shall be
 | 
|---|
 | 9567 |  * included in all copies or substantial portions of the Software.
 | 
|---|
 | 9568 |  * 
 | 
|---|
 | 9569 |  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 | 
|---|
 | 9570 |  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
 | 
|---|
 | 9571 |  * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 | 
|---|
 | 9572 |  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
 | 
|---|
 | 9573 |  * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
 | 
|---|
 | 9574 |  * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 | 
|---|
 | 9575 |  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 | 
|---|
 | 9576 |  * OTHER DEALINGS IN THE SOFTWARE.
 | 
|---|
 | 9577 |  */
 | 
|---|