mirror of
https://github.com/zeux/pugixml.git
synced 2025-01-15 02:17:56 +08:00
47c15ad949
Introduce a notable behavior change in default parsing mode: documents without a document element node are now considered invalid. This is technically a breaking change, however the amount of documents it affects is very small, all parsed data still persists, and lack of this check results in very confusing behavior in a number of cases. In order to be able to parse documents without an element node, a fragment parsing flag is introduced. Parsing a buffer in fragment mode treats the buffer as a fragment of a valid XML. As a consequence, top-level PCDATA is added to the tree; additionally, there are no restrictions on the number of nodes -- so documents without a document element are considered valid. Due to the way parsing works internally, load_buffer_inplace occasionally can not preserve the document contents if it's parsed in a fragment mode. While unfortunate, this problem is fundamental; since the use case is relatively obscure, hopefully documenting this shortcoming will be enough. git-svn-id: https://pugixml.googlecode.com/svn/trunk@980 99668b35-9821-0410-8761-19e4c4f06640
237 lines
4.9 KiB
C++
237 lines
4.9 KiB
C++
#include "common.hpp"
|
|
|
|
#include "writer_string.hpp"
|
|
|
|
#include <string>
|
|
|
|
namespace
{
    // Number of calls made to allocate() and deallocate() respectively.
    // The tests in this file reset both to zero before installing the hooks.
    int allocate_count = 0;
    int deallocate_count = 0;

    // Counting allocation hook: records the call, then returns a block of
    // `size` bytes obtained with array new.
    void* allocate(size_t size)
    {
        ++allocate_count;
        return new char[size];
    }

    // Counting deallocation hook: records the call, then releases `ptr`
    // with array delete, matching the array new used by allocate().
    void deallocate(void* ptr)
    {
        ++deallocate_count;

        // void* -> char* is a plain pointer conversion; static_cast is the
        // appropriate named cast, reinterpret_cast is not needed here.
        delete[] static_cast<char*>(ptr);
    }
}
|
|
|
|
TEST(memory_custom_memory_management)
{
    // Capture the currently installed hooks so they can be reinstated at the end.
    allocation_function saved_allocate = get_memory_allocation_function();
    deallocation_function saved_deallocate = get_memory_deallocation_function();

    // Start from clean counters; every check below compares against exact values.
    allocate_count = 0;
    deallocate_count = 0;

    // Route allocations through the counting hooks.
    set_memory_management_functions(allocate, deallocate);

    {
        // Constructing an empty document is expected not to call the hooks.
        xml_document doc;

        CHECK(allocate_count == 0 && deallocate_count == 0);

        // Parsing a single-element document: two allocations, nothing released.
        CHECK(doc.load(STR("<node />")));

        CHECK(allocate_count == 2 && deallocate_count == 0);

        // Short rename: counters must stay unchanged (no new page).
        CHECK(doc.first_child().set_name(STR("foobars")));
        CHECK(allocate_count == 2 && deallocate_count == 0);

        // 65536-character rename: exactly one more allocation (new page).
        std::basic_string<pugi::char_t> s(65536, 'x');

        CHECK(doc.first_child().set_name(s.c_str()));
        CHECK(allocate_count == 3 && deallocate_count == 0);

        // Name twice as long: one more allocation, and the page that held
        // the previous name is expected to be released.
        s += s;

        CHECK(doc.first_child().set_name(s.c_str()));
        CHECK(allocate_count == 4 && deallocate_count == 1);
    }

    // The document is out of scope now; every allocation must have been returned.
    CHECK(allocate_count == 4 && deallocate_count == 4);

    // Reinstate the hooks that were active on entry.
    set_memory_management_functions(saved_allocate, saved_deallocate);
}
|
|
|
|
TEST(memory_large_allocations)
{
    // Capture the currently installed hooks so they can be reinstated at the end.
    allocation_function saved_allocate = get_memory_allocation_function();
    deallocation_function saved_deallocate = get_memory_deallocation_function();

    // Start from clean counters.
    allocate_count = 0;
    deallocate_count = 0;

    // Route allocations through the counting hooks.
    set_memory_management_functions(allocate, deallocate);

    {
        xml_document doc;

        CHECK(allocate_count == 0 && deallocate_count == 0);

        // Initial fill: 128 text nodes whose values are 0, 128, ..., 127 * 128
        // characters long.
        for (size_t i = 0; i < 128; ++i)
        {
            std::basic_string<pugi::char_t> s(i * 128, 'x');

            CHECK(doc.append_child(node_pcdata).set_value(s.c_str()));
        }

        CHECK(allocate_count > 0 && deallocate_count == 0);

        // Grow-prune rounds, repeated until the document has no children left.
        while (doc.first_child())
        {
            pugi::xml_node node;

            // Grow: double the value of every remaining node.
            node = doc.first_child();

            while (node)
            {
                std::basic_string<pugi::char_t> s = node.value();

                CHECK(node.set_value((s + s).c_str()));

                node = node.next_sibling();
            }

            // Prune: remove the first node and every second node after it.
            // The successor is looked up before the removal.
            node = doc.first_child();

            while (node)
            {
                pugi::xml_node after_skipped = node.next_sibling().next_sibling();

                node.parent().remove_child(node);

                node = after_skipped;
            }
        }

        CHECK(allocate_count == deallocate_count + 1); // only one live page left (it waits for new allocations)

        // Loading an empty in-place buffer in fragment mode; the buffer size
        // passed is 0, so only the address of `buffer` is supplied.
        char buffer;
        CHECK(doc.load_buffer_inplace(&buffer, 0, parse_fragment, get_native_encoding()));

        CHECK(allocate_count == deallocate_count); // no live pages left
    }

    CHECK(allocate_count == deallocate_count); // everything is freed

    // Reinstate the hooks that were active on entry.
    set_memory_management_functions(saved_allocate, saved_deallocate);
}
|
|
|
|
TEST(memory_string_allocate_increasing)
{
    typedef std::basic_string<char_t> string_t;

    xml_document doc;

    // Leading one-character marker node.
    xml_node marker = doc.append_child(node_pcdata);
    marker.set_value(STR("x"));

    // Append 17 text nodes; the value starts as "ab" and doubles in length
    // after each node is added.
    string_t chunk = STR("ab");

    for (int round = 0; round < 17; ++round)
    {
        xml_node text = doc.append_child(node_pcdata);
        text.set_value(chunk.c_str());

        chunk += chunk;
    }

    std::string result = save_narrow(doc, format_no_declaration | format_raw, encoding_utf8);

    // Expected size: 1 ('x') + 2 * (2^17 - 1) characters of "ab" repetitions.
    CHECK(result.size() == 262143);
    CHECK(result[0] == 'x');

    // After the marker the output must alternate 'a' (odd index) / 'b' (even index).
    for (size_t j = 1; j < result.size(); ++j)
    {
        CHECK(result[j] == (j % 2 ? 'a' : 'b'));
    }
}
|
|
|
|
TEST(memory_string_allocate_decreasing)
{
    typedef std::basic_string<char_t> string_t;

    xml_document doc;

    // Build "ab" doubled 17 times up front.
    string_t chunk = STR("ab");

    for (int doubling = 0; doubling < 17; ++doubling)
    {
        chunk += chunk;
    }

    // Append 17 text nodes, halving the value before each one is added.
    for (int round = 0; round < 17; ++round)
    {
        chunk.resize(chunk.size() / 2);

        xml_node text = doc.append_child(node_pcdata);
        text.set_value(chunk.c_str());
    }

    // Trailing one-character marker node.
    xml_node marker = doc.append_child(node_pcdata);
    marker.set_value(STR("x"));

    std::string result = save_narrow(doc, format_no_declaration | format_raw, encoding_utf8);

    // Expected size: 2 * (2^17 - 1) characters of "ab" repetitions + 1 ('x').
    CHECK(result.size() == 262143);
    CHECK(result[result.size() - 1] == 'x');

    // Everything before the marker must alternate 'a' (even index) / 'b' (odd index).
    for (size_t k = 0; k + 1 < result.size(); ++k)
    {
        CHECK(result[k] == (k % 2 ? 'b' : 'a'));
    }
}
|
|
|
|
TEST(memory_string_allocate_increasing_inplace)
{
    typedef std::basic_string<char_t> string_t;

    xml_document doc;

    // A single text node whose value is overwritten repeatedly.
    xml_node text = doc.append_child(node_pcdata);
    text.set_value(STR("x"));

    // Overwrite the value 17 times; the string starts as "ab" and doubles
    // after each assignment, so the last value set is 131072 characters long.
    string_t chunk = STR("ab");

    for (int round = 0; round < 17; ++round)
    {
        text.set_value(chunk.c_str());

        chunk += chunk;
    }

    std::string result = save_narrow(doc, format_no_declaration | format_raw, encoding_utf8);

    // Only the last value assigned should be present in the output.
    CHECK(result.size() == 131072);

    // The output must alternate 'a' (even index) / 'b' (odd index).
    for (size_t j = 0; j < result.size(); ++j)
    {
        CHECK(result[j] == (j % 2 ? 'b' : 'a'));
    }
}
|
|
|
|
TEST(memory_string_allocate_decreasing_inplace)
{
    typedef std::basic_string<char_t> string_t;

    xml_document doc;

    // A single text node whose value is overwritten repeatedly.
    xml_node text = doc.append_child(node_pcdata);

    // Build "ab" doubled 17 times up front.
    string_t chunk = STR("ab");

    for (int doubling = 0; doubling < 17; ++doubling)
    {
        chunk += chunk;
    }

    // Overwrite the value 17 times, halving the string before each assignment.
    for (int round = 0; round < 17; ++round)
    {
        chunk.resize(chunk.size() / 2);

        text.set_value(chunk.c_str());
    }

    // Final overwrite with a one-character value.
    text.set_value(STR("x"));

    std::string result = save_narrow(doc, format_no_declaration | format_raw, encoding_utf8);

    // Only the last value assigned should be present in the output.
    CHECK(result == "x");
}
|