/* The code in this file is released into the Public Domain. */ #define CATCH_CONFIG_MAIN #include "catch.hpp" #include #include #include #include #include #include #include #include std::string S_(const char* s) { return std::string(s); } std::string filename(const char* test_id, const char* suffix = "osm") { const char* testdir = getenv("TESTDIR"); if (!testdir) { std::cerr << "You have to set TESTDIR environment variable before running testdata-xml\n"; exit(2); } std::string f; f += testdir; f += "/"; f += test_id; f += "/data."; f += suffix; return f; } struct header_buffer_type { osmium::io::Header header; osmium::memory::Buffer buffer; }; // ============================================= // The following helper functions are used to call different parts of the // Osmium internals used to read and parse XML files. This way those parts // can be tested individually. These function can not be used in normal // operations, because they make certain assumptions, for instance that // file contents fit into small buffers. std::string read_file(const char* test_id) { int fd = osmium::io::detail::open_for_reading(filename(test_id)); assert(fd >= 0); std::string input(10000, '\0'); auto n = ::read(fd, reinterpret_cast(const_cast(input.data())), 10000); assert(n >= 0); input.resize(static_cast(n)); close(fd); return input; } std::string read_gz_file(const char* test_id, const char* suffix) { int fd = osmium::io::detail::open_for_reading(filename(test_id, suffix)); assert(fd >= 0); osmium::io::GzipDecompressor gzip_decompressor(fd); std::string input = gzip_decompressor.read(); gzip_decompressor.close(); return input; } header_buffer_type parse_xml(std::string input) { osmium::io::detail::future_string_queue_type input_queue; osmium::io::detail::future_buffer_queue_type output_queue; std::promise header_promise; std::future header_future = header_promise.get_future(); osmium::io::detail::add_to_queue(input_queue, std::move(input)); osmium::io::detail::add_to_queue(input_queue, std::string{}); osmium::io::detail::XMLParser parser(input_queue, output_queue, header_promise, osmium::osm_entity_bits::all); parser.parse(); header_buffer_type result; result.header = header_future.get(); std::future future_buffer; output_queue.wait_and_pop(future_buffer); result.buffer = future_buffer.get(); if (result.buffer) { std::future future_buffer2; output_queue.wait_and_pop(future_buffer2); assert(!future_buffer2.get()); } return result; } header_buffer_type read_xml(const char* test_id) { std::string input = read_file(test_id); return parse_xml(input); } // ============================================= TEST_CASE("Reading OSM XML 100") { SECTION("Direct") { header_buffer_type r = read_xml("100-correct_but_no_data"); REQUIRE(r.header.get("generator") == "testdata"); REQUIRE(0 == r.buffer.committed()); REQUIRE(! r.buffer); } SECTION("Using Reader") { osmium::io::Reader reader(filename("100-correct_but_no_data")); osmium::io::Header header = reader.header(); REQUIRE(header.get("generator") == "testdata"); osmium::memory::Buffer buffer = reader.read(); REQUIRE(0 == buffer.committed()); REQUIRE(! buffer); reader.close(); } SECTION("Using Reader asking for header only") { osmium::io::Reader reader(filename("100-correct_but_no_data"), osmium::osm_entity_bits::nothing); osmium::io::Header header = reader.header(); REQUIRE(header.get("generator") == "testdata"); reader.close(); } } // ============================================= TEST_CASE("Reading OSM XML 101") { SECTION("Direct") { REQUIRE_THROWS_AS(read_xml("101-missing_version"), osmium::format_version_error); try { read_xml("101-missing_version"); } catch (osmium::format_version_error& e) { REQUIRE(e.version.empty()); } } SECTION("Using Reader") { REQUIRE_THROWS_AS({ osmium::io::Reader reader(filename("101-missing_version")); osmium::io::Header header = reader.header(); osmium::memory::Buffer buffer = reader.read(); reader.close(); }, osmium::format_version_error); } } // ============================================= TEST_CASE("Reading OSM XML 102") { SECTION("Direct") { REQUIRE_THROWS_AS(read_xml("102-wrong_version"), osmium::format_version_error); try { read_xml("102-wrong_version"); } catch (osmium::format_version_error& e) { REQUIRE(e.version == "0.1"); } } SECTION("Using Reader") { REQUIRE_THROWS_AS({ osmium::io::Reader reader(filename("102-wrong_version")); osmium::io::Header header = reader.header(); osmium::memory::Buffer buffer = reader.read(); reader.close(); }, osmium::format_version_error); } } // ============================================= TEST_CASE("Reading OSM XML 103") { SECTION("Direct") { REQUIRE_THROWS_AS(read_xml("103-old_version"), osmium::format_version_error); try { read_xml("103-old_version"); } catch (osmium::format_version_error& e) { REQUIRE(e.version == "0.5"); } } SECTION("Using Reader") { REQUIRE_THROWS_AS({ osmium::io::Reader reader(filename("103-old_version")); osmium::io::Header header = reader.header(); osmium::memory::Buffer buffer = reader.read(); reader.close(); }, osmium::format_version_error); } } // ============================================= TEST_CASE("Reading OSM XML 104") { SECTION("Direct") { REQUIRE_THROWS_AS(read_xml("104-empty_file"), osmium::xml_error); try { read_xml("104-empty_file"); } catch (osmium::xml_error& e) { REQUIRE(e.line == 1); REQUIRE(e.column == 0); } } SECTION("Using Reader") { REQUIRE_THROWS_AS({ osmium::io::Reader reader(filename("104-empty_file")); osmium::io::Header header = reader.header(); osmium::memory::Buffer buffer = reader.read(); reader.close(); }, osmium::xml_error); } } // ============================================= TEST_CASE("Reading OSM XML 105") { SECTION("Direct") { REQUIRE_THROWS_AS(read_xml("105-incomplete_xml_file"), osmium::xml_error); } SECTION("Using Reader") { REQUIRE_THROWS_AS({ osmium::io::Reader reader(filename("105-incomplete_xml_file")); osmium::io::Header header = reader.header(); osmium::memory::Buffer buffer = reader.read(); reader.close(); }, osmium::xml_error); } } // ============================================= TEST_CASE("Reading OSM XML 120") { SECTION("Direct") { std::string data = read_gz_file("120-correct_gzip_file_without_data", "osm.gz"); REQUIRE(data.size() == 102); header_buffer_type r = parse_xml(data); REQUIRE(r.header.get("generator") == "testdata"); REQUIRE(0 == r.buffer.committed()); REQUIRE(! r.buffer); } SECTION("Using Reader") { osmium::io::Reader reader(filename("120-correct_gzip_file_without_data", "osm.gz")); osmium::io::Header header = reader.header(); REQUIRE(header.get("generator") == "testdata"); osmium::memory::Buffer buffer = reader.read(); REQUIRE(0 == buffer.committed()); REQUIRE(! buffer); reader.close(); } } // ============================================= TEST_CASE("Reading OSM XML 121") { SECTION("Direct") { REQUIRE_THROWS_AS( { read_gz_file("121-truncated_gzip_file", "osm.gz"); }, osmium::gzip_error); } SECTION("Using Reader") { // can throw osmium::gzip_error or osmium::xml_error REQUIRE_THROWS({ osmium::io::Reader reader(filename("121-truncated_gzip_file", "osm.gz")); osmium::io::Header header = reader.header(); osmium::memory::Buffer buffer = reader.read(); reader.close(); }); } } // ============================================= TEST_CASE("Reading OSM XML 122") { SECTION("Direct") { REQUIRE_THROWS_AS( { read_xml("122-no_osm_element"); }, osmium::xml_error); } SECTION("Using Reader") { REQUIRE_THROWS_AS({ osmium::io::Reader reader(filename("122-no_osm_element")); osmium::io::Header header = reader.header(); osmium::memory::Buffer buffer = reader.read(); reader.close(); }, osmium::xml_error); } } // ============================================= TEST_CASE("Reading OSM XML 140") { SECTION("Using Reader") { osmium::io::Reader reader(filename("140-unicode")); osmium::memory::Buffer buffer = reader.read(); reader.close(); int count = 0; for (auto it = buffer.begin(); it != buffer.end(); ++it) { ++count; REQUIRE(it->id() == count); const osmium::TagList& t = it->tags(); const char* uc = t["unicode_char"]; auto len = atoi(t["unicode_utf8_length"]); REQUIRE(len == strlen(uc)); REQUIRE(S_(uc) == t["unicode_xml"]); // workaround for missing support for u8 string literals on Windows #if !defined(_MSC_VER) switch (count) { case 1: REQUIRE(S_(uc) == u8"a"); break; case 2: REQUIRE(S_(uc) == u8"\u00e4"); break; case 3: REQUIRE(S_(uc) == u8"\u30dc"); break; case 4: REQUIRE(S_(uc) == u8"\U0001d11e"); break; case 5: REQUIRE(S_(uc) == u8"\U0001f6eb"); break; default: REQUIRE(false); // should not be here } #endif } REQUIRE(count == 5); } } // ============================================= TEST_CASE("Reading OSM XML 141") { SECTION("Using Reader") { osmium::io::Reader reader(filename("141-entities")); osmium::memory::Buffer buffer = reader.read(); reader.close(); REQUIRE(buffer.committed() > 0); REQUIRE(buffer.get(0).type() == osmium::item_type::node); const osmium::Node& node = buffer.get(0); const osmium::TagList& tags = node.tags(); REQUIRE(S_(tags["less-than"]) == "<"); REQUIRE(S_(tags["greater-than"]) == ">"); REQUIRE(S_(tags["apostrophe"]) == "'"); REQUIRE(S_(tags["ampersand"]) == "&"); REQUIRE(S_(tags["quote"]) == "\""); } } // ============================================= TEST_CASE("Reading OSM XML 142") { SECTION("Using Reader to read nodes") { osmium::io::Reader reader(filename("142-whitespace")); osmium::memory::Buffer buffer = reader.read(); reader.close(); int count = 0; for (auto it = buffer.begin(); it != buffer.end(); ++it) { ++count; REQUIRE(it->id() == count); REQUIRE(it->tags().size() == 1); const osmium::Tag& tag = *(it->tags().begin()); switch (count) { case 1: REQUIRE(S_(it->user()) == "user name"); REQUIRE(S_(tag.key()) == "key with space"); REQUIRE(S_(tag.value()) == "value with space"); break; case 2: REQUIRE(S_(it->user()) == "line\nfeed"); REQUIRE(S_(tag.key()) == "key with\nlinefeed"); REQUIRE(S_(tag.value()) == "value with\nlinefeed"); break; case 3: REQUIRE(S_(it->user()) == "carriage\rreturn"); REQUIRE(S_(tag.key()) == "key with\rcarriage\rreturn"); REQUIRE(S_(tag.value()) == "value with\rcarriage\rreturn"); break; case 4: REQUIRE(S_(it->user()) == "tab\tulator"); REQUIRE(S_(tag.key()) == "key with\ttab"); REQUIRE(S_(tag.value()) == "value with\ttab"); break; case 5: REQUIRE(S_(it->user()) == "unencoded linefeed"); REQUIRE(S_(tag.key()) == "key with unencoded linefeed"); REQUIRE(S_(tag.value()) == "value with unencoded linefeed"); break; default: REQUIRE(false); // should not be here } } REQUIRE(count == 5); } SECTION("Using Reader to read relation") { osmium::io::Reader reader(filename("142-whitespace")); osmium::memory::Buffer buffer = reader.read(); reader.close(); auto it = buffer.begin(); REQUIRE(it != buffer.end()); REQUIRE(it->id() == 21); const auto& members = it->members(); REQUIRE(members.size() == 5); int count = 0; for (const auto& member : members) { ++count; switch (count) { case 1: REQUIRE(S_(member.role()) == "role with whitespace"); break; case 2: REQUIRE(S_(member.role()) == "role with\nlinefeed"); break; case 3: REQUIRE(S_(member.role()) == "role with\rcarriage\rreturn"); break; case 4: REQUIRE(S_(member.role()) == "role with\ttab"); break; case 5: REQUIRE(S_(member.role()) == "role with unencoded linefeed"); break; default: REQUIRE(false); // should not be here } } REQUIRE(count == 5); } } // ============================================= TEST_CASE("Reading OSM XML 200") { SECTION("Direct") { header_buffer_type r = read_xml("200-nodes"); REQUIRE(r.header.get("generator") == "testdata"); REQUIRE(r.buffer.committed() > 0); REQUIRE(r.buffer.get(0).type() == osmium::item_type::node); REQUIRE(r.buffer.get(0).id() == 36966060); REQUIRE(std::distance(r.buffer.begin(), r.buffer.end()) == 3); } SECTION("Using Reader") { osmium::io::Reader reader(filename("200-nodes")); osmium::io::Header header = reader.header(); REQUIRE(header.get("generator") == "testdata"); osmium::memory::Buffer buffer = reader.read(); REQUIRE(buffer.committed() > 0); REQUIRE(buffer.get(0).type() == osmium::item_type::node); REQUIRE(buffer.get(0).id() == 36966060); REQUIRE(std::distance(buffer.begin(), buffer.end()) == 3); reader.close(); } SECTION("Using Reader asking for nodes") { osmium::io::Reader reader(filename("200-nodes"), osmium::osm_entity_bits::node); osmium::io::Header header = reader.header(); REQUIRE(header.get("generator") == "testdata"); osmium::memory::Buffer buffer = reader.read(); REQUIRE(buffer.committed() > 0); REQUIRE(buffer.get(0).type() == osmium::item_type::node); REQUIRE(buffer.get(0).id() == 36966060); REQUIRE(std::distance(buffer.begin(), buffer.end()) == 3); reader.close(); } SECTION("Using Reader asking for header only") { osmium::io::Reader reader(filename("200-nodes"), osmium::osm_entity_bits::nothing); osmium::io::Header header = reader.header(); REQUIRE(header.get("generator") == "testdata"); REQUIRE_THROWS({ reader.read(); }); reader.close(); } SECTION("Using Reader asking for ways") { osmium::io::Reader reader(filename("200-nodes"), osmium::osm_entity_bits::way); osmium::io::Header header = reader.header(); REQUIRE(header.get("generator") == "testdata"); osmium::memory::Buffer buffer = reader.read(); REQUIRE(0 == buffer.committed()); REQUIRE(! buffer); reader.close(); } }