/* The code in this file is released into the Public Domain. */ #define CATCH_CONFIG_MAIN #include "catch.hpp" #include #include #include #include #include #include #include #include #include #include static std::string S_(const char* s) { return std::string{s}; } static std::string filename(const char* test_id, const char* suffix = "osm") { const char* testdir = getenv("TESTDIR"); if (!testdir) { std::cerr << "You have to set TESTDIR environment variable before running testdata-xml\n"; std::exit(2); } std::string f; f += testdir; f += "/"; f += test_id; f += "/data."; f += suffix; return f; } struct header_buffer_type { osmium::io::Header header; osmium::memory::Buffer buffer; }; // ============================================= // The following helper functions are used to call different parts of the // Osmium internals used to read and parse XML files. This way those parts // can be tested individually. These function can not be used in normal // operations, because they make certain assumptions, for instance that // file contents fit into small buffers. static std::string read_file(const char* test_id) { const int fd = osmium::io::detail::open_for_reading(filename(test_id)); assert(fd >= 0); std::string input(10000, '\0'); const auto n = ::read(fd, reinterpret_cast(const_cast(input.data())), 10000); assert(n >= 0); input.resize(static_cast(n)); close(fd); return input; } static std::string read_gz_file(const char* test_id, const char* suffix) { const int fd = osmium::io::detail::open_for_reading(filename(test_id, suffix)); assert(fd >= 0); osmium::io::GzipDecompressor gzip_decompressor{fd}; const std::string input = gzip_decompressor.read(); gzip_decompressor.close(); return input; } // cppcheck-suppress passedByValue static header_buffer_type parse_xml(std::string input) { osmium::thread::Pool pool; osmium::io::detail::future_string_queue_type input_queue; osmium::io::detail::future_buffer_queue_type output_queue; std::promise header_promise; std::future header_future = header_promise.get_future(); osmium::io::detail::add_to_queue(input_queue, std::move(input)); osmium::io::detail::add_to_queue(input_queue, std::string{}); osmium::io::detail::parser_arguments args = { pool, input_queue, output_queue, header_promise, osmium::osm_entity_bits::all, osmium::io::read_meta::yes }; osmium::io::detail::XMLParser parser{args}; parser.parse(); header_buffer_type result; result.header = header_future.get(); std::future future_buffer; output_queue.wait_and_pop(future_buffer); result.buffer = future_buffer.get(); if (result.buffer) { std::future future_buffer2; output_queue.wait_and_pop(future_buffer2); assert(!future_buffer2.get()); } return result; } static header_buffer_type read_xml(const char* test_id) { const std::string input = read_file(test_id); return parse_xml(input); } // ============================================= TEST_CASE("Reading OSM XML 100: Direct") { header_buffer_type r = read_xml("100-correct_but_no_data"); REQUIRE(r.header.get("generator") == "testdata"); REQUIRE(0 == r.buffer.committed()); REQUIRE(! r.buffer); } TEST_CASE("Reading OSM XML 100: Using Reader") { osmium::io::Reader reader{filename("100-correct_but_no_data")}; const osmium::io::Header header{reader.header()}; REQUIRE(header.get("generator") == "testdata"); osmium::memory::Buffer buffer = reader.read(); REQUIRE(0 == buffer.committed()); REQUIRE(! buffer); reader.close(); } TEST_CASE("Reading OSM XML 100: Using Reader asking for header only") { osmium::io::Reader reader{filename("100-correct_but_no_data"), osmium::osm_entity_bits::nothing}; const osmium::io::Header header{reader.header()}; REQUIRE(header.get("generator") == "testdata"); reader.close(); } // ============================================= TEST_CASE("Reading OSM XML 101: Direct") { REQUIRE_THROWS_AS(read_xml("101-missing_version"), osmium::format_version_error); try { read_xml("101-missing_version"); } catch (const osmium::format_version_error& e) { REQUIRE(e.version.empty()); } } TEST_CASE("Reading OSM XML 101: Using Reader") { REQUIRE_THROWS_AS([](){ osmium::io::Reader reader{filename("101-missing_version")}; const osmium::io::Header header{reader.header()}; osmium::memory::Buffer buffer = reader.read(); reader.close(); }(), osmium::format_version_error); } // ============================================= TEST_CASE("Reading OSM XML 102: Direct") { REQUIRE_THROWS_AS(read_xml("102-wrong_version"), osmium::format_version_error); try { read_xml("102-wrong_version"); } catch (const osmium::format_version_error& e) { REQUIRE(e.version == "0.1"); } } TEST_CASE("Reading OSM XML 102: Using Reader") { REQUIRE_THROWS_AS([](){ osmium::io::Reader reader{filename("102-wrong_version")}; const osmium::io::Header header{reader.header()}; osmium::memory::Buffer buffer = reader.read(); reader.close(); }(), osmium::format_version_error); } // ============================================= TEST_CASE("Reading OSM XML 103: Direct") { REQUIRE_THROWS_AS(read_xml("103-old_version"), osmium::format_version_error); try { read_xml("103-old_version"); } catch (const osmium::format_version_error& e) { REQUIRE(e.version == "0.5"); } } TEST_CASE("Reading OSM XML 103: Using Reader") { REQUIRE_THROWS_AS([](){ osmium::io::Reader reader{filename("103-old_version")}; const osmium::io::Header header{reader.header()}; osmium::memory::Buffer buffer = reader.read(); reader.close(); }(), osmium::format_version_error); } // ============================================= TEST_CASE("Reading OSM XML 104: Direct") { REQUIRE_THROWS_AS(read_xml("104-empty_file"), osmium::xml_error); try { read_xml("104-empty_file"); } catch (const osmium::xml_error& e) { REQUIRE(e.line == 1); REQUIRE(e.column == 0); } } TEST_CASE("Reading OSM XML 104: Using Reader") { REQUIRE_THROWS_AS([](){ osmium::io::Reader reader{filename("104-empty_file")}; const osmium::io::Header header{reader.header()}; osmium::memory::Buffer buffer = reader.read(); reader.close(); }(), osmium::xml_error); } // ============================================= TEST_CASE("Reading OSM XML 105: Direct") { REQUIRE_THROWS_AS(read_xml("105-incomplete_xml_file"), osmium::xml_error); } TEST_CASE("Reading OSM XML 105: Using Reader") { REQUIRE_THROWS_AS([](){ osmium::io::Reader reader{filename("105-incomplete_xml_file")}; const osmium::io::Header header{reader.header()}; osmium::memory::Buffer buffer = reader.read(); reader.close(); }(), osmium::xml_error); } // ============================================= TEST_CASE("Reading OSM XML 120: Direct") { std::string data = read_gz_file("120-correct_gzip_file_without_data", "osm.gz"); REQUIRE(data.size() == 102); header_buffer_type r = parse_xml(data); REQUIRE(r.header.get("generator") == "testdata"); REQUIRE(0 == r.buffer.committed()); REQUIRE(! r.buffer); } TEST_CASE("Reading OSM XML 120: Using Reader") { osmium::io::Reader reader{filename("120-correct_gzip_file_without_data", "osm.gz")}; const osmium::io::Header header{reader.header()}; REQUIRE(header.get("generator") == "testdata"); osmium::memory::Buffer buffer = reader.read(); REQUIRE(0 == buffer.committed()); REQUIRE(! buffer); reader.close(); } // ============================================= TEST_CASE("Reading OSM XML 121: Direct") { REQUIRE_THROWS_AS(read_gz_file("121-truncated_gzip_file", "osm.gz"), osmium::gzip_error); } TEST_CASE("Reading OSM XML 121: Using Reader") { // can throw osmium::gzip_error or osmium::xml_error REQUIRE_THROWS([](){ osmium::io::Reader reader{filename("121-truncated_gzip_file", "osm.gz")}; const osmium::io::Header header{reader.header()}; osmium::memory::Buffer buffer = reader.read(); reader.close(); }()); } // ============================================= TEST_CASE("Reading OSM XML 122: Direct") { REQUIRE_THROWS_AS(read_xml("122-no_osm_element"), osmium::xml_error); } TEST_CASE("Reading OSM XML 122: Using Reader") { REQUIRE_THROWS_AS([](){ osmium::io::Reader reader{filename("122-no_osm_element")}; const osmium::io::Header header{reader.header()}; osmium::memory::Buffer buffer = reader.read(); reader.close(); }(), osmium::xml_error); } // ============================================= TEST_CASE("Reading OSM XML 140: Using Reader") { osmium::io::Reader reader{filename("140-unicode")}; osmium::memory::Buffer buffer = reader.read(); reader.close(); int count = 0; for (const auto& node : buffer.select()) { ++count; REQUIRE(node.id() == count); const osmium::TagList& t = node.tags(); const char* uc = t["unicode_char"]; const auto len = atoi(t["unicode_utf8_length"]); REQUIRE(len == strlen(uc)); REQUIRE(S_(uc) == t["unicode_xml"]); // workaround for missing support for u8 string literals on Windows #if !defined(_MSC_VER) switch (count) { case 1: REQUIRE(S_(uc) == u8"a"); break; case 2: REQUIRE(S_(uc) == u8"\u00e4"); break; case 3: REQUIRE(S_(uc) == u8"\u30dc"); break; case 4: REQUIRE(S_(uc) == u8"\U0001d11e"); break; case 5: REQUIRE(S_(uc) == u8"\U0001f6eb"); break; default: REQUIRE(false); // should not be here } #endif } REQUIRE(count == 5); } // ============================================= TEST_CASE("Reading OSM XML 141: Using Reader") { osmium::io::Reader reader{filename("141-entities")}; osmium::memory::Buffer buffer = reader.read(); reader.close(); REQUIRE(buffer.committed() > 0); REQUIRE(buffer.get(0).type() == osmium::item_type::node); const osmium::Node& node = buffer.get(0); const osmium::TagList& tags = node.tags(); REQUIRE(S_(tags["less-than"]) == "<"); REQUIRE(S_(tags["greater-than"]) == ">"); REQUIRE(S_(tags["apostrophe"]) == "'"); REQUIRE(S_(tags["ampersand"]) == "&"); REQUIRE(S_(tags["quote"]) == "\""); } // ============================================= TEST_CASE("Reading OSM XML 142: Using Reader to read nodes") { osmium::io::Reader reader{filename("142-whitespace")}; osmium::memory::Buffer buffer = reader.read(); reader.close(); int count = 0; for (const auto& node : buffer.select()) { ++count; REQUIRE(node.id() == count); REQUIRE(node.tags().size() == 1); const osmium::Tag& tag = *(node.tags().begin()); switch (count) { case 1: REQUIRE(S_(node.user()) == "user name"); REQUIRE(S_(tag.key()) == "key with space"); REQUIRE(S_(tag.value()) == "value with space"); break; case 2: REQUIRE(S_(node.user()) == "line\nfeed"); REQUIRE(S_(tag.key()) == "key with\nlinefeed"); REQUIRE(S_(tag.value()) == "value with\nlinefeed"); break; case 3: REQUIRE(S_(node.user()) == "carriage\rreturn"); REQUIRE(S_(tag.key()) == "key with\rcarriage\rreturn"); REQUIRE(S_(tag.value()) == "value with\rcarriage\rreturn"); break; case 4: REQUIRE(S_(node.user()) == "tab\tulator"); REQUIRE(S_(tag.key()) == "key with\ttab"); REQUIRE(S_(tag.value()) == "value with\ttab"); break; case 5: REQUIRE(S_(node.user()) == "unencoded linefeed"); REQUIRE(S_(tag.key()) == "key with unencoded linefeed"); REQUIRE(S_(tag.value()) == "value with unencoded linefeed"); break; default: REQUIRE(false); // should not be here } } REQUIRE(count == 5); } TEST_CASE("Reading OSM XML 142: Using Reader to read relation") { osmium::io::Reader reader{filename("142-whitespace")}; osmium::memory::Buffer buffer = reader.read(); reader.close(); auto it = buffer.select().begin(); REQUIRE(it != buffer.select().end()); REQUIRE(it->id() == 21); const auto& members = it->members(); REQUIRE(members.size() == 5); int count = 0; for (const auto& member : members) { ++count; switch (count) { case 1: REQUIRE(S_(member.role()) == "role with whitespace"); break; case 2: REQUIRE(S_(member.role()) == "role with\nlinefeed"); break; case 3: REQUIRE(S_(member.role()) == "role with\rcarriage\rreturn"); break; case 4: REQUIRE(S_(member.role()) == "role with\ttab"); break; case 5: REQUIRE(S_(member.role()) == "role with unencoded linefeed"); break; default: REQUIRE(false); // should not be here } } REQUIRE(count == 5); } // ============================================= TEST_CASE("Reading OSM XML 200: Direct") { header_buffer_type r = read_xml("200-nodes"); REQUIRE(r.header.get("generator") == "testdata"); REQUIRE(r.buffer.committed() > 0); REQUIRE(r.buffer.get(0).type() == osmium::item_type::node); REQUIRE(r.buffer.get(0).id() == 36966060); REQUIRE(std::distance(r.buffer.begin(), r.buffer.end()) == 3); } TEST_CASE("Reading OSM XML 200: Using Reader") { osmium::io::Reader reader{filename("200-nodes")}; const osmium::io::Header header{reader.header()}; REQUIRE(header.get("generator") == "testdata"); osmium::memory::Buffer buffer = reader.read(); REQUIRE(buffer.committed() > 0); REQUIRE(buffer.get(0).type() == osmium::item_type::node); REQUIRE(buffer.get(0).id() == 36966060); REQUIRE(std::distance(buffer.begin(), buffer.end()) == 3); reader.close(); } TEST_CASE("Reading OSM XML 200: Using Reader asking for nodes") { osmium::io::Reader reader{filename("200-nodes"), osmium::osm_entity_bits::node}; const osmium::io::Header header{reader.header()}; REQUIRE(header.get("generator") == "testdata"); osmium::memory::Buffer buffer = reader.read(); REQUIRE(buffer.committed() > 0); REQUIRE(buffer.get(0).type() == osmium::item_type::node); REQUIRE(buffer.get(0).id() == 36966060); REQUIRE(std::distance(buffer.begin(), buffer.end()) == 3); reader.close(); } TEST_CASE("Reading OSM XML 200: Using Reader asking for header only") { osmium::io::Reader reader{filename("200-nodes"), osmium::osm_entity_bits::nothing}; const osmium::io::Header header{reader.header()}; REQUIRE(header.get("generator") == "testdata"); REQUIRE_FALSE(reader.read()); REQUIRE_THROWS(reader.read()); reader.close(); } TEST_CASE("Reading OSM XML 200: Using Reader asking for ways") { osmium::io::Reader reader{filename("200-nodes"), osmium::osm_entity_bits::way}; const osmium::io::Header header{reader.header()}; REQUIRE(header.get("generator") == "testdata"); osmium::memory::Buffer buffer = reader.read(); REQUIRE(0 == buffer.committed()); REQUIRE(! buffer); reader.close(); }