/* Copyright (c) 2013, Project OSRM, Dennis Luxen, others All rights reserved. Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ #include "Extractor.h" #include "ExtractionContainers.h" #include "ExtractionNode.h" #include "ExtractionWay.h" #include "ExtractorCallbacks.h" #include "RestrictionParser.h" #include "ScriptingEnvironment.h" #include "../Util/GitDescription.h" #include "../Util/IniFileUtil.h" #include "../Util/OSRMException.h" #include "../Util/simple_logger.hpp" #include "../Util/TimingUtil.h" #include "../Util/make_unique.hpp" #include "../typedefs.h" #include #include #include #include #include #include #include #include #include #include Extractor::Extractor() : requested_num_threads(0), file_has_pbf_format(false) { } int lua_error_callback(lua_State *L) // This is so I can use my own function as an // exception handler, pcall_log() { luabind::object error_msg(luabind::from_stack(L, -1)); std::ostringstream error_stream; error_stream << error_msg; throw OSRMException("ERROR occured in profile script:\n" + error_stream.str()); } bool Extractor::ParseArguments(int argc, char *argv[]) { // declare a group of options that will be allowed only on command line boost::program_options::options_description generic_options("Options"); generic_options.add_options()("version,v", "Show version")("help,h", "Show this help message")( "config,c", boost::program_options::value(&config_file_path) ->default_value("extractor.ini"), "Path to a configuration file."); // declare a group of options that will be allowed both on command line and in config file boost::program_options::options_description config_options("Configuration"); config_options.add_options()("profile,p", boost::program_options::value( &profile_path)->default_value("profile.lua"), "Path to LUA routing profile")( "threads,t", boost::program_options::value(&requested_num_threads) ->default_value(tbb::task_scheduler_init::default_num_threads()), "Number of threads to use"); // hidden options, will be allowed both on command line and in config file, but will not be // shown to the user boost::program_options::options_description hidden_options("Hidden options"); hidden_options.add_options()( "input,i", boost::program_options::value(&input_path), "Input file in .osm, .osm.bz2 or .osm.pbf format"); // positional option boost::program_options::positional_options_description positional_options; positional_options.add("input", 1); // combine above options for parsing boost::program_options::options_description cmdline_options; cmdline_options.add(generic_options).add(config_options).add(hidden_options); boost::program_options::options_description config_file_options; config_file_options.add(config_options).add(hidden_options); boost::program_options::options_description visible_options( boost::filesystem::basename(argv[0]) + " [options]"); visible_options.add(generic_options).add(config_options); // parse command line options boost::program_options::variables_map option_variables; boost::program_options::store(boost::program_options::command_line_parser(argc, argv) .options(cmdline_options) .positional(positional_options) .run(), option_variables); if (option_variables.count("version")) { SimpleLogger().Write() << g_GIT_DESCRIPTION; return false; } if (option_variables.count("help")) { SimpleLogger().Write() << visible_options; return false; } boost::program_options::notify(option_variables); // parse config file if (boost::filesystem::is_regular_file(config_file_path)) { SimpleLogger().Write() << "Reading options from: " << config_file_path.string(); std::string ini_file_contents = ReadIniFileAndLowerContents(config_file_path); std::stringstream config_stream(ini_file_contents); boost::program_options::store(parse_config_file(config_stream, config_file_options), option_variables); boost::program_options::notify(option_variables); } if (!option_variables.count("input")) { SimpleLogger().Write() << visible_options; return false; } return true; } void Extractor::GenerateOutputFilesNames() { output_file_name = input_path.string(); restriction_file_name = input_path.string(); std::string::size_type pos = output_file_name.find(".osm.bz2"); if (pos == std::string::npos) { pos = output_file_name.find(".osm.pbf"); if (pos != std::string::npos) { file_has_pbf_format = true; } else { pos = output_file_name.find(".osm.xml"); } } if (pos == std::string::npos) { pos = output_file_name.find(".pbf"); if (pos != std::string::npos) { file_has_pbf_format = true; } } if (pos == std::string::npos) { pos = output_file_name.find(".osm"); if (pos == std::string::npos) { output_file_name.append(".osrm"); restriction_file_name.append(".osrm.restrictions"); timestamp_file_name.append(".osrm.timestamp"); } else { output_file_name.replace(pos, 5, ".osrm"); restriction_file_name.replace(pos, 5, ".osrm.restrictions"); timestamp_file_name.replace(pos, 5, ".osrm.timestamp"); } } else { output_file_name.replace(pos, 8, ".osrm"); restriction_file_name.replace(pos, 8, ".osrm.restrictions"); timestamp_file_name.replace(pos, 8, ".osrm.timestamp"); } } int Extractor::Run(int argc, char *argv[]) { try { LogPolicy::GetInstance().Unmute(); TIMER_START(extracting); if (!ParseArguments(argc, argv)) return 0; if (1 > requested_num_threads) { SimpleLogger().Write(logWARNING) << "Number of threads must be 1 or larger"; return 1; } if (!boost::filesystem::is_regular_file(input_path)) { SimpleLogger().Write(logWARNING) << "Input file " << input_path.string() << " not found!"; return 1; } if (!boost::filesystem::is_regular_file(profile_path)) { SimpleLogger().Write(logWARNING) << "Profile " << profile_path.string() << " not found!"; return 1; } const unsigned recommended_num_threads = tbb::task_scheduler_init::default_num_threads(); SimpleLogger().Write() << "Input file: " << input_path.filename().string(); SimpleLogger().Write() << "Profile: " << profile_path.filename().string(); SimpleLogger().Write() << "Threads: " << requested_num_threads; if (recommended_num_threads != requested_num_threads) { SimpleLogger().Write(logWARNING) << "The recommended number of threads is " << recommended_num_threads << "! This setting may have performance side-effects."; } tbb::task_scheduler_init init(requested_num_threads); /*** Setup Scripting Environment ***/ ScriptingEnvironment scripting_environment(profile_path.string().c_str()); GenerateOutputFilesNames(); std::unordered_map string_map; ExtractionContainers extraction_containers; string_map[""] = 0; auto extractor_callbacks = osrm::make_unique(extraction_containers, string_map); osmium::io::File infile(input_path.string()); osmium::io::Reader reader(infile); osmium::io::Header header = reader.header(); unsigned number_of_nodes = 0; unsigned number_of_ways = 0; unsigned number_of_relations = 0; unsigned number_of_others = 0; SimpleLogger().Write() << "Parsing in progress.."; TIMER_START(parsing); std::string generator = header.get("generator"); if (generator.empty()) { generator = "unknown tool"; } SimpleLogger().Write() << "input file generated by " << generator; // TODO: write timestamp if non-empty std::string timestamp = header.get("osmosis_replication_timestamp"); if (timestamp.empty()) { timestamp = "n/a"; } SimpleLogger().Write() << "timestamp: " << timestamp; boost::filesystem::ofstream timestamp_out(timestamp_file_name); timestamp_out.write(timestamp.c_str(), timestamp.length()); timestamp_out.close(); lua_State *lua_state = scripting_environment.getLuaState(); luabind::set_pcall_callback(&lua_error_callback); RestrictionParser restriction_parser(scripting_environment); ExtractionNode result_node; ExtractionWay result_way; while (osmium::memory::Buffer buffer = reader.read()) { for (osmium::OSMEntity &entity : buffer) { switch (entity.type()) { case osmium::item_type::node: ++number_of_nodes; result_node.Clear(); luabind::call_function( lua_state, "node_function", boost::cref(static_cast(entity)), boost::ref(result_node)); extractor_callbacks->ProcessNode(static_cast(entity), result_node); break; case osmium::item_type::way: ++number_of_ways; result_way.Clear(); luabind::call_function( lua_state, "way_function", boost::cref(static_cast(entity)), boost::ref(result_way)); extractor_callbacks->ProcessWay(static_cast(entity), result_way); break; case osmium::item_type::relation: ++number_of_relations; extractor_callbacks->ProcessRestriction( restriction_parser.TryParse(static_cast(entity))); break; default: ++number_of_others; break; } } } TIMER_STOP(parsing); SimpleLogger().Write() << "Parsing finished after " << TIMER_SEC(parsing) << " seconds"; extractor_callbacks.reset(); if (extraction_containers.all_edges_list.empty()) { SimpleLogger().Write(logWARNING) << "The input data is empty, exiting."; return 1; } extraction_containers.PrepareData(output_file_name, restriction_file_name); TIMER_STOP(extracting); SimpleLogger().Write() << "extraction finished after " << TIMER_SEC(extracting) << "s"; SimpleLogger().Write() << "To prepare the data for routing, run: " << "./osrm-prepare " << output_file_name << std::endl; } catch (boost::program_options::too_many_positional_options_error &) { SimpleLogger().Write(logWARNING) << "Only one input file can be specified"; return 1; } catch (std::exception &e) { SimpleLogger().Write(logWARNING) << e.what(); return 1; } return 0; }