diff --git a/coding/files_container.hpp b/coding/files_container.hpp index 7f2e13b96b..48c025472c 100644 --- a/coding/files_container.hpp +++ b/coding/files_container.hpp @@ -19,6 +19,16 @@ class FilesContainerBase public: using Tag = std::string; + struct Info + { + Tag m_tag; + uint64_t m_offset; + uint64_t m_size; + + Info() {} + Info(Tag const & tag, uint64_t offset) : m_tag(tag), m_offset(offset) {} + }; + /// Alignment of each new section that will be added to a file /// container, i.e. section's offset in bytes will be a multiple of /// this value. @@ -32,22 +42,12 @@ public: } template - void ForEachTag(ToDo && toDo) const + void ForEachInfo(ToDo && toDo) const { std::for_each(m_info.begin(), m_info.end(), std::forward(toDo)); } protected: - struct Info - { - Tag m_tag; - uint64_t m_offset; - uint64_t m_size; - - Info() {} - Info(Tag const & tag, uint64_t offset) : m_tag(tag), m_offset(offset) {} - }; - struct LessInfo { bool operator() (Info const & t1, Info const & t2) const @@ -100,8 +100,6 @@ protected: Tag const & m_tag; }; - friend std::string DebugPrint(Info const & info); - Info const * GetInfo(Tag const & tag) const; template @@ -111,6 +109,8 @@ protected: InfoContainer m_info; }; +std::string DebugPrint(FilesContainerBase::Info const & info); + class FilesContainerR : public FilesContainerBase { public: diff --git a/generator/CMakeLists.txt b/generator/CMakeLists.txt index 3630b8e919..173fad176e 100644 --- a/generator/CMakeLists.txt +++ b/generator/CMakeLists.txt @@ -253,6 +253,7 @@ set( omim_add_library(${PROJECT_NAME} ${SRC}) +omim_add_pybindings_subdirectory(pygen) omim_add_test_subdirectory(generator_tests_support) omim_add_test_subdirectory(generator_tests) omim_add_test_subdirectory(generator_integration_tests) diff --git a/generator/pygen/CMakeLists.txt b/generator/pygen/CMakeLists.txt new file mode 100644 index 0000000000..5d94ce4c56 --- /dev/null +++ b/generator/pygen/CMakeLists.txt @@ -0,0 +1,53 @@ +project(pygen) + +set( + SRC + pygen.cpp +) + +include_directories(${CMAKE_BINARY_DIR}) + +omim_add_library(${PROJECT_NAME} MODULE ${SRC}) + +omim_link_libraries( + ${PROJECT_NAME} + generator + routing + traffic + routing_common + descriptions + transit + ugc + search + storage + editor + indexer + mwm_diff + platform + geometry + coding + base + opening_hours + freetype + expat + icu + jansson + protobuf + bsdiff + stats_client + minizip + succinct + pugixml + tess2 + gflags + oauthcpp + sqlite3 + ${CMAKE_DL_LIBS} + ${LIBZ} + ${Boost_LIBRARIES} +) + +link_qt5_core(${PROJECT_NAME}) +link_qt5_network(${PROJECT_NAME}) + +set_target_properties(${PROJECT_NAME} PROPERTIES PREFIX "") diff --git a/generator/pygen/example.py b/generator/pygen/example.py new file mode 100644 index 0000000000..f99dba4b8c --- /dev/null +++ b/generator/pygen/example.py @@ -0,0 +1,50 @@ +#!/usr/bin/env python + +import argparse + +from pygen import classif +from pygen import mwm + + +def main(args): + map = mwm.Mwm(args.m) + print("{} with type {} has {} features.".format(args.m, map.type(), len(map))) + print("Mwm version is {}".format(map.version())) + print("Bounds are {}".format(map.bounds())) + print("Sections info is {}".format(map.sections_info())) + + fts_with_metadata = [ft for ft in map if ft.metadata()] + print("{} features have metadata.".format(len(fts_with_metadata))) + + first = fts_with_metadata[0] + print(first) + + metadata = first.metadata() + if mwm.EType.FMD_CUISINE in metadata: + print("Metadata has mwm.EType.FMD_CUISINE.") + + if mwm.EType.FMD_WEBSITE in metadata: + print("Metadata has mwm.EType.FMD_WEBSITE.") + + for k, v in metadata.items(): + print("{}: {}".format(k, v)) + + last = fts_with_metadata[-1] + print(last.metadata()) + for t in last.types(): + print(classif.readable_type(t)) + + print("Index is {}".format(last.index())) + print("Center is {}".format(last.center())) + print( + "Names are {}, readable name is {}.".format(last.names(), last.readable_name()) + ) + + +if __name__ == "__main__": + parser = argparse.ArgumentParser(description="Example usage of pygen module.") + parser.add_argument( + "-m", metavar="MWM_PATH", type=str, default="", help="Path to mwm files." + ) + args = parser.parse_args() + main(args) diff --git a/generator/pygen/pygen.cpp b/generator/pygen/pygen.cpp new file mode 100644 index 0000000000..25f3dd5deb --- /dev/null +++ b/generator/pygen/pygen.cpp @@ -0,0 +1,311 @@ +#include "generator/utils.hpp" + +#include "indexer/classificator.hpp" +#include "indexer/classificator_loader.hpp" +#include "indexer/feature.hpp" +#include "indexer/feature_decl.hpp" +#include "indexer/feature_meta.hpp" +#include "indexer/feature_processor.hpp" +#include "indexer/features_vector.hpp" + +#include "platform/mwm_version.hpp" + +#include "coding/string_utf8_multilang.hpp" + +#include "geometry/point2d.hpp" +#include "geometry/rect2d.hpp" + +#include "base/assert.hpp" +#include "base/logging.hpp" + +#include "pyhelpers/module_version.hpp" + +#include +#include + +#include "3party/boost/boost/noncopyable.hpp" +#include "3party/boost/boost/python.hpp" +#include "3party/boost/boost/shared_ptr.hpp" + +using namespace feature; +namespace bp = boost::python; + +namespace +{ +class MwmIter; + +class Mwm +{ +public: + explicit Mwm(std::string const & filename) + : m_ds(filename) + , m_mwmValue(m_ds.GetLocalCountryFile()) + , m_guard(std::make_unique(m_ds.GetDataSource(), m_ds.GetMwmId())) + { + } + + version::MwmVersion const & GetVersion() const { return m_mwmValue.GetMwmVersion(); } + DataHeader::MapType GetType() const { return m_mwmValue.GetHeader().GetType(); } + m2::RectD GetBounds() const { return m_mwmValue.GetHeader().GetBounds(); } + size_t Size() const { return m_guard->GetNumFeatures(); } + boost::shared_ptr GetNthFeature(uint32_t index) + { + return m_guard->GetFeatureByIndex(index); + } + + bp::dict GetSectionsInfo() const + { + bp::dict sectionsInfo; + m_mwmValue.m_cont.ForEachInfo([&](auto const & info) { sectionsInfo[info.m_tag] = info; }); + return sectionsInfo; + } + + MwmIter MakeMwmIter(); + +private: + generator::SingleMwmDataSource m_ds; + MwmValue m_mwmValue; + std::unique_ptr m_guard; +}; + +class MwmIter +{ +public: + MwmIter(Mwm & mwm) : m_mwm(mwm) {} + + boost::shared_ptr Next() + { + if (m_current == m_mwm.Size()) + { + PyErr_SetNone(PyExc_StopIteration); + bp::throw_error_already_set(); + } + + return m_mwm.GetNthFeature(m_current++); + } + +private: + Mwm & m_mwm; + uint32_t m_current = 0; +}; + +MwmIter Mwm::MakeMwmIter() { return MwmIter(*this); } + +struct GeometryNamespace +{ +}; + +struct MwmNamespace +{ +}; + +struct ClassifNamespace +{ +}; +} // namespace + +BOOST_PYTHON_MODULE(pygen) +{ + bp::scope().attr("__version__") = PYBINDINGS_VERSION; + + classificator::Load(); + + { + bp::scope geometryNamespace = bp::class_("geometry"); + + bp::class_("PointD", bp::init()) + .def_readwrite("x", &m2::PointD::x) + .def_readwrite("y", &m2::PointD::y) + .def("__repr__", static_cast(m2::DebugPrint)); + + bp::class_("RectD", bp::init()) + .def(bp::init()) + .add_property("min_x", &m2::RectD::minX, &m2::RectD::setMinX) + .add_property("min_y", &m2::RectD::minY, &m2::RectD::setMinY) + .add_property("max_x", &m2::RectD::maxX, &m2::RectD::setMaxX) + .add_property("max_y", &m2::RectD::maxY, &m2::RectD::setMaxY) + .add_property( + "right_top", &m2::RectD::RightTop, + +[](m2::RectD & self, m2::RectD const & p) { + self.setMaxX(p.maxX()); + self.setMaxY(p.maxY()); + }) + .add_property( + "left_bottom", &m2::RectD::LeftBottom, + +[](m2::RectD & self, m2::RectD const & p) { + self.setMinX(p.minX()); + self.setMinY(p.minY()); + }) + .def("__repr__", static_cast(m2::DebugPrint)); + } + { + bp::scope mwmNamespace = bp::class_("mwm"); + + bp::enum_("EType") + .value("FMD_CUISINE", Metadata::EType::FMD_CUISINE) + .value("FMD_OPEN_HOURS", Metadata::EType::FMD_OPEN_HOURS) + .value("FMD_PHONE_NUMBER", Metadata::EType::FMD_PHONE_NUMBER) + .value("FMD_FAX_NUMBER", Metadata::EType::FMD_FAX_NUMBER) + .value("FMD_STARS", Metadata::EType::FMD_STARS) + .value("FMD_OPERATOR", Metadata::EType::FMD_OPERATOR) + .value("FMD_URL", Metadata::EType::FMD_URL) + .value("FMD_WEBSITE", Metadata::EType::FMD_WEBSITE) + .value("FMD_INTERNET", Metadata::EType::FMD_INTERNET) + .value("FMD_ELE", Metadata::EType::FMD_ELE) + .value("FMD_TURN_LANES", Metadata::EType::FMD_TURN_LANES) + .value("FMD_TURN_LANES_FORWARD", Metadata::EType::FMD_TURN_LANES_FORWARD) + .value("FMD_TURN_LANES_BACKWARD", Metadata::EType::FMD_TURN_LANES_BACKWARD) + .value("FMD_EMAIL", Metadata::EType::FMD_EMAIL) + .value("FMD_POSTCODE", Metadata::EType::FMD_POSTCODE) + .value("FMD_WIKIPEDIA", Metadata::EType::FMD_WIKIPEDIA) + .value("FMD_FLATS", Metadata::EType::FMD_FLATS) + .value("FMD_HEIGHT", Metadata::EType::FMD_HEIGHT) + .value("FMD_MIN_HEIGHT", Metadata::EType::FMD_MIN_HEIGHT) + .value("FMD_DENOMINATION", Metadata::EType::FMD_DENOMINATION) + .value("FMD_BUILDING_LEVELS", Metadata::EType::FMD_BUILDING_LEVELS) + .value("FMD_TEST_ID", Metadata::EType::FMD_TEST_ID) + .value("FMD_SPONSORED_ID", Metadata::EType::FMD_SPONSORED_ID) + .value("FMD_PRICE_RATE", Metadata::EType::FMD_PRICE_RATE) + .value("FMD_RATING", Metadata::EType::FMD_RATING) + .value("FMD_BANNER_URL", Metadata::EType::FMD_BANNER_URL) + .value("FMD_LEVEL", Metadata::EType::FMD_LEVEL) + .value("FMD_AIRPORT_IATA", Metadata::EType::FMD_AIRPORT_IATA) + .value("FMD_BRAND", Metadata::EType::FMD_BRAND) + .value("FMD_DURATION", Metadata::EType::FMD_DURATION); + + bp::enum_("GeomType") + .value("Undefined", GeomType::Undefined) + .value("Point", GeomType::Point) + .value("Line", GeomType::Line) + .value("Area", GeomType::Area); + + bp::enum_("MapType") + .value("World", DataHeader::MapType::World) + .value("WorldCoasts", DataHeader::MapType::WorldCoasts) + .value("Country", DataHeader::MapType::Country); + + bp::enum_("MwmFormat") + .value("unknown", version::Format::unknownFormat) + .value("v1", version::Format::v1) + .value("v2", version::Format::v2) + .value("v3", version::Format::v3) + .value("v4", version::Format::v4) + .value("v5", version::Format::v5) + .value("v6", version::Format::v6) + .value("v7", version::Format::v7) + .value("v8", version::Format::v8) + .value("v9", version::Format::v9) + .value("last", version::Format::lastFormat); + + bp::class_("SectionInfo", bp::no_init) + .def_readwrite("tag", &FilesContainerR::Info::m_tag) + .def_readwrite("offset", &FilesContainerR::Info::m_offset) + .def_readwrite("size", &FilesContainerR::Info::m_size) + .def("__repr__", static_cast(DebugPrint)); + + bp::class_("MwmVersion", bp::no_init) + .def("format", &version::MwmVersion::GetFormat) + .def("seconds_since_epoch", &version::MwmVersion::GetSecondsSinceEpoch) + .def("version", &version::MwmVersion::GetVersion) + .def("__repr__", + static_cast(version::DebugPrint)); + + bp::class_, boost::noncopyable>("FeatureType", + bp::no_init) + .def( + "index", +[](FeatureType const & self) { return self.GetID().m_index; }) + .def( + "types", + +[](FeatureType & self) { + bp::list types; + self.ForEachType([&](auto t) { types.append(t); }); + return types; + }) + .def( + "metadata", + +[](FeatureType & self) { + bp::dict mmetadata; + auto const & metadata = self.GetMetadata(); + for (auto k : metadata.GetKeys()) + mmetadata[k] = metadata.Get(k); + + return mmetadata; + }) + .def( + "names", + +[](FeatureType & self) { + bp::dict mnames; + auto const & name = self.GetNames(); + name.ForEach([&](auto code, auto && str) { + mnames[StringUtf8Multilang::GetLangByCode(code)] = std::move(str); + }); + + return mnames; + }) + .def( + "readable_name", + +[](FeatureType & self) { + std::string name; + self.GetReadableName(name); + return name; + }) + .def("rank", &FeatureType::GetRank) + .def("population", &FeatureType::GetPopulation) + .def("road_number", &FeatureType::GetRoadNumber) + .def("house_number", &FeatureType::GetHouseNumber) + .def("postcode", &FeatureType::GetPostcode, bp::return_internal_reference<>()) + .def("layer", &FeatureType::GetLayer) + .def("geom_type", &FeatureType::GetGeomType) + .def("center", &FeatureType::GetCenter) + .def( + "geometry", + +[](FeatureType & self) { + bp::list points; + switch (self.GetGeomType()) + { + case GeomType::Point: + case GeomType::Line: + { + self.ForEachPoint([&](auto const & p) { points.append(p); }, + FeatureType::BEST_GEOMETRY); + } + break; + case GeomType::Area: + { + for (auto const & p : self.GetTrianglesAsPoints(FeatureType::BEST_GEOMETRY)) + points.append(p); + } + break; + case GeomType::Undefined: break; + default: UNREACHABLE(); + } + return points; + }) + .def( + "limit_rect", + +[](FeatureType & self) { return self.GetLimitRect(FeatureType::BEST_GEOMETRY); }) + .def( + "__repr__", + +[](FeatureType & self) { return self.DebugString(FeatureType::BEST_GEOMETRY); }); + + bp::class_("MwmIter", bp::no_init) + .def( + "__iter__", +[](MwmIter self) { return self; }) + .def("__next__", &MwmIter::Next) + .def("next", &MwmIter::Next); + + bp::class_("Mwm", bp::init()) + .def("version", &Mwm::GetVersion, bp::return_internal_reference<>()) + .def("type", &Mwm::GetType) + .def("bounds", &Mwm::GetBounds) + .def("sections_info", &Mwm::GetSectionsInfo) + .def("__iter__", &Mwm::MakeMwmIter) + .def("__len__", &Mwm::Size); + } + { + bp::scope classifNamespace = bp::class_("classif"); + + bp::def( + "readable_type", +[](uint32_t t) { return classif().GetReadableObjectName(t); }); + } +} diff --git a/generator/utils.hpp b/generator/utils.hpp index b8c2108863..07f170936d 100644 --- a/generator/utils.hpp +++ b/generator/utils.hpp @@ -43,7 +43,7 @@ public: explicit SingleMwmDataSource(std::string const & mwmPath); DataSource & GetDataSource() { return m_dataSource; } - std::string GetPath(MapFileType type) const { return m_countryFile.GetPath(type); } + platform::LocalCountryFile const & GetLocalCountryFile() const { return m_countryFile; } MwmSet::MwmId const & GetMwmId() const { return m_mwmId; } private: diff --git a/indexer/editable_map_object.cpp b/indexer/editable_map_object.cpp index d307d03d1d..6df6fdbe82 100644 --- a/indexer/editable_map_object.cpp +++ b/indexer/editable_map_object.cpp @@ -301,11 +301,11 @@ string EditableMapObject::GetWikipedia() const void EditableMapObject::ForEachMetadataItem( bool skipSponsored, function const & fn) const { - for (auto const type : m_metadata.GetPresentTypes()) + for (auto const type : m_metadata.GetKeys()) { - if (skipSponsored && m_metadata.IsSponsoredType(static_cast(type))) + if (skipSponsored && m_metadata.IsSponsoredType(type)) continue; - auto const attributeName = ToString(static_cast(type)); + auto const attributeName = ToString(type); fn(attributeName, m_metadata.Get(type)); } } diff --git a/indexer/feature_meta.cpp b/indexer/feature_meta.cpp index 1e96878117..d6ead842e1 100644 --- a/indexer/feature_meta.cpp +++ b/indexer/feature_meta.cpp @@ -18,6 +18,17 @@ char constexpr const * kBaseWikiUrl = #endif } // namespace +std::vector Metadata::GetKeys() const +{ + std::vector types; + types.reserve(m_metadata.size()); + + for (auto const & item : m_metadata) + types.push_back(static_cast(item.first)); + + return types; +} + string Metadata::GetWikiURL() const { string v = this->Get(FMD_WIKIPEDIA); diff --git a/indexer/feature_meta.hpp b/indexer/feature_meta.hpp index 15c07945c5..dbf415d3b0 100644 --- a/indexer/feature_meta.hpp +++ b/indexer/feature_meta.hpp @@ -148,7 +148,16 @@ public: static bool TypeFromString(std::string const & osmTagKey, EType & outType); static bool IsSponsoredType(EType const & type); - void Set(EType type, std::string const & value) { MetadataBase::Set(type, value); } + std::vector GetKeys() const; + + using MetadataBase::Has; + using MetadataBase::Get; + bool Has(EType type) const { return MetadataBase::Has(static_cast(type)); } + std::string Get(EType type) const { return MetadataBase::Get(static_cast(type)); } + bool Get(EType type, std::string & value) const { return MetadataBase::Get(static_cast(type), value); } + + using MetadataBase::Set; + void Set(EType type, std::string const & value) { MetadataBase::Set(static_cast(type), value); } void Drop(EType type) { Set(type, std::string()); } std::string GetWikiURL() const; diff --git a/platform/mwm_version.cpp b/platform/mwm_version.cpp index 5315e8a8f4..4b99f13c22 100644 --- a/platform/mwm_version.cpp +++ b/platform/mwm_version.cpp @@ -13,6 +13,8 @@ #include "defines.hpp" +#include + namespace version { namespace @@ -69,6 +71,13 @@ std::string DebugPrint(Format f) return "v" + strings::to_string(static_cast(f) + 1); } +std::string DebugPrint(MwmVersion const & mwmVersion) +{ + std::stringstream s; + s << DebugPrint(mwmVersion.GetFormat()) << ":" << mwmVersion.GetSecondsSinceEpoch() << "s"; + return s.str(); +} + void WriteVersion(Writer & w, uint64_t secondsSinceEpoch) { w.Write(MWM_PROLOG, ARRAY_SIZE(MWM_PROLOG)); diff --git a/platform/mwm_version.hpp b/platform/mwm_version.hpp index 3da53f23d6..2235576285 100644 --- a/platform/mwm_version.hpp +++ b/platform/mwm_version.hpp @@ -53,6 +53,8 @@ private: uint64_t m_secondsSinceEpoch{0}; }; +std::string DebugPrint(MwmVersion const & mwmVersion); + /// Writes latest format and current timestamp to the writer. void WriteVersion(Writer & w, uint64_t secondsSinceEpoch);