diff --git a/indexer/mwm_set.cpp b/indexer/mwm_set.cpp index 164748f53a..b0224cc0c3 100644 --- a/indexer/mwm_set.cpp +++ b/indexer/mwm_set.cpp @@ -193,7 +193,8 @@ unique_ptr MwmSet::LockValue(MwmId const & id) unique_ptr MwmSet::LockValueImpl(MwmId const & id) { - CHECK(id.IsAlive(), (id)); + if (!id.IsAlive()) + return nullptr; shared_ptr info = id.GetInfo(); // It's better to return valid "value pointer" even for "out-of-date" files, diff --git a/search/intermediate_result.cpp b/search/intermediate_result.cpp index 9737bba17e..cac42bc674 100644 --- a/search/intermediate_result.cpp +++ b/search/intermediate_result.cpp @@ -54,78 +54,36 @@ void ProcessMetadata(FeatureType const & ft, Result::Metadata & meta) namespace impl { - -template bool LessRankT(T const & r1, T const & r2) -{ - if (r1.m_rank != r2.m_rank) - return (r1.m_rank > r2.m_rank); - - return (r1.m_distance < r2.m_distance); -} - -template bool LessDistanceT(T const & r1, T const & r2) -{ - if (r1.m_distance != r2.m_distance) - return (r1.m_distance < r2.m_distance); - - return (r1.m_rank > r2.m_rank); -} - -PreResult1::PreResult1(FeatureID const & fID, uint8_t rank, m2::PointD const & center, - m2::PointD const & pivot, int8_t viewportID) - : m_id(fID), - m_center(center), - m_rank(rank), - m_viewportID(viewportID) +PreResult1::PreResult1(FeatureID const & fID, uint8_t rank, double priority, int8_t viewportID) + : m_id(fID), m_priority(priority), m_rank(rank), m_viewportID(viewportID) { ASSERT(m_id.IsValid(), ()); - - CalcParams(pivot); } -PreResult1::PreResult1(m2::PointD const & center, m2::PointD const & pivot) - : m_center(center) -{ - CalcParams(pivot); -} - -namespace -{ - -void AssertValid(m2::PointD const & p) -{ - ASSERT ( my::between_s(-180.0, 180.0, p.x), (p.x) ); - ASSERT ( my::between_s(-180.0, 180.0, p.y), (p.y) ); -} - -} - -void PreResult1::CalcParams(m2::PointD const & pivot) -{ - AssertValid(m_center); - m_distance = PointDistance(m_center, pivot); -} +PreResult1::PreResult1(double priority) : m_priority(priority) {} +// static bool PreResult1::LessRank(PreResult1 const & r1, PreResult1 const & r2) { - return LessRankT(r1, r2); + if (r1.m_rank != r2.m_rank) + return r1.m_rank > r2.m_rank; + return r1.m_priority < r2.m_priority; } -bool PreResult1::LessDistance(PreResult1 const & r1, PreResult1 const & r2) +// static +bool PreResult1::LessPriority(PreResult1 const & r1, PreResult1 const & r2) { - return LessDistanceT(r1, r2); + if (r1.m_priority != r2.m_priority) + return r1.m_priority < r2.m_priority; + return r1.m_rank > r2.m_rank; } +// static bool PreResult1::LessPointsForViewport(PreResult1 const & r1, PreResult1 const & r2) { return r1.m_id < r2.m_id; } -void PreResult2::CalcParams(m2::PointD const & pivot) -{ - m_distance = PointDistance(GetCenter(), pivot); -} - PreResult2::PreResult2(FeatureType const & f, PreResult1 const * p, m2::PointD const & pivot, string const & displayName, string const & fileName) : m_id(f.GetID()), @@ -142,16 +100,10 @@ PreResult2::PreResult2(FeatureType const & f, PreResult1 const * p, m2::PointD c m_rank = p ? p->GetRank() : 0; m2::PointD fCenter; - if (p && f.GetFeatureType() != feature::GEOM_POINT) - { - // Optimization tip - use precalculated center point if possible. - fCenter = p->GetCenter(); - } - else - fCenter = f.GetLimitRect(FeatureType::WORST_GEOMETRY).Center(); + fCenter = f.GetLimitRect(FeatureType::WORST_GEOMETRY).Center(); m_region.SetParams(fileName, fCenter); - CalcParams(pivot); + m_distance = PointDistance(GetCenter(), pivot); ProcessMetadata(f, m_metadata); } @@ -248,14 +200,20 @@ Result PreResult2::GeneratePointResult(CategoriesHolder const * pCat, set r2.m_rank; + return r1.m_distance < r2.m_distance; } +// static bool PreResult2::LessDistance(PreResult2 const & r1, PreResult2 const & r2) { - return LessDistanceT(r1, r2); + if (r1.m_distance != r2.m_distance) + return r1.m_distance < r2.m_distance; + return r1.m_rank > r2.m_rank; } bool PreResult2::StrictEqualF::operator() (PreResult2 const & r) const diff --git a/search/intermediate_result.hpp b/search/intermediate_result.hpp index 6e076e4b6e..ef050857b6 100644 --- a/search/intermediate_result.hpp +++ b/search/intermediate_result.hpp @@ -17,37 +17,26 @@ namespace search { namespace impl { - -template bool LessRankT(T const & r1, T const & r2); -template bool LessDistanceT(T const & r1, T const & r2); - /// First pass results class. Objects are creating during search in trie. /// Works fast without feature loading and provide ranking. class PreResult1 { friend class PreResult2; - template friend bool LessRankT(T const & r1, T const & r2); - template friend bool LessDistanceT(T const & r1, T const & r2); FeatureID m_id; - m2::PointD m_center; - double m_distance; + double m_priority; uint8_t m_rank; int8_t m_viewportID; - void CalcParams(m2::PointD const & pivot); - public: - PreResult1(FeatureID const & fID, uint8_t rank, m2::PointD const & center, - m2::PointD const & pivot, int8_t viewportID); - PreResult1(m2::PointD const & center, m2::PointD const & pivot); + PreResult1(FeatureID const & fID, uint8_t rank, double priority, int8_t viewportID); + PreResult1(double priority); static bool LessRank(PreResult1 const & r1, PreResult1 const & r2); - static bool LessDistance(PreResult1 const & r1, PreResult1 const & r2); + static bool LessPriority(PreResult1 const & r1, PreResult1 const & r2); static bool LessPointsForViewport(PreResult1 const & r1, PreResult1 const & r2); inline FeatureID GetID() const { return m_id; } - inline m2::PointD GetCenter() const { return m_center; } inline uint8_t GetRank() const { return m_rank; } inline int8_t GetViewportID() const { return m_viewportID; } }; @@ -59,8 +48,6 @@ class PreResult2 { friend class PreResult2Maker; - void CalcParams(m2::PointD const & pivot); - public: enum ResultType { @@ -124,9 +111,6 @@ public: inline feature::TypesHolder const & GetTypes() const { return m_types; } private: - template friend bool LessRankT(T const & r1, T const & r2); - template friend bool LessDistanceT(T const & r1, T const & r2); - bool IsEqualCommon(PreResult2 const & r) const; string ReadableFeatureType(CategoriesHolder const * pCat, diff --git a/search/locality.cpp b/search/locality.cpp new file mode 100644 index 0000000000..d07240528d --- /dev/null +++ b/search/locality.cpp @@ -0,0 +1,117 @@ +#include "search/locality.hpp" + +#include "indexer/search_delimiters.hpp" +#include "indexer/search_string_utils.hpp" + +#include "base/assert.hpp" + +#include "std/algorithm.hpp" + +namespace search +{ +Locality::Locality() : m_type(ftypes::NONE), m_featureId(-1), m_rank(-1), m_radius(0) {} + +Locality::Locality(ftypes::Type type, uint32_t featureId, m2::PointD const & center, uint8_t rank) + : m_type(type), m_featureId(featureId), m_center(center), m_rank(rank), m_radius(0) +{ +} + +bool Locality::IsValid() const +{ + if (m_type == ftypes::NONE) + return false; + ASSERT(!m_matchedTokens.empty(), ()); + return true; +} + +bool Locality::IsSuitable(TTokensArray const & tokens, TToken const & prefix) const +{ + bool const isMatched = IsFullNameMatched(); + + // Do filtering of possible localities. + using namespace ftypes; + + switch (m_type) + { + case STATE: // we process USA, Canada states only for now + // USA states has 2-symbol synonyms + return (isMatched || GetSynonymTokenLength(tokens, prefix) == 2); + + case COUNTRY: + // USA has synonyms: "US" or "USA" + return (isMatched || (m_enName == "usa" && GetSynonymTokenLength(tokens, prefix) <= 3) || + (m_enName == "uk" && GetSynonymTokenLength(tokens, prefix) == 2)); + + case CITY: + // need full name match for cities + return isMatched; + + default: + ASSERT(false, ()); + return false; + } +} + +void Locality::Swap(Locality & rhs) +{ + using std::swap; + + m_name.swap(rhs.m_name); + m_enName.swap(rhs.m_enName); + m_matchedTokens.swap(rhs.m_matchedTokens); + + swap(m_type, rhs.m_type); + swap(m_featureId, rhs.m_featureId); + swap(m_center, rhs.m_center); + swap(m_rank, rhs.m_rank); + swap(m_radius, rhs.m_radius); +} + +bool Locality::operator<(Locality const & rhs) const +{ + if (m_type != rhs.m_type) + return (m_type < rhs.m_type); + + if (m_matchedTokens.size() != rhs.m_matchedTokens.size()) + return (m_matchedTokens.size() < rhs.m_matchedTokens.size()); + + return m_rank < rhs.m_rank; +} + +bool Locality::IsFullNameMatched() const +{ + size_t count = 0; + SplitUniString(NormalizeAndSimplifyString(m_name), [&count](strings::UniString const &) + { + ++count; + }, + search::Delimiters()); + return count <= m_matchedTokens.size(); +} + +size_t Locality::GetSynonymTokenLength(TTokensArray const & tokens, TToken const & prefix) const +{ + // check only one token as a synonym + if (m_matchedTokens.size() == 1) + { + size_t const index = m_matchedTokens[0]; + if (index < tokens.size()) + return tokens[index].size(); + ASSERT_EQUAL(index, tokens.size(), ()); + ASSERT(!prefix.empty(), ()); + return prefix.size(); + } + + return size_t(-1); +} + +string DebugPrint(Locality const & l) +{ + stringstream ss; + ss << "{ Locality: " + << "Name = " + l.m_name << "; Name English = " << l.m_enName + << "; Rank = " << static_cast(l.m_rank) + << "; Matched: " << l.m_matchedTokens.size() << " }"; + return ss.str(); +} +} // namespace search diff --git a/search/locality.hpp b/search/locality.hpp new file mode 100644 index 0000000000..481aff060f --- /dev/null +++ b/search/locality.hpp @@ -0,0 +1,51 @@ +#pragma once + +#include "indexer/ftypes_matcher.hpp" +#include "indexer/search_trie.hpp" + +#include "base/buffer_vector.hpp" +#include "base/string_utils.hpp" + +#include "std/string.hpp" +#include "std/vector.hpp" + +namespace search +{ +struct Locality +{ + using TToken = strings::UniString; + using TTokensArray = buffer_vector; + + // Native and English names of locality. + string m_name; + string m_enName; + + // Indexes of matched tokens for locality. + vector m_matchedTokens; + + ftypes::Type m_type; + uint32_t m_featureId; + m2::PointD m_center; + uint8_t m_rank; + double m_radius; + + Locality(); + + Locality(ftypes::Type type, uint32_t featureId, m2::PointD const & center, uint8_t rank); + + bool IsValid() const; + + bool IsSuitable(TTokensArray const & tokens, TToken const & prefix) const; + + void Swap(Locality & rhs); + + bool operator<(Locality const & rhs) const; + +private: + bool IsFullNameMatched() const; + + size_t GetSynonymTokenLength(TTokensArray const & tokens, TToken const & prefix) const; +}; + +string DebugPrint(Locality const & l); +} // namespace search diff --git a/search/region.cpp b/search/region.cpp new file mode 100644 index 0000000000..4c7f4291fe --- /dev/null +++ b/search/region.cpp @@ -0,0 +1,35 @@ +#include "search/region.hpp" + +#include "base/assert.hpp" + +namespace search +{ +bool Region::operator<(Region const & rhs) const +{ + return (m_matchedTokens.size() < rhs.m_matchedTokens.size()); +} + +bool Region::IsValid() const +{ + if (m_ids.empty()) + return false; + ASSERT(!m_matchedTokens.empty(), ()); + ASSERT(!m_enName.empty(), ()); + return true; +} + +void Region::Swap(Region & rhs) +{ + m_ids.swap(rhs.m_ids); + m_matchedTokens.swap(rhs.m_matchedTokens); + m_enName.swap(rhs.m_enName); +} + +string DebugPrint(Region const & r) +{ + string res("Region: "); + res += "Name English: " + r.m_enName; + res += "; Matched: " + ::DebugPrint(r.m_matchedTokens.size()); + return res; +} +} // namespace search diff --git a/search/region.hpp b/search/region.hpp new file mode 100644 index 0000000000..5e830292c7 --- /dev/null +++ b/search/region.hpp @@ -0,0 +1,22 @@ +#pragma once + +#include "std/string.hpp" +#include "std/vector.hpp" + +namespace search +{ +struct Region +{ + vector m_ids; + vector m_matchedTokens; + string m_enName; + + bool IsValid() const; + + void Swap(Region & rhs); + + bool operator<(Region const & rhs) const; +}; + +string DebugPrint(Region const & r); +} // namespace search diff --git a/search/retrieval.cpp b/search/retrieval.cpp index 204dd8f335..9a020cc2f8 100644 --- a/search/retrieval.cpp +++ b/search/retrieval.cpp @@ -357,6 +357,8 @@ bool Retrieval::RetrieveForScale(double scale, Callback & callback) } bucket.m_intersectsWithViewport = true; + if (bucket.m_addressFeatures.empty()) + bucket.m_finished = true; } ASSERT_LESS_OR_EQUAL(bucket.m_featuresReported, bucket.m_addressFeatures.size(), ()); diff --git a/search/search.pro b/search/search.pro index f249443347..6b8ee9b95e 100644 --- a/search/search.pro +++ b/search/search.pro @@ -19,9 +19,11 @@ HEADERS += \ keyword_lang_matcher.hpp \ keyword_matcher.hpp \ latlon_match.hpp \ + locality.hpp \ locality_finder.hpp \ params.hpp \ query_saver.hpp \ + region.hpp \ result.hpp \ retrieval.hpp \ search_common.hpp \ @@ -40,9 +42,11 @@ SOURCES += \ keyword_lang_matcher.cpp \ keyword_matcher.cpp \ latlon_match.cpp \ + locality.cpp \ locality_finder.cpp \ params.cpp \ query_saver.cpp \ + region.cpp \ result.cpp \ retrieval.cpp \ search_engine.cpp \ diff --git a/search/search_engine.cpp b/search/search_engine.cpp index 13e27f5541..e59e537762 100644 --- a/search/search_engine.cpp +++ b/search/search_engine.cpp @@ -102,8 +102,7 @@ void SendStatistics(SearchParams const & params, m2::RectD const & viewport, Res Engine::Engine(Index & index, Reader * categoriesR, storage::CountryInfoGetter const & infoGetter, string const & locale, unique_ptr && factory) - : m_factory(move(factory)) - , m_data(make_unique(categoriesR)) + : m_factory(move(factory)), m_data(new EngineData(pCategoriesR)) { m_isReadyThread.clear(); @@ -217,15 +216,12 @@ void Engine::SearchAsync() // Get current search params. SearchParams params; m2::RectD viewport; - bool oneTimeSearch = false; { threads::MutexGuard updateGuard(m_updateMutex); params = m_params; - if (params.GetSearchRect(viewport)) - oneTimeSearch = true; - else + if (!params.GetSearchRect(viewport)) viewport = m_viewport; } @@ -246,7 +242,7 @@ void Engine::SearchAsync() Results res; - // Call m_query->IsCancelled() everywhere it needed without storing + // Call m_pQuery->IsCancelled() everywhere it needed without storing // return value. This flag can be changed from another thread. m_query->SearchCoordinates(params.m_query, res); @@ -258,54 +254,22 @@ void Engine::SearchAsync() if (viewportSearch) { - m_query->SetViewport(viewport, true); + m_query->SetViewport(viewport, true /* forceUpdate */); m_query->SearchViewportPoints(res); - - if (res.GetCount() > 0) - EmitResults(params, res); } else { - while (!m_query->IsCancelled()) - { - bool const isInflated = GetInflatedViewport(viewport); - size_t const oldCount = res.GetCount(); - - m_query->SetViewport(viewport, oneTimeSearch); - m_query->Search(res, RESULTS_COUNT); - - size_t const newCount = res.GetCount(); - bool const exit = (oneTimeSearch || !isInflated || newCount >= RESULTS_COUNT); - - if (exit || oldCount != newCount) - EmitResults(params, res); - - if (exit) - break; - } + m_query->SetViewport(viewport, params.IsSearchAroundPosition() /* forceUpdate */); + m_query->Search(res, RESULTS_COUNT); } + + if (res.GetCount() > 0) + EmitResults(params, res); } catch (Query::CancelException const &) { } - // Make additional search in whole mwm when not enough results (only for non-empty query). - size_t const count = res.GetCount(); - if (!viewportSearch && !m_query->IsCancelled() && count < RESULTS_COUNT) - { - try - { - m_query->SearchAdditional(res, RESULTS_COUNT); - } - catch (Query::CancelException const &) - { - } - - // Emit if we have more results. - if (res.GetCount() > count) - EmitResults(params, res); - } - if (!viewportSearch && !m_query->IsCancelled()) SendStatistics(params, viewport, res); diff --git a/search/search_engine.hpp b/search/search_engine.hpp index 394aa7cc0b..704f658844 100644 --- a/search/search_engine.hpp +++ b/search/search_engine.hpp @@ -32,8 +32,8 @@ class Engine typedef function SearchCallbackT; public: - // Doesn't take ownership of index. Takes ownership of pCategories - Engine(Index & index, Reader * categoriesR, storage::CountryInfoGetter const & infoGetter, + // Doesn't take ownership of @pIndex. Takes ownership of pCategories + Engine(Index & index, Reader * pCategoriesR, storage::CountryInfoGetter const & infoGetter, string const & locale, unique_ptr && factory); ~Engine(); diff --git a/search/search_query.cpp b/search/search_query.cpp index 7445c5b245..6d94750ff1 100644 --- a/search/search_query.cpp +++ b/search/search_query.cpp @@ -4,6 +4,8 @@ #include "geometry_utils.hpp" #include "indexed_value.hpp" #include "latlon_match.hpp" +#include "locality.hpp" +#include "region.hpp" #include "search_common.hpp" #include "search_query_params.hpp" #include "search_string_intersection.hpp" @@ -12,6 +14,9 @@ #include "indexer/categories_holder.hpp" #include "indexer/classificator.hpp" + +#include "indexer/feature.hpp" +#include "indexer/feature_algo.hpp" #include "indexer/feature_covering.hpp" #include "indexer/feature_impl.hpp" #include "indexer/features_vector.hpp" @@ -31,6 +36,14 @@ #include "std/algorithm.hpp" #include "std/function.hpp" +#include "std/iterator.hpp" + +#define LONG_OP(op) \ + { \ + if (IsCancelled()) \ + return; \ + op; \ + } namespace search { @@ -40,32 +53,115 @@ namespace using TCompareFunction1 = function; using TCompareFunction2 = function; +// Maximum result candidates count for each viewport/criteria. +size_t const kPreResultsCount = 200; + TCompareFunction1 g_arrCompare1[] = { - &impl::PreResult1::LessDistance, &impl::PreResult1::LessRank, + &impl::PreResult1::LessPriority, &impl::PreResult1::LessRank, }; TCompareFunction2 g_arrCompare2[] = { &impl::PreResult2::LessDistance, &impl::PreResult2::LessRank, }; - /// This indexes should match the initialization routine below. - int g_arrLang1[] = { 0, 1, 2, 2, 3 }; - int g_arrLang2[] = { 0, 0, 0, 1, 0 }; - enum LangIndexT { LANG_CURRENT = 0, - LANG_INPUT, - LANG_INTERNATIONAL, - LANG_EN, - LANG_DEFAULT, - LANG_COUNT }; +/// This indexes should match the initialization routine below. +int g_arrLang1[] = {0, 1, 2, 2, 3}; +int g_arrLang2[] = {0, 0, 0, 1, 0}; - pair GetLangIndex(int id) +enum LangIndexT +{ + LANG_CURRENT = 0, + LANG_INPUT, + LANG_INTERNATIONAL, + LANG_EN, + LANG_DEFAULT, + LANG_COUNT +}; + +pair GetLangIndex(int id) +{ + ASSERT_LESS(id, LANG_COUNT, ()); + return make_pair(g_arrLang1[id], g_arrLang2[id]); +} + +m2::PointD GetLocalityCenter(Index const & index, MwmSet::MwmId const & id, + Locality const & locality) +{ + Index::FeaturesLoaderGuard loader(index, id); + FeatureType feature; + loader.GetFeatureByIndex(locality.m_featureId, feature); + return feature::GetCenter(feature, FeatureType::WORST_GEOMETRY); +} + +ftypes::Type GetLocalityIndex(feature::TypesHolder const & types) +{ + using namespace ftypes; + + // Inner logic of SearchAddress expects COUNTRY, STATE and CITY only. + Type const type = IsLocalityChecker::Instance().GetType(types); + switch (type) { - ASSERT_LESS ( id, LANG_COUNT, () ); - return make_pair(g_arrLang1[id], g_arrLang2[id]); + case TOWN: + return CITY; + case VILLAGE: + return NONE; + default: + return type; } +} - // Maximum result candidates count for each viewport/criteria. - size_t const kPreResultsCount = 200; +class IndexedValue : public search::IndexedValueBase +{ + friend string DebugPrint(IndexedValue const & value); + + /// @todo Do not use shared_ptr for optimization issues. + /// Need to rewrite std::unique algorithm. + shared_ptr m_val; + +public: + explicit IndexedValue(impl::PreResult2 * v) : m_val(v) {} + + impl::PreResult2 const & operator*() const { return *m_val; } +}; + +string DebugPrint(IndexedValue const & value) +{ + string index; + for (auto const & i : value.m_ind) + index.append(" " + strings::to_string(i)); + return impl::DebugPrint(*value.m_val) + "; Index:" + index; +} + +void RemoveDuplicatingLinear(vector & indV) +{ + impl::PreResult2::LessLinearTypesF lessCmp; + impl::PreResult2::EqualLinearTypesF equalCmp; + + sort(indV.begin(), indV.end(), + [&lessCmp](IndexedValue const & lhs, IndexedValue const & rhs) + { + return lessCmp(*lhs, *rhs); + }); + + indV.erase(unique(indV.begin(), indV.end(), + [&equalCmp](IndexedValue const & lhs, IndexedValue const & rhs) + { + return equalCmp(*lhs, *rhs); + }), + indV.end()); +} +} // namespace + +Query::RetrievalCallback::RetrievalCallback(Query & query, ViewportID viewportId) + : m_query(query), m_viewportId(viewportId) +{ +} + +void Query::RetrievalCallback::OnFeaturesRetrieved(MwmSet::MwmId const & id, double scale, + vector const & featureIds) +{ + for (auto const & featureId : featureIds) + m_query.AddPreResult1(id, featureId, 0 /* rank */, scale, m_viewportId); } Query::Query(Index & index, CategoriesHolder const & categories, vector const & suggests, @@ -82,8 +178,6 @@ Query::Query(Index & index, CategoriesHolder const & categories, vector #endif , m_worldSearch(true) { - // m_viewport is initialized as empty rects - // Results queue's initialization. static_assert(kQueuesCount == ARRAY_SIZE(g_arrCompare1), ""); static_assert(kQueuesCount == ARRAY_SIZE(g_arrCompare2), ""); @@ -107,6 +201,18 @@ Query::Query(Index & index, CategoriesHolder const & categories, vector SetPreferredLocale("en"); } +void Query::Reset() +{ + Cancellable::Reset(); + m_retrieval.Reset(); +} + +void Query::Cancel() +{ + Cancellable::Cancel(); + m_retrieval.Cancel(); +} + void Query::SetLanguage(int id, int8_t lang) { m_keywordsScorer.SetLanguage(GetLangIndex(id), lang); @@ -161,7 +267,6 @@ void Query::SetViewportByIndex(TMWMVector const & mwmsInfo, m2::RectD const & vi } m_viewport[idx] = viewport; - UpdateViewportOffsets(mwmsInfo, viewport, m_offsetsInViewport[idx]); #ifdef FIND_LOCALITY_TEST m_locality.SetViewportByIndex(viewport, idx); @@ -233,68 +338,9 @@ void Query::ClearCaches() void Query::ClearCache(size_t ind) { - // clear cache and free memory - TOffsetsVector emptyV; - emptyV.swap(m_offsetsInViewport[ind]); - m_viewport[ind].MakeEmpty(); } -void Query::UpdateViewportOffsets(TMWMVector const & mwmsInfo, m2::RectD const & rect, - TOffsetsVector & offsets) -{ - offsets.clear(); - - int const queryScale = GetQueryIndexScale(rect); - covering::CoveringGetter cov(rect, covering::ViewportWithLowLevels); - - for (shared_ptr const & info : mwmsInfo) - { - // Search only mwms that intersect with viewport (world always does). - if (rect.IsIntersect(info->m_limitRect)) - { - MwmSet::MwmId mwmId(info); - Index::MwmHandle const mwmHandle = m_index.GetMwmHandleById(mwmId); - if (MwmValue const * pMwm = mwmHandle.GetValue()) - { - TFHeader const & header = pMwm->GetHeader(); - if (header.GetType() == TFHeader::country) - { - pair const scaleR = header.GetScaleRange(); - int const scale = min(max(queryScale, scaleR.first), scaleR.second); - - covering::IntervalsT const & interval = cov.Get(header.GetLastScale()); - - ScaleIndex index(pMwm->m_cont.GetReader(INDEX_FILE_TAG), - pMwm->m_factory); - - for (size_t i = 0; i < interval.size(); ++i) - { - auto collectFn = MakeBackInsertFunctor(offsets[mwmId]); - index.ForEachInIntervalAndScale(collectFn, interval[i].first, interval[i].second, scale); - } - - sort(offsets[mwmId].begin(), offsets[mwmId].end()); - } - } - } - } - -#ifdef DEBUG - size_t offsetsCached = 0; - for (shared_ptr const & info : mwmsInfo) - { - MwmSet::MwmId mwmId(info); - auto const it = offsets.find(mwmId); - if (it != offsets.end()) - offsetsCached += it->second.size(); - } - - LOG(LDEBUG, ("For search in viewport cached mwms:", mwmsInfo.size(), - "offsets:", offsetsCached)); -#endif -} - void Query::Init(bool viewportSearch) { Reset(); @@ -448,6 +494,48 @@ void Query::SetQuery(string const & query) }); } +void Query::Search(Results & res, size_t resCount) +{ + LOG(LINFO, ("Query::Search")); + if (IsCancelled()) + return; + + if (m_tokens.empty()) + SuggestStrings(res); + + LONG_OP(SearchAddress(res)); + LONG_OP(SearchFeatures()); + LONG_OP(FlushResults(res, false, resCount)); +} + +void Query::SearchViewportPoints(Results & res) +{ + LOG(LINFO, ("Query::SearchViewportPoints")); + LONG_OP(SearchAddress(res)); + LONG_OP(SearchFeaturesInViewport(CURRENT_V)); + + vector indV; + vector streets; + + MakePreResult2(indV, streets); + if (indV.empty()) + return; + + RemoveDuplicatingLinear(indV); + +#ifdef HOUSE_SEARCH_TEST + FlushHouses(res, false, streets); +#endif + + for (size_t i = 0; i < indV.size(); ++i) + { + if (IsCancelled()) + break; + res.AddResultNoChecks( + (*(indV[i])).GeneratePointResult(&m_categories, &m_prefferedTypes, m_currentLocaleCode)); + } +} + void Query::SearchCoordinates(string const & query, Results & res) const { double lat, lon; @@ -458,192 +546,97 @@ void Query::SearchCoordinates(string const & query, Results & res) const } } -void Query::Search(Results & res, size_t resCount) -{ - if (IsCancelled()) - return; - - if (m_tokens.empty()) - SuggestStrings(res); - - if (IsCancelled()) - return; - SearchAddress(res); - - if (IsCancelled()) - return; - SearchFeatures(); - - if (IsCancelled()) - return; - FlushResults(res, false, resCount); -} - namespace { - /// @name Functors to convert pointers to referencies. - /// Pass them to stl algorithms. - //@{ -template -class ProxyFunctor1 +struct CompFactory2 +{ + struct CompT { - TFunctor m_fn; - - public: + TCompareFunction2 m_fn; + explicit CompT(TCompareFunction2 fn) : m_fn(fn) {} template - explicit ProxyFunctor1(T const & p) : m_fn(*p) {} - - template - bool operator()(T const & p) { return m_fn(*p); } - }; - - template - class ProxyFunctor2 - { - TFunctor m_fn; - - public: - template - bool operator()(T const & p1, T const & p2) + bool operator()(T const & r1, T const & r2) const { - return m_fn(*p1, *p2); - } - }; - //@} - - class IndexedValue : public search::IndexedValueBase - { - using ValueT = impl::PreResult2; - - /// @todo Do not use shared_ptr for optimization issues. - /// Need to rewrite std::unique algorithm. - shared_ptr m_val; - - public: - explicit IndexedValue(ValueT * v) : m_val(v) {} - - ValueT const & operator*() const { return *m_val; } - ValueT const * operator->() const { return m_val.get(); } - - string DebugPrint() const - { - string index; - for (size_t i = 0; i < SIZE; ++i) - index = index + " " + strings::to_string(m_ind[i]); - - return impl::DebugPrint(*m_val) + "; Index:" + index; + return m_fn(*r1, *r2); } }; - inline string DebugPrint(IndexedValue const & t) - { - return t.DebugPrint(); - } + static size_t const SIZE = 2; - struct CompFactory2 - { - struct CompT - { - TCompareFunction2 m_fn; - explicit CompT(TCompareFunction2 fn) : m_fn(fn) {} - template - bool operator()(T const & r1, T const & r2) const - { - return m_fn(*r1, *r2); - } - }; + CompT Get(size_t i) { return CompT(g_arrCompare2[i]); } +}; - static size_t const SIZE = 2; +struct LessFeatureID +{ + using ValueT = impl::PreResult1; + bool operator()(ValueT const & r1, ValueT const & r2) const { return (r1.GetID() < r2.GetID()); } +}; - CompT Get(size_t i) { return CompT(g_arrCompare2[i]); } - }; +class EqualFeatureID +{ + using ValueT = impl::PreResult1; + ValueT const & m_val; - struct LessFeatureID - { - using ValueT = impl::PreResult1; - bool operator() (ValueT const & r1, ValueT const & r2) const - { - return (r1.GetID() < r2.GetID()); - } - }; +public: + EqualFeatureID(ValueT const & v) : m_val(v) {} + bool operator()(ValueT const & r) const { return (m_val.GetID() == r.GetID()); } +}; - class EqualFeatureID - { - using ValueT = impl::PreResult1; - ValueT const & m_val; - public: - EqualFeatureID(ValueT const & v) : m_val(v) {} - bool operator() (ValueT const & r) const - { - return (m_val.GetID() == r.GetID()); - } - }; - - template - void RemoveDuplicatingLinear(vector & indV) - { - sort(indV.begin(), indV.end(), ProxyFunctor2()); - indV.erase(unique(indV.begin(), indV.end(), - ProxyFunctor2()), - indV.end()); - } - - template - bool IsResultExists(impl::PreResult2 const * p, vector const & indV) - { - // do not insert duplicating results - return (indV.end() != find_if(indV.begin(), indV.end(), - ProxyFunctor1(p))); - } +bool IsResultExists(impl::PreResult2 const * p, vector const & indV) +{ + impl::PreResult2::StrictEqualF equalCmp(*p); + // Do not insert duplicating results. + return indV.end() != find_if(indV.begin(), indV.end(), [&equalCmp](IndexedValue const & iv) + { + return equalCmp(*iv); + }); } +} // namespace namespace impl { - class PreResult2Maker +class PreResult2Maker +{ + Query & m_query; + + unique_ptr m_pFV; + + // For the best performance, incoming id's should be sorted by id.first (mwm file id). + void LoadFeature(FeatureID const & id, FeatureType & f, string & name, string & country) { - Query & m_query; + if (m_pFV.get() == 0 || m_pFV->GetId() != id.m_mwmId) + m_pFV.reset(new Index::FeaturesLoaderGuard(m_query.m_index, id.m_mwmId)); - unique_ptr m_pFV; + m_pFV->GetFeatureByIndex(id.m_index, f); + f.SetID(id); - // For the best performance, incoming id's should be sorted by id.first (mwm file id). - void LoadFeature(FeatureID const & id, FeatureType & f, string & name, string & country) + m_query.GetBestMatchName(f, name); + + // country (region) name is a file name if feature isn't from World.mwm + if (m_pFV->IsWorld()) + country.clear(); + else + country = m_pFV->GetCountryFileName(); + } + +public: + PreResult2Maker(Query & q) : m_query(q) {} + + impl::PreResult2 * operator()(impl::PreResult1 const & res) + { + FeatureType feature; + string name, country; + LoadFeature(res.GetID(), feature, name, country); + + Query::ViewportID const viewportID = static_cast(res.GetViewportID()); + impl::PreResult2 * res2 = + new impl::PreResult2(feature, &res, m_query.GetPosition(viewportID), name, country); + + /// @todo: add exluding of states (without USA states), continents + using namespace ftypes; + Type const tp = IsLocalityChecker::Instance().GetType(res2->m_types); + switch (tp) { - if (m_pFV.get() == 0 || m_pFV->GetId() != id.m_mwmId) - m_pFV.reset(new Index::FeaturesLoaderGuard(m_query.m_index, id.m_mwmId)); - - m_pFV->GetFeatureByIndex(id.m_index, f); - f.SetID(id); - - m_query.GetBestMatchName(f, name); - - // country (region) name is a file name if feature isn't from World.mwm - if (m_pFV->IsWorld()) - country.clear(); - else - country = m_pFV->GetCountryFileName(); - } - - public: - PreResult2Maker(Query & q) : m_query(q) - { - } - - impl::PreResult2 * operator() (impl::PreResult1 const & res) - { - FeatureType feature; - string name, country; - LoadFeature(res.GetID(), feature, name, country); - - Query::ViewportID const viewportID = static_cast(res.GetViewportID()); - impl::PreResult2 * res2 = new impl::PreResult2(feature, &res, - m_query.GetPosition(viewportID), - name, country); - - /// @todo: add exluding of states (without USA states), continents - using namespace ftypes; - Type const tp = IsLocalityChecker::Instance().GetType(res2->m_types); - switch (tp) - { case COUNTRY: res2->m_rank /= 1.5; break; @@ -664,53 +657,53 @@ namespace impl break; default: break; - } - - return res2; } - impl::PreResult2 * operator() (FeatureID const & id) - { - FeatureType feature; - string name, country; - LoadFeature(id, feature, name, country); + return res2; + } - if (!name.empty() && !country.empty()) - return new impl::PreResult2(feature, 0, m_query.GetPosition(), name, country); - else - return 0; - } - }; - - class HouseCompFactory + impl::PreResult2 * operator()(FeatureID const & id) { - Query const & m_query; + FeatureType feature; + string name, country; + LoadFeature(id, feature, name, country); - bool LessDistance(HouseResult const & r1, HouseResult const & r2) const + if (!name.empty() && !country.empty()) + return new impl::PreResult2(feature, 0, m_query.GetPosition(), name, country); + else + return 0; + } +}; + +class HouseCompFactory +{ + Query const & m_query; + + bool LessDistance(HouseResult const & r1, HouseResult const & r2) const + { + return (PointDistance(m_query.m_pivot, r1.GetOrg()) < + PointDistance(m_query.m_pivot, r2.GetOrg())); + } + +public: + HouseCompFactory(Query const & q) : m_query(q) {} + + struct CompT + { + HouseCompFactory const * m_parent; + + CompT(HouseCompFactory const * parent) : m_parent(parent) {} + bool operator()(HouseResult const & r1, HouseResult const & r2) const { - return (PointDistance(m_query.m_pivot, r1.GetOrg()) < - PointDistance(m_query.m_pivot, r2.GetOrg())); + return m_parent->LessDistance(r1, r2); } - - public: - HouseCompFactory(Query const & q) : m_query(q) {} - - struct CompT - { - HouseCompFactory const * m_parent; - - CompT(HouseCompFactory const * parent) : m_parent(parent) {} - bool operator() (HouseResult const & r1, HouseResult const & r2) const - { - return m_parent->LessDistance(r1, r2); - } - }; - - static size_t const SIZE = 1; - - CompT Get(size_t) { return CompT(this); } }; -} + + static size_t const SIZE = 1; + + CompT Get(size_t) { return CompT(this); } +}; +} // namespace impl template void Query::MakePreResult2(vector & cont, vector & streets) @@ -808,62 +801,11 @@ void Query::FlushResults(Results & res, bool allMWMs, size_t resCount) } } -void Query::SearchViewportPoints(Results & res) -{ - if (IsCancelled()) - return; - SearchAddress(res); - - if (IsCancelled()) - return; - SearchFeatures(); - - vector indV; - vector streets; - - MakePreResult2(indV, streets); - - if (indV.empty()) - return; - - RemoveDuplicatingLinear(indV); - -#ifdef HOUSE_SEARCH_TEST - FlushHouses(res, false, streets); -#endif - - for (size_t i = 0; i < indV.size(); ++i) - { - if (IsCancelled()) - break; - - res.AddResultNoChecks( - indV[i]->GeneratePointResult(&m_categories, &m_prefferedTypes, m_currentLocaleCode)); - } -} - int Query::GetQueryIndexScale(m2::RectD const & viewport) const { return search::GetQueryIndexScale(viewport); } -ftypes::Type Query::GetLocalityIndex(feature::TypesHolder const & types) const -{ - using namespace ftypes; - - // Inner logic of SearchAddress expects COUNTRY, STATE and CITY only. - Type const type = IsLocalityChecker::Instance().GetType(types); - switch (type) - { - case TOWN: - return CITY; - case VILLAGE: - return NONE; - default: - return type; - } -} - void Query::RemoveStringPrefix(string const & str, string & res) const { search::Delimiters delims; @@ -951,28 +893,24 @@ void Query::ProcessSuggestions(vector & vec, Results & res) const } } -void Query::AddResultFromTrie(TTrieValue const & val, MwmSet::MwmId const & mwmID, - ViewportID vID /*= DEFAULT_V*/) +void Query::AddPreResult1(MwmSet::MwmId const & mwmId, uint32_t featureId, uint8_t rank, + double priority, ViewportID viewportId /*= DEFAULT_V*/) { - /// If we are in viewport search mode, check actual "point-in-viewport" criteria. - /// @todo Actually, this checks are more-like hack, but not a suitable place to do ... - if (m_queuesCount == 1 && vID == CURRENT_V && !m_viewport[CURRENT_V].IsPointInside(val.m_pt)) - return; - - impl::PreResult1 res(FeatureID(mwmID, val.m_featureId), val.m_rank, - val.m_pt, GetPosition(vID), vID); + impl::PreResult1 res(FeatureID(mwmId, featureId), rank, priority, viewportId); for (size_t i = 0; i < m_queuesCount; ++i) { // here can be the duplicates because of different language match (for suggest token) - if (m_results[i].end() == find_if(m_results[i].begin(), m_results[i].end(), EqualFeatureID(res))) + if (m_results[i].end() == + find_if(m_results[i].begin(), m_results[i].end(), EqualFeatureID(res))) + { m_results[i].push(res); + } } } namespace impl { - class BestNameFinder { KeywordLangMatcher::ScoreT m_score; @@ -995,8 +933,7 @@ public: return true; } }; - -} // namespace search::impl +} // namespace impl void Query::GetBestMatchName(FeatureType const & f, string & name) const { @@ -1284,182 +1221,6 @@ void Query::InitParams(bool localitySearch, SearchQueryParams & params) params.m_langs.insert(GetLanguage(i)); } -namespace impl -{ - struct Locality - { - string m_name, m_enName; ///< native name and english name of locality - Query::TTrieValue m_value; - vector m_matchedTokens; ///< indexes of matched tokens for locality - - ftypes::Type m_type; - double m_radius; - - Locality() : m_type(ftypes::NONE) {} - Locality(Query::TTrieValue const & val, ftypes::Type type) - : m_value(val), m_type(type), m_radius(0) - { - } - - bool IsValid() const - { - if (m_type != ftypes::NONE) - { - ASSERT ( !m_matchedTokens.empty(), () ); - return true; - } - else - return false; - } - - void Swap(Locality & rhs) - { - m_name.swap(rhs.m_name); - m_enName.swap(rhs.m_enName); - m_matchedTokens.swap(rhs.m_matchedTokens); - - using std::swap; - swap(m_value, rhs.m_value); - swap(m_type, rhs.m_type); - swap(m_radius, rhs.m_radius); - } - - bool operator< (Locality const & rhs) const - { - if (m_type != rhs.m_type) - return (m_type < rhs.m_type); - - if (m_matchedTokens.size() != rhs.m_matchedTokens.size()) - return (m_matchedTokens.size() < rhs.m_matchedTokens.size()); - - return (m_value.m_rank < rhs.m_value.m_rank); - } - - private: - class DoCount - { - size_t & m_count; - public: - DoCount(size_t & count) : m_count(count) { m_count = 0; } - - template - void operator()(T const &) { ++m_count; } - }; - - bool IsFullNameMatched() const - { - size_t count; - SplitUniString(NormalizeAndSimplifyString(m_name), DoCount(count), search::Delimiters()); - return (count <= m_matchedTokens.size()); - } - - using TString = strings::UniString; - using TTokensArray = buffer_vector; - - size_t GetSynonymTokenLength(TTokensArray const & tokens, TString const & prefix) const - { - // check only one token as a synonym - if (m_matchedTokens.size() == 1) - { - size_t const index = m_matchedTokens[0]; - if (index < tokens.size()) - return tokens[index].size(); - else - { - ASSERT_EQUAL ( index, tokens.size(), () ); - ASSERT ( !prefix.empty(), () ); - return prefix.size(); - } - } - - return size_t(-1); - } - - public: - /// Check that locality is suitable for source input tokens. - bool IsSuitable(TTokensArray const & tokens, TString const & prefix) const - { - bool const isMatched = IsFullNameMatched(); - - // Do filtering of possible localities. - using namespace ftypes; - - switch (m_type) - { - case STATE: // we process USA, Canada states only for now - // USA states has 2-symbol synonyms - return (isMatched || GetSynonymTokenLength(tokens, prefix) == 2); - - case COUNTRY: - // USA has synonyms: "US" or "USA" - return (isMatched || - (m_enName == "usa" && GetSynonymTokenLength(tokens, prefix) <= 3) || - (m_enName == "uk" && GetSynonymTokenLength(tokens, prefix) == 2)); - - case CITY: - // need full name match for cities - return isMatched; - - default: - ASSERT ( false, () ); - return false; - } - } - }; - - void swap(Locality & r1, Locality & r2) { r1.Swap(r2); } - - string DebugPrint(Locality const & l) - { - stringstream ss; - ss << "{ Locality: " << - "Name = " + l.m_name << - "; Name English = " << l.m_enName << - "; Rank = " << int(l.m_value.m_rank) << - "; Matched: " << l.m_matchedTokens.size() << " }"; - return ss.str(); - } - - struct Region - { - vector m_ids; - vector m_matchedTokens; - string m_enName; - - bool operator<(Region const & rhs) const - { - return (m_matchedTokens.size() < rhs.m_matchedTokens.size()); - } - - bool IsValid() const - { - if (!m_ids.empty()) - { - ASSERT ( !m_matchedTokens.empty(), () ); - ASSERT ( !m_enName.empty(), () ); - return true; - } - else - return false; - } - - void Swap(Region & rhs) - { - m_ids.swap(rhs.m_ids); - m_matchedTokens.swap(rhs.m_matchedTokens); - m_enName.swap(rhs.m_enName); - } - }; - - string DebugPrint(Region const & r) - { - string res("Region: "); - res += "Name English: " + r.m_enName; - res += "; Matched: " + ::DebugPrint(r.m_matchedTokens.size()); - return res; - } -} - void Query::SearchAddress(Results & res) { // Find World.mwm and do special search there. @@ -1474,8 +1235,8 @@ void Query::SearchAddress(Results & res) if (pMwm && pMwm->m_cont.IsExist(SEARCH_INDEX_FILE_TAG) && pMwm->GetHeader().GetType() == TFHeader::world) { - impl::Locality city; - impl::Region region; + Locality city; + Region region; SearchLocality(pMwm, city, region); if (city.IsValid()) @@ -1493,20 +1254,22 @@ void Query::SearchAddress(Results & res) { params.ProcessAddressTokens(); - m2::RectD const rect = MercatorBounds::RectByCenterXYAndSizeInMeters( - city.m_value.m_pt, city.m_radius); - SetViewportByIndex(mwmsInfo, rect, LOCALITY_V, false); + m2::PointD const cityCenter = GetLocalityCenter(m_index, mwmId, city); + double const cityRadius = city.m_radius; + m2::RectD const rect = + MercatorBounds::RectByCenterXYAndSizeInMeters(cityCenter, cityRadius); + SetViewportByIndex(mwmsInfo, rect, LOCALITY_V, false /* forceUpdate */); /// @todo Hack - do not search for address in World.mwm; Do it better in future. bool const b = m_worldSearch; m_worldSearch = false; - SearchFeatures(params, mwmsInfo, LOCALITY_V); + SearchFeaturesInViewport(params, mwmsInfo, LOCALITY_V); m_worldSearch = b; } else { // Add found locality as a result if nothing left to match. - AddResultFromTrie(city.m_value, mwmId); + AddPreResult1(mwmId, city.m_featureId, city.m_rank, 1.0 /* priority */); } } else if (region.IsValid()) @@ -1522,16 +1285,14 @@ void Query::SearchAddress(Results & res) if (!params.IsEmpty()) { - for (shared_ptr & info : mwmsInfo) + TMWMVector regionMwms; + auto regionMismatch = [this, ®ion](shared_ptr const & info) { - Index::MwmHandle const handle = m_index.GetMwmHandleById(info); - if (handle.IsAlive() && - m_infoGetter.IsBelongToRegions(handle.GetValue()->GetCountryFileName(), - region.m_ids)) - { - SearchInMWM(handle, params); - } - } + return !m_infoGetter.IsBelongToRegions(info->GetCountryName(), region.m_ids); + }; + remove_copy_if(mwmsInfo.begin(), mwmsInfo.end(), back_inserter(regionMwms), + regionMismatch); + SearchInMwms(regionMwms, params, DEFAULT_V); } } @@ -1542,221 +1303,216 @@ void Query::SearchAddress(Results & res) namespace impl { - class DoFindLocality +class DoFindLocality +{ + Query const & m_query; + + /// Index in array equal to Locality::m_type value. + vector m_localities[3]; + + FeaturesVector m_vector; + size_t m_index; ///< index of processing token + + int8_t m_lang; + int8_t m_arrEn[3]; + + /// Tanslates country full english name to mwm file name prefix + /// (need when matching correspondent mwm file in CountryInfoGetter::GetMatchedRegions). + //@{ + static bool FeatureName2FileNamePrefix(string & name, char const * prefix, char const * arr[], + size_t n) { - Query const & m_query; + for (size_t i = 0; i < n; ++i) + if (name.find(arr[i]) == string::npos) + return false; - /// Index in array equal to Locality::m_type value. - vector m_localities[3]; + name = prefix; + return true; + } - FeaturesVector m_vector; - size_t m_index; ///< index of processing token - - Locality * PushLocality(Locality const & l) - { - ASSERT ( 0 <= l.m_type && l.m_type <= ARRAY_SIZE(m_localities), (l.m_type) ); - m_localities[l.m_type].push_back(l); - return &(m_localities[l.m_type].back()); - } - - int8_t m_lang; - int8_t m_arrEn[3]; - - /// Tanslates country full english name to mwm file name prefix - /// (need when matching correspondent mwm file in CountryInfoGetter::GetMatchedRegions). - //@{ - static bool FeatureName2FileNamePrefix(string & name, char const * prefix, - char const * arr[], size_t n) - { - for (size_t i = 0; i < n; ++i) - if (name.find(arr[i]) == string::npos) - return false; - - name = prefix; - return true; - } - - void AssignEnglishName(FeatureType const & f, Locality & l) - { - // search for name in next order: "en", "int_name", "default" - for (int i = 0; i < 3; ++i) - if (f.GetName(m_arrEn[i], l.m_enName)) - { - // make name lower-case - strings::AsciiToLower(l.m_enName); - - char const * arrUSA[] = { "united", "states", "america" }; - char const * arrUK[] = { "united", "kingdom" }; - - if (!FeatureName2FileNamePrefix(l.m_enName, "usa", arrUSA, ARRAY_SIZE(arrUSA))) - if (!FeatureName2FileNamePrefix(l.m_enName, "uk", arrUK, ARRAY_SIZE(arrUK))) - return; - } - } - //@} - - void AddRegions(int index, vector & regions) const - { - // fill regions vector in priority order - vector const & arr = m_localities[index]; - for (auto i = arr.rbegin(); i != arr.rend(); ++i) + void AssignEnglishName(FeatureType const & f, Locality & l) + { + // search for name in next order: "en", "int_name", "default" + for (int i = 0; i < 3; ++i) + if (f.GetName(m_arrEn[i], l.m_enName)) { - // no need to check region with empty english name (can't match for polygon) - if (!i->m_enName.empty() && i->IsSuitable(m_query.m_tokens, m_query.m_prefix)) - { - vector vec; - m_query.m_infoGetter.GetMatchedRegions(i->m_enName, vec); - if (!vec.empty()) - { - regions.push_back(Region()); - Region & r = regions.back(); + // make name lower-case + strings::AsciiToLower(l.m_enName); - r.m_ids.swap(vec); - r.m_matchedTokens = i->m_matchedTokens; - r.m_enName = i->m_enName; - } + char const * arrUSA[] = {"united", "states", "america"}; + char const * arrUK[] = {"united", "kingdom"}; + + if (!FeatureName2FileNamePrefix(l.m_enName, "usa", arrUSA, ARRAY_SIZE(arrUSA))) + if (!FeatureName2FileNamePrefix(l.m_enName, "uk", arrUK, ARRAY_SIZE(arrUK))) + return; + } + } + //@} + + void AddRegions(int index, vector & regions) const + { + // fill regions vector in priority order + vector const & arr = m_localities[index]; + for (auto i = arr.rbegin(); i != arr.rend(); ++i) + { + // no need to check region with empty english name (can't match for polygon) + if (!i->m_enName.empty() && i->IsSuitable(m_query.m_tokens, m_query.m_prefix)) + { + vector vec; + m_query.m_infoGetter.GetMatchedRegions(i->m_enName, vec); + if (!vec.empty()) + { + regions.push_back(Region()); + Region & r = regions.back(); + + r.m_ids.swap(vec); + r.m_matchedTokens = i->m_matchedTokens; + r.m_enName = i->m_enName; } } } + } - bool IsBelong(Locality const & loc, Region const & r) const + bool IsBelong(Locality const & loc, Region const & r) const + { + // check that locality and region are produced from different tokens + vector dummy; + set_intersection(loc.m_matchedTokens.begin(), loc.m_matchedTokens.end(), + r.m_matchedTokens.begin(), r.m_matchedTokens.end(), back_inserter(dummy)); + + if (dummy.empty()) { - // check that locality and region are produced from different tokens - vector dummy; - set_intersection(loc.m_matchedTokens.begin(), loc.m_matchedTokens.end(), - r.m_matchedTokens.begin(), r.m_matchedTokens.end(), - back_inserter(dummy)); - - if (dummy.empty()) - { - // check that locality belong to region - return m_query.m_infoGetter.IsBelongToRegions(loc.m_value.m_pt, r.m_ids); - } - - return false; + // check that locality belong to region + return m_query.m_infoGetter.IsBelongToRegions(loc.m_center, r.m_ids); } - class EqualID - { - uint32_t m_id; - public: - EqualID(uint32_t id) : m_id(id) {} - bool operator() (Locality const & l) const { return (l.m_value.m_featureId == m_id); } - }; + return false; + } + + class EqualID + { + uint32_t m_id; public: - DoFindLocality(Query & q, MwmValue const * pMwm, int8_t lang) - : m_query(q), m_vector(pMwm->m_cont, pMwm->GetHeader(), pMwm->m_table), m_lang(lang) - { - m_arrEn[0] = q.GetLanguage(LANG_EN); - m_arrEn[1] = q.GetLanguage(LANG_INTERNATIONAL); - m_arrEn[2] = q.GetLanguage(LANG_DEFAULT); - } + EqualID(uint32_t id) : m_id(id) {} - void Resize(size_t) {} - - void SwitchTo(size_t ind) { m_index = ind; } - - void operator() (Query::TTrieValue const & v) - { - if (m_query.IsCancelled()) - throw Query::CancelException(); - - // find locality in current results - for (size_t i = 0; i < 3; ++i) - { - auto it = find_if(m_localities[i].begin(), m_localities[i].end(), EqualID(v.m_featureId)); - if (it != m_localities[i].end()) - { - it->m_matchedTokens.push_back(m_index); - return; - } - } - - // load feature - FeatureType f; - m_vector.GetByIndex(v.m_featureId, f); - - using namespace ftypes; - - // check, if feature is locality - Type const index = m_query.GetLocalityIndex(feature::TypesHolder(f)); - if (index != NONE) - { - Locality * loc = PushLocality(Locality(v, index)); - if (loc) - { - loc->m_radius = GetRadiusByPopulation(GetPopulation(f)); - // m_lang name should exist if we matched feature in search index for this language. - VERIFY(f.GetName(m_lang, loc->m_name), ()); - - loc->m_matchedTokens.push_back(m_index); - - AssignEnglishName(f, *loc); - } - } - } - - void SortLocalities() - { - for (int i = ftypes::COUNTRY; i <= ftypes::CITY; ++i) - sort(m_localities[i].begin(), m_localities[i].end()); - } - - void GetRegions(vector & regions) const - { - //LOG(LDEBUG, ("Countries before processing = ", m_localities[ftypes::COUNTRY])); - //LOG(LDEBUG, ("States before processing = ", m_localities[ftypes::STATE])); - - AddRegions(ftypes::STATE, regions); - AddRegions(ftypes::COUNTRY, regions); - - //LOG(LDEBUG, ("Regions after processing = ", regions)); - } - - void GetBestCity(Locality & res, vector const & regions) - { - size_t const regsCount = regions.size(); - vector & arr = m_localities[ftypes::CITY]; - - // Interate in reverse order from better to generic locality. - for (auto i = arr.rbegin(); i != arr.rend(); ++i) - { - if (!i->IsSuitable(m_query.m_tokens, m_query.m_prefix)) - continue; - - // additional check for locality belongs to region - vector belongs; - for (size_t j = 0; j < regsCount; ++j) - { - if (IsBelong(*i, regions[j])) - belongs.push_back(®ions[j]); - } - - for (size_t j = 0; j < belongs.size(); ++j) - { - // splice locality info with region info - i->m_matchedTokens.insert(i->m_matchedTokens.end(), - belongs[j]->m_matchedTokens.begin(), - belongs[j]->m_matchedTokens.end()); - // we need to store sorted range of token indexies - sort(i->m_matchedTokens.begin(), i->m_matchedTokens.end()); - - i->m_enName += (", " + belongs[j]->m_enName); - } - - if (res < *i) - i->Swap(res); - - if (regsCount == 0) - return; - } - } + bool operator()(Locality const & l) const { return (l.m_featureId == m_id); } }; -} -void Query::SearchLocality(MwmValue const * pMwm, impl::Locality & res1, impl::Region & res2) +public: + DoFindLocality(Query & q, MwmValue const * pMwm, int8_t lang) + : m_query(q), m_vector(pMwm->m_cont, pMwm->GetHeader(), pMwm->m_table), m_lang(lang) + { + m_arrEn[0] = q.GetLanguage(LANG_EN); + m_arrEn[1] = q.GetLanguage(LANG_INTERNATIONAL); + m_arrEn[2] = q.GetLanguage(LANG_DEFAULT); + } + + void Resize(size_t) {} + + void SwitchTo(size_t ind) { m_index = ind; } + + void operator()(Query::TTrieValue const & v) + { + LOG(LINFO, ("DoFindLocality::operator()")); + if (m_query.IsCancelled()) + throw Query::CancelException(); + + // find locality in current results + for (size_t i = 0; i < 3; ++i) + { + auto it = find_if(m_localities[i].begin(), m_localities[i].end(), EqualID(v.m_featureId)); + if (it != m_localities[i].end()) + { + it->m_matchedTokens.push_back(m_index); + return; + } + } + + // Load feature. + FeatureType f; + m_vector.GetByIndex(v.m_featureId, f); + + using namespace ftypes; + + // Check, if feature is locality. + Type const type = GetLocalityIndex(feature::TypesHolder(f)); + if (type == NONE) + return; + ASSERT_LESS_OR_EQUAL(0, type, ()); + ASSERT_LESS(type, ARRAY_SIZE(m_localities), ()); + + m2::PointD const center = feature::GetCenter(f, FeatureType::WORST_GEOMETRY); + m_localities[type].emplace_back(type, v.m_featureId, center, v.m_rank); + Locality & loc = m_localities[type].back(); + + loc.m_radius = GetRadiusByPopulation(GetPopulation(f)); + // m_lang name should exist if we matched feature in search index for this language. + VERIFY(f.GetName(m_lang, loc.m_name), ()); + loc.m_matchedTokens.push_back(m_index); + AssignEnglishName(f, loc); + } + + void SortLocalities() + { + for (int i = ftypes::COUNTRY; i <= ftypes::CITY; ++i) + sort(m_localities[i].begin(), m_localities[i].end()); + } + + void GetRegions(vector & regions) const + { + // LOG(LDEBUG, ("Countries before processing = ", m_localities[ftypes::COUNTRY])); + // LOG(LDEBUG, ("States before processing = ", m_localities[ftypes::STATE])); + + AddRegions(ftypes::STATE, regions); + AddRegions(ftypes::COUNTRY, regions); + + // LOG(LDEBUG, ("Regions after processing = ", regions)); + } + + void GetBestCity(Locality & res, vector const & regions) + { + size_t const regsCount = regions.size(); + vector & arr = m_localities[ftypes::CITY]; + + // Interate in reverse order from better to generic locality. + for (auto i = arr.rbegin(); i != arr.rend(); ++i) + { + if (!i->IsSuitable(m_query.m_tokens, m_query.m_prefix)) + continue; + + // additional check for locality belongs to region + vector belongs; + for (size_t j = 0; j < regsCount; ++j) + { + if (IsBelong(*i, regions[j])) + belongs.push_back(®ions[j]); + } + + for (size_t j = 0; j < belongs.size(); ++j) + { + // splice locality info with region info + i->m_matchedTokens.insert(i->m_matchedTokens.end(), belongs[j]->m_matchedTokens.begin(), + belongs[j]->m_matchedTokens.end()); + // we need to store sorted range of token indexies + sort(i->m_matchedTokens.begin(), i->m_matchedTokens.end()); + + i->m_enName += (", " + belongs[j]->m_enName); + } + + if (res < *i) + i->Swap(res); + + if (regsCount == 0) + return; + } + } +}; +} // namespace impl + +void Query::SearchLocality(MwmValue const * pMwm, Locality & res1, Region & res2) { + LOG(LDEBUG, ("Query::SearchLocality")); SearchQueryParams params; InitParams(true /* localitySearch */, params); @@ -1780,11 +1536,11 @@ void Query::SearchLocality(MwmValue const * pMwm, impl::Locality & res1, impl::R doFind.SortLocalities(); // Get regions from STATE and COUNTRY localities - vector regions; + vector regions; doFind.GetRegions(regions); // Get best CITY locality. - impl::Locality loc; + Locality loc; doFind.GetBestCity(loc, regions); if (res1 < loc) { @@ -1810,79 +1566,64 @@ void Query::SearchFeatures() SearchQueryParams params; InitParams(false /* localitySearch */, params); - // do usual search in viewport and near me (without last rect) - for (int i = 0; i < LOCALITY_V; ++i) - { - if (m_viewport[i].IsValid()) - SearchFeatures(params, mwmsInfo, static_cast(i)); - } + SearchInMwms(mwmsInfo, params, CURRENT_V); } -namespace +void Query::SearchFeaturesInViewport(ViewportID viewportId) { - class FeaturesFilter + TMWMVector mwmsInfo; + m_index.GetMwmsInfo(mwmsInfo); + + SearchQueryParams params; + InitParams(false /* localitySearch */, params); + + SearchFeaturesInViewport(params, mwmsInfo, viewportId); +} + +void Query::SearchFeaturesInViewport(SearchQueryParams const & params, TMWMVector const & mwmsInfo, + ViewportID viewportId) +{ + m2::RectD const * viewport = nullptr; + if (viewportId == LOCALITY_V) + viewport = &m_viewport[LOCALITY_V]; + else + viewport = &m_viewport[CURRENT_V]; + if (!viewport->IsValid()) + return; + + TMWMVector viewportMwms; + auto viewportMispatch = [&viewport](shared_ptr const & info) { - vector const * m_offsets; - - my::Cancellable const & m_cancellable; - public: - FeaturesFilter(vector const * offsets, my::Cancellable const & cancellable) - : m_offsets(offsets), m_cancellable(cancellable) - { - } - - bool operator() (uint32_t offset) const - { - if (m_cancellable.IsCancelled()) - { - //LOG(LINFO, ("Throw CancelException")); - //dbg::ObjectTracker::PrintLeaks(); - throw Query::CancelException(); - } - - return (m_offsets == 0 || - binary_search(m_offsets->begin(), m_offsets->end(), offset)); - } + return !viewport->IsIntersect(info->m_limitRect); }; + remove_copy_if(mwmsInfo.begin(), mwmsInfo.end(), back_inserter(viewportMwms), viewportMispatch); + SearchInMwms(viewportMwms, params, viewportId); } -void Query::SearchFeatures(SearchQueryParams const & params, TMWMVector const & mwmsInfo, - ViewportID vID) +void Query::SearchInMwms(TMWMVector const & mwmsInfo, SearchQueryParams const & params, + ViewportID viewportId) { - for (shared_ptr const & info : mwmsInfo) + Retrieval::Limits limits; + limits.SetMaxNumFeatures(kPreResultsCount); + limits.SetSearchInWorld(m_worldSearch); + + m2::RectD const * viewport = nullptr; + if (viewportId == LOCALITY_V) { - // Search only mwms that intersect with viewport (world always does). - if (m_viewport[vID].IsIntersect(info->m_limitRect)) - SearchInMWM(m_index.GetMwmHandleById(info), params, vID); + limits.SetMaxViewportScale(1.0); + viewport = &m_viewport[LOCALITY_V]; } -} - -void Query::SearchInMWM(Index::MwmHandle const & mwmHandle, SearchQueryParams const & params, - ViewportID viewportId /*= DEFAULT_V*/) -{ - MwmValue const * const value = mwmHandle.GetValue(); - if (!value || !value->m_cont.IsExist(SEARCH_INDEX_FILE_TAG)) - return; - - TFHeader const & header = value->GetHeader(); - /// @todo do not process World.mwm here - do it in SearchLocality - bool const isWorld = (header.GetType() == TFHeader::world); - if (isWorld && !m_worldSearch) - return; - - serial::CodingParams cp(trie::GetCodingParams(header.GetDefCodingParams())); - ModelReaderPtr searchReader = value->m_cont.GetReader(SEARCH_INDEX_FILE_TAG); - unique_ptr const trieRoot( - trie::ReadTrie(SubReaderWrapper(searchReader.GetPtr()), trie::ValueReader(cp), - trie::TEdgeValueReader())); - - MwmSet::MwmId const mwmId = mwmHandle.GetId(); - FeaturesFilter filter(viewportId == DEFAULT_V || isWorld ? - 0 : &m_offsetsInViewport[viewportId][mwmId], *this); - MatchFeaturesInTrie(params, *trieRoot, filter, [&](TTrieValue const & value) + else { - AddResultFromTrie(value, mwmId, viewportId); - }); + viewport = &m_viewport[CURRENT_V]; + } + + SearchQueryParams p = params; + p.m_scale = GetQueryIndexScale(*viewport); + m_retrieval.Init(m_index, mwmsInfo, *viewport, p, limits); + + RetrievalCallback callback(*this, viewportId); + m_retrieval.Go(callback); } void Query::SuggestStrings(Results & res) @@ -1942,43 +1683,20 @@ m2::PointD Query::GetPosition(ViewportID vID /*= DEFAULT_V*/) const } } -void Query::SearchAdditional(Results & res, size_t resCount) +string DebugPrint(Query::ViewportID viewportId) { - ClearQueues(); - - string const fileName = m_infoGetter.GetRegionFile(m_pivot); - if (!fileName.empty()) + switch (viewportId) { - LOG(LDEBUG, ("Additional MWM search: ", fileName)); - - TMWMVector mwmsInfo; - m_index.GetMwmsInfo(mwmsInfo); - - SearchQueryParams params; - InitParams(false /* localitySearch */, params); - - for (shared_ptr const & info : mwmsInfo) - { - Index::MwmHandle const handle = m_index.GetMwmHandleById(info); - if (handle.IsAlive() && - handle.GetValue()->GetCountryFileName() == fileName) - { - SearchInMWM(handle, params); - } - } - -#ifdef FIND_LOCALITY_TEST - m2::RectD rect; - for (auto const & r : m_results[0]) - rect.Add(r.GetCenter()); - - // Hack with 90.0 is important for the countries divided by 180 meridian. - if (rect.IsValid() && (rect.maxX() - rect.minX()) <= 90.0) - m_locality.SetReservedViewportIfNeeded(rect); -#endif - - FlushResults(res, true, resCount); + case Query::DEFAULT_V: + return "Default"; + case Query::CURRENT_V: + return "Current"; + case Query::LOCALITY_V: + return "Locality"; + case Query::COUNT_V: + return "Count"; } + ASSERT(false, ("Unknown viewportId")); + return "Unknown"; } - } // namespace search diff --git a/search/search_query.hpp b/search/search_query.hpp index 724bf5d6c0..056327d9fa 100644 --- a/search/search_query.hpp +++ b/search/search_query.hpp @@ -1,6 +1,7 @@ #pragma once #include "intermediate_result.hpp" #include "keyword_lang_matcher.hpp" +#include "retrieval.hpp" #include "suggest.hpp" #include "indexer/ftypes_matcher.hpp" @@ -39,6 +40,8 @@ namespace storage { class CountryInfoGetter; } namespace search { +struct Locality; +struct Region; struct SearchQueryParams; namespace impl @@ -46,8 +49,6 @@ namespace impl class FeatureLoader; class BestNameFinder; class PreResult2Maker; - struct Locality; - struct Region; class DoFindLocality; class HouseCompFactory; } @@ -55,10 +56,16 @@ namespace impl class Query : public my::Cancellable { public: - Query(Index & index, CategoriesHolder const & categories, - vector const & suggests, + Query(Index & index, CategoriesHolder const & categories, vector const & suggests, storage::CountryInfoGetter const & infoGetter); + // TODO (@gorshenin): current cancellation logic is completely wrong + // and broken by design. Fix it ASAP. + // + // my::Cancellable overrides: + void Reset() override; + void Cancel() override; + inline void SupportOldFormat(bool b) { m_supportOldFormat = b; } void Init(bool viewportSearch); @@ -82,11 +89,9 @@ public: /// @name Different search functions. //@{ - void SearchCoordinates(string const & query, Results & res) const; void Search(Results & res, size_t resCount); - void SearchAdditional(Results & res, size_t resCount); - void SearchViewportPoints(Results & res); + void SearchCoordinates(string const & query, Results & res) const; //@} // Get scale level to make geometry index query for current viewport. @@ -104,6 +109,30 @@ public: void InitParams(bool localitySearch, SearchQueryParams & params); private: + enum ViewportID + { + DEFAULT_V = -1, + CURRENT_V = 0, + LOCALITY_V = 1, + COUNT_V = 2 // Should always be the last + }; + + friend string DebugPrint(ViewportID viewportId); + + class RetrievalCallback : public Retrieval::Callback + { + public: + RetrievalCallback(Query & query, ViewportID id); + + // Retrieval::Callback overrides: + void OnFeaturesRetrieved(MwmSet::MwmId const & id, double scale, + vector const & featureIds) override; + + private: + Query & m_query; + ViewportID m_viewportId; + }; + friend class impl::FeatureLoader; friend class impl::BestNameFinder; friend class impl::PreResult2Maker; @@ -123,26 +152,15 @@ private: void SetViewportByIndex(TMWMVector const & mwmsInfo, m2::RectD const & viewport, size_t idx, bool forceUpdate); - void UpdateViewportOffsets(TMWMVector const & mwmsInfo, m2::RectD const & rect, - TOffsetsVector & offsets); void ClearCache(size_t ind); - enum ViewportID - { - DEFAULT_V = -1, - CURRENT_V = 0, - LOCALITY_V = 1, - COUNT_V = 2 // Should always be the last - }; - - void AddResultFromTrie(TTrieValue const & val, MwmSet::MwmId const & mwmID, - ViewportID vID = DEFAULT_V); + void AddPreResult1(MwmSet::MwmId const & mwmId, uint32_t featureId, uint8_t rank, double priority, + ViewportID viewportId = DEFAULT_V); template void MakePreResult2(vector & cont, vector & streets); void FlushHouses(Results & res, bool allMWMs, vector const & streets); void FlushResults(Results & res, bool allMWMs, size_t resCount); - ftypes::Type GetLocalityIndex(feature::TypesHolder const & types) const; void RemoveStringPrefix(string const & str, string & res) const; void GetSuggestion(string const & name, string & suggest) const; template void ProcessSuggestions(vector & vec, Results & res) const; @@ -153,20 +171,16 @@ private: /// @param[in] pMwm MWM file for World /// @param[out] res1 Best city-locality /// @param[out] res2 Best region-locality - void SearchLocality(MwmValue const * pMwm, impl::Locality & res1, impl::Region & res2); + void SearchLocality(MwmValue const * pMwm, Locality & res1, Region & res2); void SearchFeatures(); + void SearchFeaturesInViewport(ViewportID viewportId); + void SearchFeaturesInViewport(SearchQueryParams const & params, TMWMVector const & mwmsInfo, + ViewportID viewportId); - /// @param[in] ind Index of viewport rect to search (@see m_viewport). - /// If ind == -1, don't do any matching with features in viewport (@see m_offsetsInViewport). - //@{ - /// Do search in all maps from mwmInfo. - void SearchFeatures(SearchQueryParams const & params, TMWMVector const & mwmsInfo, - ViewportID vID); - /// Do search in particular map (mwmHandle). - void SearchInMWM(Index::MwmHandle const & mwmHandle, SearchQueryParams const & params, - ViewportID viewportId = DEFAULT_V); - //@} + /// Do search in a set of maps. + void SearchInMwms(TMWMVector const & mwmsInfo, SearchQueryParams const & params, + ViewportID viewportId); void SuggestStrings(Results & res); void MatchForSuggestionsImpl(strings::UniString const & token, int8_t locale, string const & prolog, Results & res); @@ -200,6 +214,7 @@ private: m2::RectD m_viewport[COUNT_V]; m2::PointD m_pivot; bool m_worldSearch; + Retrieval m_retrieval; /// @name Get ranking params. //@{ @@ -214,7 +229,6 @@ private: KeywordLangMatcher m_keywordsScorer; - TOffsetsVector m_offsetsInViewport[COUNT_V]; bool m_supportOldFormat; template diff --git a/search/search_tests_support/test_search_engine.cpp b/search/search_tests_support/test_search_engine.cpp index cc4a362b78..2a8becc550 100644 --- a/search/search_tests_support/test_search_engine.cpp +++ b/search/search_tests_support/test_search_engine.cpp @@ -5,9 +5,12 @@ #include "search/search_query.hpp" #include "search/search_query_factory.hpp" +#include "search/suggest.hpp" #include "platform/platform.hpp" +#include "defines.hpp" + #include "std/unique_ptr.hpp" namespace