From 1d4174dd5048d541493d8b8b434d0bd7b3771d77 Mon Sep 17 00:00:00 2001 From: Vladimir Byko-Ianko Date: Fri, 1 Jun 2018 17:16:38 +0300 Subject: [PATCH] Extrapolation benchmark implemented. --- map/extrapolation_benchmark/CMakeLists.txt | 6 +- .../extrapolation_benchmark.cpp | 208 ++++++++++++++++-- .../track_analyzer/cmd_unmatched_tracks.cpp | 2 +- 3 files changed, 195 insertions(+), 21 deletions(-) diff --git a/map/extrapolation_benchmark/CMakeLists.txt b/map/extrapolation_benchmark/CMakeLists.txt index f82bc03f74..75f8d88285 100644 --- a/map/extrapolation_benchmark/CMakeLists.txt +++ b/map/extrapolation_benchmark/CMakeLists.txt @@ -14,9 +14,13 @@ omim_add_executable(${PROJECT_NAME} ${SRC}) omim_link_libraries( ${PROJECT_NAME} - platform + map + routing geometry + platform + coding base + stats_client gflags ${LIBZ} ) diff --git a/map/extrapolation_benchmark/extrapolation_benchmark.cpp b/map/extrapolation_benchmark/extrapolation_benchmark.cpp index 40f85f16dd..0db0829ffb 100644 --- a/map/extrapolation_benchmark/extrapolation_benchmark.cpp +++ b/map/extrapolation_benchmark/extrapolation_benchmark.cpp @@ -1,9 +1,18 @@ +#include "map/extrapolation/extrapolator.hpp" + +#include "routing/base/followed_polyline.hpp" + #include "geometry/distance_on_sphere.hpp" #include "geometry/latlon.hpp" +#include "geometry/mercator.hpp" +#include "geometry/polyline2d.hpp" + +#include "platform/location.hpp" #include "base/logging.hpp" #include "base/string_utils.hpp" +#include #include #include #include @@ -15,27 +24,83 @@ #include "3party/gflags/src/gflags/gflags_declare.h" #include "3party/gflags/src/gflags/gflags.h" +// This tool is written to estimate quality of location extrapolation. To launch the benchmark +// you need tracks in csv file with the format described below. To generate the csv file +// you need to go through following steps: +// * take logs form Trafim project production in gz files +// * extract them (gzip -d) +// * run track_analyzer tool with unmatched_tracks command to generate csv +// (track_analyzer -cmd unmatched_tracks -in ./trafin_log.20180517-0000) +// * run this tool with csv_path equal to path to the csv +// (extrapolation_benchmark -csv_path=trafin_log.20180517-0000.track.csv) + DEFINE_string(csv_path, "", "Path to csv file with user in following format: mwm id (string), aloha id (string), " "latitude of the first coord (double), longitude of the first coord (double), " "timestamp in seconds (int), latitude of the second coord (double) and so on."); -DEFINE_bool(deviations, false, "Print deviations in meters for all extrapolations."); -DEFINE_int32(extrapolation_frequency, 10, "The number extrapolations in a second."); +using namespace extrapolation; +using namespace location; +using namespace routing; using namespace std; namespace { struct GpsPoint { - GpsPoint(double lat, double lon, double timestamp) - : m_lat(lat), m_lon(lon), m_timestamp(timestamp) + GpsPoint(double timestamp, double lat, double lon) + : m_timestamp(timestamp) + , m_lat(lat) + , m_lon(lon) { } + double m_timestamp; + // @TODO(bykoianko) Using LatLog type instead of two double should be considered. double m_lat; double m_lon; - double m_timestamp; +}; + +class MathematicalExpectation +{ +public: + void Add(double value) + { + if (m_counter == 0) + { + m_averageValue = value; + ++m_counter; + return; + } + + m_averageValue = (m_averageValue * m_counter + value) / (m_counter + 1); + ++m_counter; + } + + double Get() const { return m_averageValue; } + size_t GetCounter() const { return m_counter; } + +private: + double m_averageValue = 0.0; + size_t m_counter = 0; +}; + +class MathematicalExpectationVec +{ +public: + explicit MathematicalExpectationVec(size_t size) { m_mes.resize(size); } + + void Add(vector const & values) + { + CHECK_EQUAL(values.size(), m_mes.size(), ()); + for (size_t i = 0; i < values.size(); ++i) + m_mes[i].Add(values[i]); + } + + vector const & Get() const { return m_mes; } + +private: + vector m_mes; }; using Track = vector; @@ -65,15 +130,14 @@ bool GetUint64(stringstream & lineStream, uint64_t & result) return strings::to_uint64(strResult, result); } -bool GetGpsPoint(stringstream & lineStream, double & lat, double & lon, uint64_t & timestamp) +bool GetGpsPoint(stringstream & lineStream, uint64_t & timestamp, double & lat, double & lon) { + if (!GetUint64(lineStream, timestamp)) + return false; if (!GetDouble(lineStream, lat)) return false; - if (!GetDouble(lineStream, lon)) - return false; - - return GetUint64(lineStream, timestamp); + return GetDouble(lineStream, lon); } /// \brief Fills |tracks| based on file |pathToCsv| content. File |pathToCsv| should be @@ -104,15 +168,23 @@ bool Parse(string const & pathToCsv, Tracks & tracks) double lat; double lon; uint64_t timestamp; - if (!GetGpsPoint(lineStream, lat, lon, timestamp)) + if (!GetGpsPoint(lineStream, timestamp, lat, lon)) return false; - track.emplace_back(lat, lon, static_cast(timestamp)); + track.emplace_back(static_cast(timestamp), lat, lon); } tracks.push_back(move(track)); } csvStream.close(); return true; } + +void GpsPointToGpsInfo(GpsPoint const gpsPoint, GpsInfo & gpsInfo) +{ + gpsInfo.m_timestamp = gpsPoint.m_timestamp; + gpsInfo.m_latitude = gpsPoint.m_lat; + gpsInfo.m_longitude = gpsPoint.m_lon; + +} } // namespace /// \brief This benchmark is written to estimate how LinearExtrapolation() extrapolates real users tracks. @@ -121,7 +193,7 @@ int main(int argc, char * argv[]) { google::SetUsageMessage( "Location extrapolation benchmark. Calculates mathematical expectation and dispersion for " - "all extrapolation deviations form track passed in csv_path."); + "all extrapolation deviations from tracks passed in csv with with csv_path."); google::ParseCommandLineFlags(&argc, &argv, true); if (FLAGS_csv_path.empty()) @@ -137,6 +209,7 @@ int main(int argc, char * argv[]) return -1; } + // Printing some statistics about tracks. size_t trackPointNum = 0; for (auto const & t : tracks) trackPointNum += t.size(); @@ -146,16 +219,113 @@ int main(int argc, char * argv[]) { double trackLenM = 0; for (size_t j = 1; j < t.size(); ++j) - trackLenM += ms::DistanceOnEarth(ms::LatLon(t[j - 1].m_lat, t[j - 1].m_lon), ms::LatLon(t[j].m_lat, t[j].m_lon)); + { + trackLenM += ms::DistanceOnEarth(ms::LatLon(t[j - 1].m_lat, t[j - 1].m_lon), + ms::LatLon(t[j].m_lat, t[j].m_lon)); + } trackLengths += trackLenM; } - LOG(LINFO, ("General tracks stats. Number of tracks:", tracks.size(), "Track points:", - trackPointNum, "Points per track in average:", trackPointNum / tracks.size(), - "Average track length:", trackLengths / tracks.size(), "meters")); + LOG(LINFO, ("General tracks statistics." + "\n Number of tracks:", tracks.size(), + "\n Number of track points:", trackPointNum, + "\n Points per track in average:", trackPointNum / tracks.size(), + "\n Average track length:", trackLengths / tracks.size(), "meters")); - // @TODO(bykoianko) Parsed user track is placed to |tracks|. Then LinearExtrapolation() - // shall be used. + // For all points of each track in |tracks| some extrapolations will be calculated. + // The number of extrapolations depends on |Extrapolator::kExtrapolationPeriodMs| + // and |Extrapolator::kMaxExtrapolationTimeMs| and equal for all points. + // Then mathematical expectation and dispersion each extrapolation will be printed. + auto const extrapolationNumber = static_cast(Extrapolator::kMaxExtrapolationTimeMs / + Extrapolator::kExtrapolationPeriodMs); + MathematicalExpectationVec mes(extrapolationNumber); + MathematicalExpectationVec squareMes(extrapolationNumber); + // Number of extrapolations which projections are calculated successfully for. + size_t projectionCounter = 0; + for (auto const & t : tracks) + { + if (t.size() <= 1) + continue; + + m2::PolylineD poly; + for (auto const & p : t) + poly.Add(MercatorBounds::FromLatLon(p.m_lat, p.m_lon)); + CHECK_EQUAL(poly.GetSize(), t.size(), ()); + FollowedPolyline followedPoly(poly.Begin(), poly.End()); + CHECK(followedPoly.IsValid(), ()); + + // For each track point except for the first one some extrapolations will be calculated. + for (size_t i = 1; i < t.size(); ++i) + { + GpsInfo info1; + GpsPointToGpsInfo(t[i - 1], info1); + GpsInfo info2; + GpsPointToGpsInfo(t[i], info2); + + if (!AreCoordsGoodForExtrapolation(info1, info2)) + break; + + vector onePointDeviations; + vector onePointDeviationsInSqare; + bool cannotFindClosestProjection = false; + for (size_t timeMs = Extrapolator::kExtrapolationPeriodMs; + timeMs <= Extrapolator::kMaxExtrapolationTimeMs; + timeMs += Extrapolator::kExtrapolationPeriodMs) + { + GpsInfo const extrapolated = LinearExtrapolation(info1, info2, timeMs); + m2::PointD const extrapolatedMerc = MercatorBounds::FromLatLon(extrapolated.m_latitude, extrapolated.m_longitude); + + m2::RectD const posRect = MercatorBounds::MetresToXY( + extrapolated.m_longitude, extrapolated.m_latitude, 100.0 /* half square in meters */); + // Note. One is deducted from polyline size because in GetClosestProjectionInInterval() + // is used segment indices but not point indices. + auto const & iter = followedPoly.GetClosestProjectionInInterval( + posRect, + [&extrapolatedMerc](FollowedPolyline::Iter const & it) { + return MercatorBounds::DistanceOnEarth(it.m_pt, extrapolatedMerc); + }, + 0 /* start segment index */, followedPoly.GetPolyline().GetSize() - 1); + + if (iter.IsValid()) + { + ++projectionCounter; + } + else + { + // This situation is possible if |posRect| param of GetClosestProjectionInInterval() + // method is too small and there is no segment in |followedPoly| + // which is covered by this rect. It's a rare situation. + cannotFindClosestProjection = true; + break; + } + + double const distFromPoly = MercatorBounds::DistanceOnEarth(iter.m_pt, extrapolatedMerc); + onePointDeviations.push_back(distFromPoly); + onePointDeviationsInSqare.push_back(distFromPoly * distFromPoly); + } + + if (!cannotFindClosestProjection) + { + CHECK_EQUAL(onePointDeviations.size(), extrapolationNumber, ()); + mes.Add(onePointDeviations); + squareMes.Add(onePointDeviationsInSqare); + } + } + } + + CHECK_GREATER(extrapolationNumber, 0, ()); + LOG(LINFO, ("\n Processed", mes.Get()[0].GetCounter(), "points.\n", + " ", mes.Get()[0].GetCounter() * extrapolationNumber, "extrapolations is calculated.\n", + " Projection is calculated for", projectionCounter, "extrapolations.")); + + LOG(LINFO, ("Mathematical expectation for each extrapolation:")); + for (size_t i = 0; i < extrapolationNumber; ++i) + { + double const dispersion = squareMes.Get()[i].Get() - mes.Get()[i].Get() * mes.Get()[i].Get(); + LOG(LINFO, ("Extrapolation", i + 1, ",", Extrapolator::kExtrapolationPeriodMs * (i + 1), + "seconds after point two. Mathematical expectation =", mes.Get()[i].Get(), + "meters.", "Dispersion =", dispersion, ". Standard deviation =", sqrt(dispersion))); + } return 0; } diff --git a/track_analyzing/track_analyzer/cmd_unmatched_tracks.cpp b/track_analyzing/track_analyzer/cmd_unmatched_tracks.cpp index 6e90cd4411..c741aa1e2c 100644 --- a/track_analyzing/track_analyzer/cmd_unmatched_tracks.cpp +++ b/track_analyzing/track_analyzer/cmd_unmatched_tracks.cpp @@ -31,7 +31,7 @@ void CmdUnmatchedTracks(string const & logFile, string const & trackFileCsv) { ofs << numMwmIds->GetFile(kv.first).GetName() << ", " << idTrack.first; for (auto const & pnt : idTrack.second) - ofs << ", " << pnt.m_latLon.lat << ", " << pnt.m_latLon.lon << ", " << pnt.m_timestamp; + ofs << ", " << pnt.m_timestamp << ", " << pnt.m_latLon.lat << ", " << pnt.m_latLon.lon; ofs << "\n"; } }