From 65d9cfd9dde02f700b0ccd4ba72695e4e097cca3 Mon Sep 17 00:00:00 2001 From: Ilya Zverev Date: Wed, 23 May 2018 19:32:31 +0300 Subject: [PATCH] Started working on geocoding points --- conflate/conflate.py | 99 ++++++++++++++++++++++++++++++++++++++++++++ conflate/version.py | 2 +- setup.py | 1 + 3 files changed, 101 insertions(+), 1 deletion(-) diff --git a/conflate/conflate.py b/conflate/conflate.py index e8425dd..4fff838 100755 --- a/conflate/conflate.py +++ b/conflate/conflate.py @@ -8,6 +8,7 @@ import math import requests import re import os +import struct import sys from io import BytesIO from collections import defaultdict @@ -42,6 +43,7 @@ class SourcePoint: self.category = category self.dist_offset = 0 self.remarks = remarks + self.region = None self.exclusive_group = None def distance(self, other): @@ -1120,6 +1122,100 @@ def check_dataset_for_duplicates(profile, dataset, print_all=False): raise KeyError('Cannot continue with duplicate ids') +def init_geocoder(): + class PlacePoint: + def __init__(self, lon, lat, country, region): + self.coord = (lon, lat) + self.country = country + self.region = region + + def __len__(self): + return len(self.coord) + + def __getitem__(self, i): + return self.coord[i] + + filename = os.path.join(os.getcwd(), os.path.dirname(__file__), 'places.bin') + if not os.path.exists(filename): + return None + places = [] + with open(filename, 'rb') as f: + countries = [] + cnt = struct.unpack('B', f.read(1))[0] + for i in range(cnt): + countries.append(struct.unpack('2s', f.read(2))[0].decode('ascii')) + regions = [] + cnt = struct.unpack('h', f.read(2))[0] + for i in range(cnt): + l = struct.unpack('B', f.read(1))[0] + regions.append(f.read(l).decode('ascii')) + dlon = f.read(3) + while len(dlon) == 3: + dlat = f.read(3) + country = struct.unpack('B', f.read(1))[0] + region = struct.unpack('h', f.read(2))[0] + places.append(PlacePoint(struct.unpack('