Consolidate scripts into a single one, that is installed system-wide
This commit is contained in:
parent
631f828134
commit
96d1919fa8
11 changed files with 189 additions and 145 deletions
2
.gitignore
vendored
2
.gitignore
vendored
|
@ -1,3 +1,5 @@
|
||||||
build/
|
build/
|
||||||
__pycache__/
|
__pycache__/
|
||||||
*.pyc
|
*.pyc
|
||||||
|
dist/
|
||||||
|
*.egg*
|
||||||
|
|
9
CHANGELOG.md
Normal file
9
CHANGELOG.md
Normal file
|
@ -0,0 +1,9 @@
|
||||||
|
# mwm.py Change Log
|
||||||
|
|
||||||
|
## master branch
|
||||||
|
|
||||||
|
## 0.9.0
|
||||||
|
|
||||||
|
_Released 2017-06-08_
|
||||||
|
|
||||||
|
The initial release with some features.
|
31
README.md
31
README.md
|
@ -1,31 +0,0 @@
|
||||||
# mwm.py
|
|
||||||
|
|
||||||
It is a python library to read contents of MAPS.ME mwm files. Not everything
|
|
||||||
is supported, but you can get at least all the features and their attributes.
|
|
||||||
We at MAPS.ME use this script to do analytics and maintenance.
|
|
||||||
|
|
||||||
## Installation
|
|
||||||
|
|
||||||
pip install mwm
|
|
||||||
|
|
||||||
## Usage
|
|
||||||
|
|
||||||
Just add `import mwm` to your script, and read an mwm file with:
|
|
||||||
|
|
||||||
```python
|
|
||||||
with open('file.mwm', 'rb') as f:
|
|
||||||
data = mwm.MWM(f)
|
|
||||||
```
|
|
||||||
|
|
||||||
## Tools
|
|
||||||
|
|
||||||
There are some useful tools in the relevant directory, which can serve as
|
|
||||||
the library usage examples:
|
|
||||||
|
|
||||||
* `dump_mwm.py` prints the header and some statistics on an mwm file.
|
|
||||||
* `find_feature.py` can find features inside an mwm by type or name.
|
|
||||||
* `ft2osm.py` converts a feature id to an OSM website link.
|
|
||||||
|
|
||||||
## License
|
|
||||||
|
|
||||||
Written by Ilya Zverev for MAPS.ME. Published under the Apache License 2.0.
|
|
39
README.rst
Normal file
39
README.rst
Normal file
|
@ -0,0 +1,39 @@
|
||||||
|
mwm.py
|
||||||
|
======
|
||||||
|
|
||||||
|
It is a python library to read contents of MAPS.ME mwm files. Not
|
||||||
|
everything is supported, but you can get at least all the features and
|
||||||
|
their attributes. We at MAPS.ME use this script to do analytics and
|
||||||
|
maintenance.
|
||||||
|
|
||||||
|
Installation
|
||||||
|
------------
|
||||||
|
|
||||||
|
::
|
||||||
|
|
||||||
|
pip install mwm
|
||||||
|
|
||||||
|
Usage
|
||||||
|
-----
|
||||||
|
|
||||||
|
Just add ``import mwm`` to your script, and read an mwm file with:
|
||||||
|
|
||||||
|
.. code:: python
|
||||||
|
|
||||||
|
with open('file.mwm', 'rb') as f:
|
||||||
|
data = mwm.MWM(f)
|
||||||
|
|
||||||
|
Tools
|
||||||
|
-----
|
||||||
|
|
||||||
|
The package installs the ``mwmtool`` command-line script. It shows
|
||||||
|
statistics about an MWM file, can search for features or convert ids.
|
||||||
|
Run it with ``-h`` to see a list of options.
|
||||||
|
|
||||||
|
The script source can serve as a library usage example.
|
||||||
|
|
||||||
|
License
|
||||||
|
-------
|
||||||
|
|
||||||
|
Written by Ilya Zverev for MAPS.ME. Published under the Apache License
|
||||||
|
2.0.
|
|
@ -1,2 +1,2 @@
|
||||||
from .mwm import MWM, Osm2Ft
|
from .mwm import MWM, Osm2Ft, __version__
|
||||||
from .mwmfile import MWMFile
|
from .mwmfile import MWMFile
|
||||||
|
|
15
mwm/mwm.py
15
mwm/mwm.py
|
@ -2,14 +2,14 @@
|
||||||
from .mwmfile import MWMFile
|
from .mwmfile import MWMFile
|
||||||
from datetime import datetime
|
from datetime import datetime
|
||||||
|
|
||||||
# Unprocessed sections: geomN, trgN, idx, sdx (search index), addr (search address), offs (feature offsets - succinct)
|
__version__ = '0.9.0'
|
||||||
# Routing sections: mercedes (matrix), daewoo (edge data), infinity (edge id), skoda (shortcuts), chrysler (cross context), ftseg, node2ftseg
|
|
||||||
# (these mostly are succinct structures, except chrysler and node2ftseg, so no use trying to load them here)
|
# Unprocessed sections: geomN, trgN, idx, sdx (search index),
|
||||||
|
# addr (search address), offs (feature offsets - succinct)
|
||||||
|
|
||||||
# TODO:
|
# TODO:
|
||||||
# - Predictive reading of LineStrings
|
# - Predictive reading of LineStrings
|
||||||
# - Find why polygon geometry is incorrect in iter_features()
|
# - Find why polygon geometry is incorrect in iter_features()
|
||||||
# - Find feature ids in the 'dat' section, or find a way to read the 'offs' section
|
|
||||||
|
|
||||||
|
|
||||||
class MWM(MWMFile):
|
class MWM(MWMFile):
|
||||||
|
@ -43,10 +43,11 @@ class MWM(MWMFile):
|
||||||
fmt = self.read_varuint() + 1
|
fmt = self.read_varuint() + 1
|
||||||
version = self.read_varuint()
|
version = self.read_varuint()
|
||||||
if version < 161231:
|
if version < 161231:
|
||||||
version = datetime(2000 + int(version / 10000), int(version / 100) % 100, version % 100)
|
vdate = datetime(2000 + int(version / 10000), int(version / 100) % 100, version % 100)
|
||||||
else:
|
else:
|
||||||
version = datetime.fromtimestamp(version)
|
vdate = datetime.fromtimestamp(version)
|
||||||
return {'fmt': fmt, 'version': version}
|
version = int(vdate.strftime('%y%m%d'))
|
||||||
|
return {'fmt': fmt, 'version': version, 'date': vdate}
|
||||||
|
|
||||||
def read_header(self):
|
def read_header(self):
|
||||||
"""Reads 'header' section."""
|
"""Reads 'header' section."""
|
||||||
|
|
123
mwm/mwmtool.py
Executable file
123
mwm/mwmtool.py
Executable file
|
@ -0,0 +1,123 @@
|
||||||
|
#!/usr/bin/env python
|
||||||
|
import sys
|
||||||
|
import os.path
|
||||||
|
import random
|
||||||
|
import json
|
||||||
|
import argparse
|
||||||
|
from mwm import MWM, Osm2Ft
|
||||||
|
|
||||||
|
|
||||||
|
def dump_mwm(args):
|
||||||
|
mwm = MWM(args.mwm)
|
||||||
|
if os.path.exists(args.types):
|
||||||
|
mwm.read_types(args.types)
|
||||||
|
|
||||||
|
print('Tags:')
|
||||||
|
tvv = sorted([(k, v[0], v[1]) for k, v in mwm.tags.items()], key=lambda x: x[1])
|
||||||
|
for tv in tvv:
|
||||||
|
print(' {0:<8}: offs {1:9} len {2:8}'.format(tv[0], tv[1], tv[2]))
|
||||||
|
v = mwm.read_version()
|
||||||
|
print('Format: {0}, version: {1}'.format(v['fmt'], v['date'].strftime('%Y-%m-%d %H:%M')))
|
||||||
|
print('Header: {0}'.format(mwm.read_header()))
|
||||||
|
print('Region Info: {0}'.format(mwm.read_region_info()))
|
||||||
|
print('Metadata count: {0}'.format(len(mwm.read_metadata())))
|
||||||
|
|
||||||
|
cross = mwm.read_crossmwm()
|
||||||
|
if cross:
|
||||||
|
print('Outgoing points: {0}, incoming: {1}'.format(len(cross['out']), len(cross['in'])))
|
||||||
|
print('Outgoing regions: {0}'.format(set(cross['neighbours'])))
|
||||||
|
|
||||||
|
# Print some random features using reservoir sampling
|
||||||
|
count = 5
|
||||||
|
sample = []
|
||||||
|
for i, feature in enumerate(mwm.iter_features()):
|
||||||
|
if i < count:
|
||||||
|
sample.append(feature)
|
||||||
|
elif random.randint(0, i) < count:
|
||||||
|
sample[random.randint(0, count-1)] = feature
|
||||||
|
|
||||||
|
print('Feature count: {0}'.format(i))
|
||||||
|
print('Sample features:')
|
||||||
|
for feature in sample:
|
||||||
|
print(json.dumps(feature, ensure_ascii=False))
|
||||||
|
|
||||||
|
|
||||||
|
def find_feature(args):
|
||||||
|
mwm = MWM(args.mwm)
|
||||||
|
mwm.read_header()
|
||||||
|
if os.path.exists(args.types):
|
||||||
|
mwm.read_types(args.types)
|
||||||
|
if args.iname:
|
||||||
|
args.iname = args.iname.lower()
|
||||||
|
|
||||||
|
for i, feature in enumerate(mwm.iter_features(metadata=True)):
|
||||||
|
if args.fid and i != args.fid:
|
||||||
|
continue
|
||||||
|
if args.name or args.iname:
|
||||||
|
if 'name' not in feature['header']:
|
||||||
|
continue
|
||||||
|
found = False
|
||||||
|
for value in feature['header']['name'].values():
|
||||||
|
if args.name and args.name in value:
|
||||||
|
found = True
|
||||||
|
elif args.iname and args.iname in value.lower():
|
||||||
|
found = True
|
||||||
|
if not found:
|
||||||
|
continue
|
||||||
|
if args.type or args.exact_type:
|
||||||
|
found = False
|
||||||
|
for t in feature['header']['types']:
|
||||||
|
if t == args.type or t == args.exact_type:
|
||||||
|
found = True
|
||||||
|
elif args.type and args.type in t:
|
||||||
|
found = True
|
||||||
|
if not found:
|
||||||
|
continue
|
||||||
|
if args.meta and ('metadata' not in feature or args.meta not in feature['metadata']):
|
||||||
|
continue
|
||||||
|
print(json.dumps(feature, ensure_ascii=False, sort_keys=True))
|
||||||
|
|
||||||
|
|
||||||
|
def ft2osm(args):
|
||||||
|
ft2osm = Osm2Ft(args.osm2ft, True)
|
||||||
|
code = 0
|
||||||
|
type_abbr = {'n': 'node', 'w': 'way', 'r': 'relation'}
|
||||||
|
for ftid in args.ftid:
|
||||||
|
if ftid in ft2osm:
|
||||||
|
print('https://www.openstreetmap.org/{}/{}'.format(type_abbr[ft2osm[ftid][0]], ft2osm[ftid][1]))
|
||||||
|
else:
|
||||||
|
print('Could not find osm id for feature {}'.format(ftid))
|
||||||
|
code = 2
|
||||||
|
return code
|
||||||
|
|
||||||
|
|
||||||
|
def main():
|
||||||
|
parser = argparse.ArgumentParser(description='Toolbox for MWM files.')
|
||||||
|
parser.add_argument('--types', default=os.path.join(os.path.dirname(sys.argv[0]), '..', '..', '..', '..', 'data', 'types.txt'), help='path to types.txt')
|
||||||
|
subparsers = parser.add_subparsers(dest='cmd')
|
||||||
|
subparsers.required = True
|
||||||
|
parser_dump = subparsers.add_parser('dump', help='Dumps some structures.')
|
||||||
|
parser_dump.add_argument('mwm', type=argparse.FileType('rb'), help='file to browse')
|
||||||
|
parser_dump.set_defaults(func=dump_mwm)
|
||||||
|
parser_find = subparsers.add_parser('find', help='Finds features in a file.')
|
||||||
|
parser_find.add_argument('mwm', type=argparse.FileType('rb'), help='file to search')
|
||||||
|
parser_find.add_argument('-t', dest='type', help='look inside types ("-t hwtag" will find all hwtags-*)')
|
||||||
|
parser_find.add_argument('-et', dest='exact_type', help='look for a type ("-et shop won\'t find shop-chemist)')
|
||||||
|
parser_find.add_argument('-n', dest='name', help='look inside names, case-sensitive ("-n Starbucks" for all starbucks)')
|
||||||
|
parser_find.add_argument('-in', dest='iname', help='look inside names, case-insensitive ("-in star" will find Starbucks)')
|
||||||
|
parser_find.add_argument('-m', dest='meta', help='look for a metadata key ("m flats" for features with flats)')
|
||||||
|
parser_find.add_argument('-id', dest='fid', type=int, help='look for a feature id ("-id 1234 for feature #1234)')
|
||||||
|
parser_find.set_defaults(func=find_feature)
|
||||||
|
parser_osm = subparsers.add_parser('osm', help='Displays an OpenStreetMap link for a feature id.')
|
||||||
|
parser_osm.add_argument('osm2ft', type=argparse.FileType('rb'), help='.mwm.osm2ft file')
|
||||||
|
parser_osm.add_argument('ftid', type=int, nargs='+', help='feature id')
|
||||||
|
parser_osm.set_defaults(func=ft2osm)
|
||||||
|
|
||||||
|
args = parser.parse_args()
|
||||||
|
code = args.func(args)
|
||||||
|
if code is not None:
|
||||||
|
sys.exit(code)
|
||||||
|
|
||||||
|
|
||||||
|
if __name__ == '__main__':
|
||||||
|
main()
|
10
setup.py
10
setup.py
|
@ -1,18 +1,19 @@
|
||||||
from setuptools import setup
|
from setuptools import setup
|
||||||
from os import path
|
from os import path
|
||||||
|
from mwm import __version__
|
||||||
|
|
||||||
here = path.abspath(path.dirname(__file__))
|
here = path.abspath(path.dirname(__file__))
|
||||||
|
|
||||||
setup(
|
setup(
|
||||||
name='mwm',
|
name='mwm',
|
||||||
version='0.9.0',
|
version=__version__,
|
||||||
author='Ilya Zverev',
|
author='Ilya Zverev',
|
||||||
author_email='ilya@zverev.info',
|
author_email='ilya@zverev.info',
|
||||||
packages=['mwm'],
|
packages=['mwm'],
|
||||||
url='http://pypi.python.org/pypi/mwm/',
|
url='https://github.com/mapsme/mwm.py',
|
||||||
license='Apache License 2.0',
|
license='Apache License 2.0',
|
||||||
description='Library to read binary MAPS.ME files.',
|
description='Library to read binary MAPS.ME files.',
|
||||||
long_description=open(path.join(here, 'README.md')).read(),
|
long_description=open(path.join(here, 'README.rst')).read(),
|
||||||
classifiers=[
|
classifiers=[
|
||||||
'Development Status :: 4 - Beta',
|
'Development Status :: 4 - Beta',
|
||||||
'Intended Audience :: Developers',
|
'Intended Audience :: Developers',
|
||||||
|
@ -25,4 +26,7 @@ setup(
|
||||||
'Programming Language :: Python :: 2.7',
|
'Programming Language :: Python :: 2.7',
|
||||||
'Programming Language :: Python :: 3',
|
'Programming Language :: Python :: 3',
|
||||||
],
|
],
|
||||||
|
entry_points={
|
||||||
|
'console_scripts': ['mwmtool = mwm.mwmtool:main']
|
||||||
|
},
|
||||||
)
|
)
|
||||||
|
|
|
@ -1,40 +0,0 @@
|
||||||
#!/usr/bin/python
|
|
||||||
import sys, os.path, random
|
|
||||||
import json
|
|
||||||
from mwm import MWM
|
|
||||||
|
|
||||||
if len(sys.argv) < 2:
|
|
||||||
print('Dumps some MWM structures.')
|
|
||||||
print('Usage: {0} <country.mwm>'.format(sys.argv[0]))
|
|
||||||
sys.exit(1)
|
|
||||||
|
|
||||||
mwm = MWM(open(sys.argv[1], 'rb'))
|
|
||||||
mwm.read_types(os.path.join(os.path.dirname(sys.argv[0]), '..', '..', '..', '..', 'data', 'types.txt'))
|
|
||||||
print('Tags:')
|
|
||||||
tvv = sorted([(k, v[0], v[1]) for k, v in mwm.tags.items()], key=lambda x: x[1])
|
|
||||||
for tv in tvv:
|
|
||||||
print(' {0:<8}: offs {1:9} len {2:8}'.format(tv[0], tv[1], tv[2]))
|
|
||||||
v = mwm.read_version()
|
|
||||||
print('Format: {0}, version: {1}'.format(v['fmt'], v['version'].strftime('%Y-%m-%d %H:%M')))
|
|
||||||
print('Header: {0}'.format(mwm.read_header()))
|
|
||||||
print('Region Info: {0}'.format(mwm.read_region_info()))
|
|
||||||
print('Metadata count: {0}'.format(len(mwm.read_metadata())))
|
|
||||||
|
|
||||||
cross = mwm.read_crossmwm()
|
|
||||||
if cross:
|
|
||||||
print('Outgoing points: {0}, incoming: {1}'.format(len(cross['out']), len(cross['in'])))
|
|
||||||
print('Outgoing regions: {0}'.format(set(cross['neighbours'])))
|
|
||||||
|
|
||||||
# Print some random features using reservoir sampling
|
|
||||||
count = 5
|
|
||||||
sample = []
|
|
||||||
for i, feature in enumerate(mwm.iter_features()):
|
|
||||||
if i < count:
|
|
||||||
sample.append(feature)
|
|
||||||
elif random.randint(0, i) < count:
|
|
||||||
sample[random.randint(0, count-1)] = feature
|
|
||||||
|
|
||||||
print('Feature count: {0}'.format(i))
|
|
||||||
print('Sample features:')
|
|
||||||
for feature in sample:
|
|
||||||
print(json.dumps(feature, ensure_ascii=False))
|
|
|
@ -1,41 +0,0 @@
|
||||||
#!/usr/bin/env python
|
|
||||||
import sys, os.path, json
|
|
||||||
from mwm import MWM
|
|
||||||
|
|
||||||
if len(sys.argv) < 4:
|
|
||||||
print('Finds features in an mwm file based on a query')
|
|
||||||
print('Usage: {0} <country.mwm> <type> <string>'.format(sys.argv[0]))
|
|
||||||
print('')
|
|
||||||
print('Type:')
|
|
||||||
print(' t for inside types ("t hwtag" will find all hwtags-*)')
|
|
||||||
print(' et for exact type ("et shop" won\'t find shop-chemist)')
|
|
||||||
print(' n for names, case-sensitive ("n Starbucks" for all starbucks)')
|
|
||||||
print(' m for metadata keys ("m flats" for features with flats)')
|
|
||||||
print(' id for feature id ("id 1234" for feature #1234)')
|
|
||||||
sys.exit(1)
|
|
||||||
|
|
||||||
typ = sys.argv[2].lower()
|
|
||||||
find = sys.argv[3].decode('utf-8')
|
|
||||||
|
|
||||||
mwm = MWM(open(sys.argv[1], 'rb'))
|
|
||||||
mwm.read_header()
|
|
||||||
mwm.read_types(os.path.join(os.path.dirname(sys.argv[0]), '..', '..', '..', '..', 'data', 'types.txt'))
|
|
||||||
for i, feature in enumerate(mwm.iter_features(metadata=True)):
|
|
||||||
found = False
|
|
||||||
if typ == 'n' and 'name' in feature['header']:
|
|
||||||
for value in feature['header']['name'].values():
|
|
||||||
if find in value:
|
|
||||||
found = True
|
|
||||||
elif typ in ('t', 'et'):
|
|
||||||
for t in feature['header']['types']:
|
|
||||||
if t == find:
|
|
||||||
found = True
|
|
||||||
elif typ == 't' and find in t:
|
|
||||||
found = True
|
|
||||||
elif typ == 'm' and 'metadata' in feature:
|
|
||||||
if find in feature['metadata']:
|
|
||||||
found = True
|
|
||||||
elif typ == 'id' and i == int(find):
|
|
||||||
found = True
|
|
||||||
if found:
|
|
||||||
print(json.dumps(feature, ensure_ascii=False, sort_keys=True).encode('utf-8'))
|
|
|
@ -1,22 +0,0 @@
|
||||||
#!/usr/bin/env python
|
|
||||||
import sys
|
|
||||||
import mwm
|
|
||||||
|
|
||||||
if len(sys.argv) < 3:
|
|
||||||
print('Finds an OSM object for a given feature id.')
|
|
||||||
print('Usage: {} <mwm.osm2ft> <ftid>'.format(sys.argv[0]))
|
|
||||||
sys.exit(1)
|
|
||||||
|
|
||||||
with open(sys.argv[1], 'rb') as f:
|
|
||||||
ft2osm = mwm.Osm2Ft(f, True)
|
|
||||||
|
|
||||||
code = 0
|
|
||||||
type_abbr = {'n': 'node', 'w': 'way', 'r': 'relation'}
|
|
||||||
for ftid in sys.argv[2:]:
|
|
||||||
ftid = int(ftid)
|
|
||||||
if ftid in ft2osm:
|
|
||||||
print('https://www.openstreetmap.org/{}/{}'.format(type_abbr[ft2osm[ftid][0]], ft2osm[ftid][1]))
|
|
||||||
else:
|
|
||||||
print('Could not find osm id for feature {}'.format(ftid))
|
|
||||||
code = 2
|
|
||||||
sys.exit(code)
|
|
Loading…
Add table
Reference in a new issue