Consolidate scripts into a single one, that is installed system-wide

2017-05-05 17:52:07 +03:00 · 2017-05-05 17:52:07 +03:00 · 96d1919fa8
commit 96d1919fa8
parent 631f828134
11 changed files with 189 additions and 145 deletions
--- a/.gitignore
+++ b/.gitignore
@ -1,3 +1,5 @@
 build/
 __pycache__/
 *.pyc
+dist/
+*.egg*
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@ -0,0 +1,9 @@
+# mwm.py Change Log
+
+## master branch
+
+## 0.9.0
+
+_Released 2017-06-08_
+
+The initial release with some features.
--- a/README.md
+++ b/README.md
@ -1,31 +0,0 @@
-# mwm.py
-
-It is a python library to read contents of MAPS.ME mwm files. Not everything
-is supported, but you can get at least all the features and their attributes.
-We at MAPS.ME use this script to do analytics and maintenance.
-
-## Installation
-
-    pip install mwm
-
-## Usage
-
-Just add `import mwm` to your script, and read an mwm file with:
-
-```python
-with open('file.mwm', 'rb') as f:
-    data = mwm.MWM(f)
-```
-
-## Tools
-
-There are some useful tools in the relevant directory, which can serve as
-the library usage examples:
-
-* `dump_mwm.py` prints the header and some statistics on an mwm file.
-* `find_feature.py` can find features inside an mwm by type or name.
-* `ft2osm.py` converts a feature id to an OSM website link.
-
-## License
-
-Written by Ilya Zverev for MAPS.ME. Published under the Apache License 2.0.
--- a/README.rst
+++ b/README.rst
@ -0,0 +1,39 @@
+mwm.py
+======
+
+It is a python library to read contents of MAPS.ME mwm files. Not
+everything is supported, but you can get at least all the features and
+their attributes. We at MAPS.ME use this script to do analytics and
+maintenance.
+
+Installation
+------------
+
+::
+
+    pip install mwm
+
+Usage
+-----
+
+Just add ``import mwm`` to your script, and read an mwm file with:
+
+.. code:: python
+
+    with open('file.mwm', 'rb') as f:
+        data = mwm.MWM(f)
+
+Tools
+-----
+
+The package installs the ``mwmtool`` command-line script. It shows
+statistics about an MWM file, can search for features or convert ids.
+Run it with ``-h`` to see a list of options.
+
+The script source can serve as a library usage example.
+
+License
+-------
+
+Written by Ilya Zverev for MAPS.ME. Published under the Apache License
+2.0.
--- a/mwm/init.py
+++ b/mwm/init.py
@ -1,2 +1,2 @@
-from .mwm import MWM, Osm2Ft
+from .mwm import MWM, Osm2Ft, __version__
 from .mwmfile import MWMFile
--- a/mwm/mwm.py
+++ b/mwm/mwm.py
@ -2,14 +2,14 @@
 from .mwmfile import MWMFile
 from datetime import datetime

-# Unprocessed sections: geomN, trgN, idx, sdx (search index), addr (search address), offs (feature offsets - succinct)
-# Routing sections: mercedes (matrix), daewoo (edge data), infinity (edge id), skoda (shortcuts), chrysler (cross context), ftseg, node2ftseg
-# (these mostly are succinct structures, except chrysler and node2ftseg, so no use trying to load them here)
+__version__ = '0.9.0'
+
+# Unprocessed sections: geomN, trgN, idx, sdx (search index),
+# addr (search address), offs (feature offsets - succinct)

 # TODO:
 # - Predictive reading of LineStrings
 # - Find why polygon geometry is incorrect in iter_features()
-# - Find feature ids in the 'dat' section, or find a way to read the 'offs' section


 class MWM(MWMFile):
@ -43,10 +43,11 @@ class MWM(MWMFile):
        fmt = self.read_varuint() + 1
        version = self.read_varuint()
        if version < 161231:
-            version = datetime(2000 + int(version / 10000), int(version / 100) % 100, version % 100)
+            vdate = datetime(2000 + int(version / 10000), int(version / 100) % 100, version % 100)
        else:
-            version = datetime.fromtimestamp(version)
-        return {'fmt': fmt, 'version': version}
+            vdate = datetime.fromtimestamp(version)
+            version = int(vdate.strftime('%y%m%d'))
+        return {'fmt': fmt, 'version': version, 'date': vdate}

    def read_header(self):
        """Reads 'header' section."""
--- a/mwm/mwmtool.py
+++ b/mwm/mwmtool.py
@ -0,0 +1,123 @@
+#!/usr/bin/env python
+import sys
+import os.path
+import random
+import json
+import argparse
+from mwm import MWM, Osm2Ft
+
+
+def dump_mwm(args):
+    mwm = MWM(args.mwm)
+    if os.path.exists(args.types):
+        mwm.read_types(args.types)
+
+    print('Tags:')
+    tvv = sorted([(k, v[0], v[1]) for k, v in mwm.tags.items()], key=lambda x: x[1])
+    for tv in tvv:
+        print('  {0:<8}: offs {1:9} len {2:8}'.format(tv[0], tv[1], tv[2]))
+    v = mwm.read_version()
+    print('Format: {0}, version: {1}'.format(v['fmt'], v['date'].strftime('%Y-%m-%d %H:%M')))
+    print('Header: {0}'.format(mwm.read_header()))
+    print('Region Info: {0}'.format(mwm.read_region_info()))
+    print('Metadata count: {0}'.format(len(mwm.read_metadata())))
+
+    cross = mwm.read_crossmwm()
+    if cross:
+        print('Outgoing points: {0}, incoming: {1}'.format(len(cross['out']), len(cross['in'])))
+        print('Outgoing regions: {0}'.format(set(cross['neighbours'])))
+
+    # Print some random features using reservoir sampling
+    count = 5
+    sample = []
+    for i, feature in enumerate(mwm.iter_features()):
+        if i < count:
+            sample.append(feature)
+        elif random.randint(0, i) < count:
+            sample[random.randint(0, count-1)] = feature
+
+    print('Feature count: {0}'.format(i))
+    print('Sample features:')
+    for feature in sample:
+        print(json.dumps(feature, ensure_ascii=False))
+
+
+def find_feature(args):
+    mwm = MWM(args.mwm)
+    mwm.read_header()
+    if os.path.exists(args.types):
+        mwm.read_types(args.types)
+    if args.iname:
+        args.iname = args.iname.lower()
+
+    for i, feature in enumerate(mwm.iter_features(metadata=True)):
+        if args.fid and i != args.fid:
+            continue
+        if args.name or args.iname:
+            if 'name' not in feature['header']:
+                continue
+            found = False
+            for value in feature['header']['name'].values():
+                if args.name and args.name in value:
+                    found = True
+                elif args.iname and args.iname in value.lower():
+                    found = True
+            if not found:
+                continue
+        if args.type or args.exact_type:
+            found = False
+            for t in feature['header']['types']:
+                if t == args.type or t == args.exact_type:
+                    found = True
+                elif args.type and args.type in t:
+                    found = True
+            if not found:
+                continue
+        if args.meta and ('metadata' not in feature or args.meta not in feature['metadata']):
+            continue
+        print(json.dumps(feature, ensure_ascii=False, sort_keys=True))
+
+
+def ft2osm(args):
+    ft2osm = Osm2Ft(args.osm2ft, True)
+    code = 0
+    type_abbr = {'n': 'node', 'w': 'way', 'r': 'relation'}
+    for ftid in args.ftid:
+        if ftid in ft2osm:
+            print('https://www.openstreetmap.org/{}/{}'.format(type_abbr[ft2osm[ftid][0]], ft2osm[ftid][1]))
+        else:
+            print('Could not find osm id for feature {}'.format(ftid))
+            code = 2
+    return code
+
+
+def main():
+    parser = argparse.ArgumentParser(description='Toolbox for MWM files.')
+    parser.add_argument('--types', default=os.path.join(os.path.dirname(sys.argv[0]), '..', '..', '..', '..', 'data', 'types.txt'), help='path to types.txt')
+    subparsers = parser.add_subparsers(dest='cmd')
+    subparsers.required = True
+    parser_dump = subparsers.add_parser('dump', help='Dumps some structures.')
+    parser_dump.add_argument('mwm', type=argparse.FileType('rb'), help='file to browse')
+    parser_dump.set_defaults(func=dump_mwm)
+    parser_find = subparsers.add_parser('find', help='Finds features in a file.')
+    parser_find.add_argument('mwm', type=argparse.FileType('rb'), help='file to search')
+    parser_find.add_argument('-t', dest='type', help='look inside types ("-t hwtag" will find all hwtags-*)')
+    parser_find.add_argument('-et', dest='exact_type', help='look for a type ("-et shop won\'t find shop-chemist)')
+    parser_find.add_argument('-n', dest='name', help='look inside names, case-sensitive ("-n Starbucks" for all starbucks)')
+    parser_find.add_argument('-in', dest='iname', help='look inside names, case-insensitive ("-in star" will find Starbucks)')
+    parser_find.add_argument('-m', dest='meta', help='look for a metadata key ("m flats" for features with flats)')
+    parser_find.add_argument('-id', dest='fid', type=int, help='look for a feature id ("-id 1234 for feature #1234)')
+    parser_find.set_defaults(func=find_feature)
+    parser_osm = subparsers.add_parser('osm', help='Displays an OpenStreetMap link for a feature id.')
+    parser_osm.add_argument('osm2ft', type=argparse.FileType('rb'), help='.mwm.osm2ft file')
+    parser_osm.add_argument('ftid', type=int, nargs='+', help='feature id')
+    parser_osm.set_defaults(func=ft2osm)
+
+    args = parser.parse_args()
+    code = args.func(args)
+    if code is not None:
+        sys.exit(code)
+
+
+if __name__ == '__main__':
+    main()
--- a/setup.py
+++ b/setup.py
@ -1,18 +1,19 @@
 from setuptools import setup
 from os import path
+from mwm import __version__

 here = path.abspath(path.dirname(__file__))

 setup(
    name='mwm',
-    version='0.9.0',
+    version=__version__,
    author='Ilya Zverev',
    author_email='ilya@zverev.info',
    packages=['mwm'],
-    url='http://pypi.python.org/pypi/mwm/',
+    url='https://github.com/mapsme/mwm.py',
    license='Apache License 2.0',
    description='Library to read binary MAPS.ME files.',
-    long_description=open(path.join(here, 'README.md')).read(),
+    long_description=open(path.join(here, 'README.rst')).read(),
    classifiers=[
        'Development Status :: 4 - Beta',
        'Intended Audience :: Developers',
@ -25,4 +26,7 @@ setup(
        'Programming Language :: Python :: 2.7',
        'Programming Language :: Python :: 3',
    ],
+    entry_points={
+        'console_scripts': ['mwmtool = mwm.mwmtool:main']
+    },
 )
--- a/tools/dump_mwm.py
+++ b/tools/dump_mwm.py
@ -1,40 +0,0 @@
-#!/usr/bin/python
-import sys, os.path, random
-import json
-from mwm import MWM
-
-if len(sys.argv) < 2:
-    print('Dumps some MWM structures.')
-    print('Usage: {0} <country.mwm>'.format(sys.argv[0]))
-    sys.exit(1)
-
-mwm = MWM(open(sys.argv[1], 'rb'))
-mwm.read_types(os.path.join(os.path.dirname(sys.argv[0]), '..', '..', '..', '..', 'data', 'types.txt'))
-print('Tags:')
-tvv = sorted([(k, v[0], v[1]) for k, v in mwm.tags.items()], key=lambda x: x[1])
-for tv in tvv:
-    print('  {0:<8}: offs {1:9} len {2:8}'.format(tv[0], tv[1], tv[2]))
-v = mwm.read_version()
-print('Format: {0}, version: {1}'.format(v['fmt'], v['version'].strftime('%Y-%m-%d %H:%M')))
-print('Header: {0}'.format(mwm.read_header()))
-print('Region Info: {0}'.format(mwm.read_region_info()))
-print('Metadata count: {0}'.format(len(mwm.read_metadata())))
-
-cross = mwm.read_crossmwm()
-if cross:
-    print('Outgoing points: {0}, incoming: {1}'.format(len(cross['out']), len(cross['in'])))
-    print('Outgoing regions: {0}'.format(set(cross['neighbours'])))
-
-# Print some random features using reservoir sampling
-count = 5
-sample = []
-for i, feature in enumerate(mwm.iter_features()):
-    if i < count:
-        sample.append(feature)
-    elif random.randint(0, i) < count:
-        sample[random.randint(0, count-1)] = feature
-
-print('Feature count: {0}'.format(i))
-print('Sample features:')
-for feature in sample:
-    print(json.dumps(feature, ensure_ascii=False))
--- a/tools/find_feature.py
+++ b/tools/find_feature.py
@ -1,41 +0,0 @@
-#!/usr/bin/env python
-import sys, os.path, json
-from mwm import MWM
-
-if len(sys.argv) < 4:
-    print('Finds features in an mwm file based on a query')
-    print('Usage: {0} <country.mwm> <type> <string>'.format(sys.argv[0]))
-    print('')
-    print('Type:')
-    print('  t for inside types ("t hwtag" will find all hwtags-*)')
-    print('  et for exact type ("et shop" won\'t find shop-chemist)')
-    print('  n for names, case-sensitive ("n Starbucks" for all starbucks)')
-    print('  m for metadata keys ("m flats" for features with flats)')
-    print('  id for feature id ("id 1234" for feature #1234)')
-    sys.exit(1)
-
-typ = sys.argv[2].lower()
-find = sys.argv[3].decode('utf-8')
-
-mwm = MWM(open(sys.argv[1], 'rb'))
-mwm.read_header()
-mwm.read_types(os.path.join(os.path.dirname(sys.argv[0]), '..', '..', '..', '..', 'data', 'types.txt'))
-for i, feature in enumerate(mwm.iter_features(metadata=True)):
-    found = False
-    if typ == 'n' and 'name' in feature['header']:
-        for value in feature['header']['name'].values():
-            if find in value:
-                found = True
-    elif typ in ('t', 'et'):
-        for t in feature['header']['types']:
-            if t == find:
-                found = True
-            elif typ == 't' and find in t:
-                found = True
-    elif typ == 'm' and 'metadata' in feature:
-        if find in feature['metadata']:
-            found = True
-    elif typ == 'id' and i == int(find):
-        found = True
-    if found:
-        print(json.dumps(feature, ensure_ascii=False, sort_keys=True).encode('utf-8'))
--- a/tools/ft2osm.py
+++ b/tools/ft2osm.py
@ -1,22 +0,0 @@
-#!/usr/bin/env python
-import sys
-import mwm
-
-if len(sys.argv) < 3:
-    print('Finds an OSM object for a given feature id.')
-    print('Usage: {} <mwm.osm2ft> <ftid>'.format(sys.argv[0]))
-    sys.exit(1)
-
-with open(sys.argv[1], 'rb') as f:
-    ft2osm = mwm.Osm2Ft(f, True)
-
-code = 0
-type_abbr = {'n': 'node', 'w': 'way', 'r': 'relation'}
-for ftid in sys.argv[2:]:
-    ftid = int(ftid)
-    if ftid in ft2osm:
-        print('https://www.openstreetmap.org/{}/{}'.format(type_abbr[ft2osm[ftid][0]], ft2osm[ftid][1]))
-    else:
-        print('Could not find osm id for feature {}'.format(ftid))
-        code = 2
-sys.exit(code)