Refactor to split processor/validator and mapsme output

This commit is contained in:
Ilya Zverev 2017-12-06 22:28:38 +03:00
parent 0197fb6ac0
commit 3d75e5e881
4 changed files with 184 additions and 181 deletions

View file

@ -8,9 +8,9 @@ import sys
import time
import urllib.parse
import urllib.request
from processors import processor
from subway_structure import (
distance,
download_cities,
find_transfers,
get_unused_entrances_geojson,
@ -277,180 +277,6 @@ def slugify(name):
return re.sub(r'[^a-z0-9_-]+', '', name.lower().replace(' ', '_'))
OSM_TYPES = {'n': (0, 'node'), 'w': (2, 'way'), 'r': (3, 'relation')}
SPEED_TO_ENTRANCE = 3 # km/h
SPEED_ON_TRANSFER = 3.5
SPEED_ON_LINE = 40
DEFAULT_INTERVAL = 2.5 # minutes
def prepare_mapsme_data(transfers, cities, cache_name):
def uid(elid, typ=None):
t = elid[0]
osm_id = int(elid[1:])
if not typ:
osm_id = osm_id << 2 + OSM_TYPES[t][0]
elif typ != t:
raise Exception('Got {}, expected {}'.format(elid, typ))
return osm_id << 1
def format_colour(c):
return c[1:] if c else None
def find_exits_for_platform(center, nodes):
exits = []
min_distance = None
for n in nodes:
d = distance(center, (n['lon'], n['lat']))
if not min_distance:
min_distance = d * 2 / 3
elif d < min_distance:
continue
too_close = False
for e in exits:
d = distance((e['lon'], e['lat']), (n['lon'], n['lat']))
if d < min_distance:
too_close = True
break
if not too_close:
exits.append(n)
return exits
cache = {}
if cache_name:
with open(cache_name, 'r', encoding='utf-8') as f:
cache = json.load(f)
stops = {} # el_id -> station data
networks = []
good_cities = set([c.name for c in cities])
for city_name, data in cache.items():
if city_name in good_cities:
continue
# TODO: get a network, stops and transfers from cache
platform_nodes = {}
for city in cities:
network = {'network': city.name, 'routes': [], 'agency_id': city.id}
for route in city:
routes = {
'type': route.mode,
'ref': route.ref,
'name': route.name,
'colour': format_colour(route.colour),
'route_id': uid(route.id, 'r'),
'itineraries': []
}
if route.infill:
routes['casing'] = routes['colour']
routes['colour'] = format_colour(route.infill)
for i, variant in enumerate(route):
itin = []
for stop in variant:
stops[stop.stoparea.id] = stop.stoparea
itin.append([uid(stop.stoparea.id), round(stop.distance*3.6/SPEED_ON_LINE)])
# Make exits from platform nodes, if we don't have proper exits
if len(stop.stoparea.entrances) + len(stop.stoparea.exits) == 0:
for pl in stop.stoparea.platforms:
pl_el = city.elements[pl]
if pl_el['type'] == 'node':
pl_nodes = [pl_el]
elif pl_el['type'] == 'way':
pl_nodes = [city.elements['n{}'.format(n)]
for n in pl_el['nodes']]
else:
pl_nodes = []
for m in pl_el['members']:
if m['type'] == 'way':
pl_nodes.extend(
[city.elements['n{}'.format(n)]
for n in city.elements['{}{}'.format(
m['type'][0], m['ref'])]['nodes']])
platform_nodes[pl] = find_exits_for_platform(
stop.stoparea.centers[pl], pl_nodes)
routes['itineraries'].append({
'stops': itin,
'interval': round((variant.interval or DEFAULT_INTERVAL) * 60)
})
network['routes'].append(routes)
networks.append(network)
m_stops = []
for stop in stops.values():
st = {
'name': stop.name,
'int_name': stop.int_name,
'lat': stop.center[1],
'lon': stop.center[0],
'osm_type': OSM_TYPES[stop.station.id[0]][1],
'osm_id': int(stop.station.id[1:]),
'id': uid(stop.id),
'entrances': [],
'exits': [],
}
for e_l, k in ((stop.entrances, 'entrances'), (stop.exits, 'exits')):
for e in e_l:
if e[0] == 'n':
st[k].append({
'osm_type': 'node',
'osm_id': int(e[1:]),
'lon': stop.centers[e][0],
'lat': stop.centers[e][1],
'distance': 60 + round(distance(
stop.centers[e], stop.center)*3.6/SPEED_TO_ENTRANCE)
})
if len(stop.entrances) + len(stop.exits) == 0:
if stop.platforms:
for pl in stop.platforms:
for n in platform_nodes[pl]:
for k in ('entrances', 'exits'):
st[k].append({
'osm_type': n['type'],
'osm_id': n['id'],
'lon': n['lon'],
'lat': n['lat'],
'distance': 60 + round(distance(
(n['lon'], n['lat']), stop.center)*3.6/SPEED_TO_ENTRANCE)
})
else:
for k in ('entrances', 'exits'):
st[k].append({
'osm_type': OSM_TYPES[stop.station.id[0]][1],
'osm_id': int(stop.station.id[1:]),
'lon': stop.centers[stop.id][0],
'lat': stop.centers[stop.id][1],
'distance': 60
})
m_stops.append(st)
c_transfers = []
for t_set in transfers:
t = list(t_set)
for t_first in range(len(t) - 1):
for t_second in range(t_first + 1, len(t)):
if t[t_first].id in stops and t[t_second].id in stops:
c_transfers.append([
uid(t[t_first].id),
uid(t[t_second].id),
30 + round(distance(t[t_first].center,
t[t_second].center)*3.6/SPEED_ON_TRANSFER)
])
if cache_name:
with open(cache_name, 'w', encoding='utf-8') as f:
json.dump(cache, f)
result = {
'stops': m_stops,
'transfers': c_transfers,
'networks': networks
}
return result
if __name__ == '__main__':
parser = argparse.ArgumentParser()
parser.add_argument(
@ -466,8 +292,8 @@ if __name__ == '__main__':
parser.add_argument('-l', '--log', type=argparse.FileType('w', encoding='utf-8'),
help='Validation JSON file name')
parser.add_argument('-o', '--output', type=argparse.FileType('w', encoding='utf-8'),
help='JSON file for MAPS.ME')
parser.add_argument('--cache', help='Cache file name for MAPS.ME data')
help='Processed metro systems output')
parser.add_argument('--cache', help='Cache file name for processed data')
parser.add_argument('-d', '--dump', help='Make a YAML file for a city data')
parser.add_argument('-j', '--json', help='Make a GeoJSON file for a city data')
parser.add_argument('--crude', action='store_true',
@ -573,7 +399,6 @@ if __name__ == '__main__':
res.append(v)
json.dump(res, options.log)
# Finally, prepare a JSON file for MAPS.ME
if options.output:
json.dump(prepare_mapsme_data(transfers, good_cities, options.cache),
json.dump(processor.process(good_cities, transfers, options.cache),
options.output, indent=1, ensure_ascii=False)

2
processors/__init__.py Normal file
View file

@ -0,0 +1,2 @@
# Here you can change the processor
from . import mapsme as processor

176
processors/mapsme.py Executable file
View file

@ -0,0 +1,176 @@
import json
from subway_structure import distance
OSM_TYPES = {'n': (0, 'node'), 'w': (2, 'way'), 'r': (3, 'relation')}
SPEED_TO_ENTRANCE = 3 # km/h
SPEED_ON_TRANSFER = 3.5
SPEED_ON_LINE = 40
DEFAULT_INTERVAL = 2.5 # minutes
def process(cities, transfers, cache_name):
def uid(elid, typ=None):
t = elid[0]
osm_id = int(elid[1:])
if not typ:
osm_id = osm_id << 2 + OSM_TYPES[t][0]
elif typ != t:
raise Exception('Got {}, expected {}'.format(elid, typ))
return osm_id << 1
def format_colour(c):
return c[1:] if c else None
def find_exits_for_platform(center, nodes):
exits = []
min_distance = None
for n in nodes:
d = distance(center, (n['lon'], n['lat']))
if not min_distance:
min_distance = d * 2 / 3
elif d < min_distance:
continue
too_close = False
for e in exits:
d = distance((e['lon'], e['lat']), (n['lon'], n['lat']))
if d < min_distance:
too_close = True
break
if not too_close:
exits.append(n)
return exits
cache = {}
if cache_name:
with open(cache_name, 'r', encoding='utf-8') as f:
cache = json.load(f)
stops = {} # el_id -> station data
networks = []
good_cities = set([c.name for c in cities])
for city_name, data in cache.items():
if city_name in good_cities:
continue
# TODO: get a network, stops and transfers from cache
platform_nodes = {}
for city in cities:
network = {'network': city.name, 'routes': [], 'agency_id': city.id}
for route in city:
routes = {
'type': route.mode,
'ref': route.ref,
'name': route.name,
'colour': format_colour(route.colour),
'route_id': uid(route.id, 'r'),
'itineraries': []
}
if route.infill:
routes['casing'] = routes['colour']
routes['colour'] = format_colour(route.infill)
for i, variant in enumerate(route):
itin = []
for stop in variant:
stops[stop.stoparea.id] = stop.stoparea
itin.append([uid(stop.stoparea.id), round(stop.distance*3.6/SPEED_ON_LINE)])
# Make exits from platform nodes, if we don't have proper exits
if len(stop.stoparea.entrances) + len(stop.stoparea.exits) == 0:
for pl in stop.stoparea.platforms:
pl_el = city.elements[pl]
if pl_el['type'] == 'node':
pl_nodes = [pl_el]
elif pl_el['type'] == 'way':
pl_nodes = [city.elements['n{}'.format(n)]
for n in pl_el['nodes']]
else:
pl_nodes = []
for m in pl_el['members']:
if m['type'] == 'way':
pl_nodes.extend(
[city.elements['n{}'.format(n)]
for n in city.elements['{}{}'.format(
m['type'][0], m['ref'])]['nodes']])
platform_nodes[pl] = find_exits_for_platform(
stop.stoparea.centers[pl], pl_nodes)
routes['itineraries'].append({
'stops': itin,
'interval': round((variant.interval or DEFAULT_INTERVAL) * 60)
})
network['routes'].append(routes)
networks.append(network)
m_stops = []
for stop in stops.values():
st = {
'name': stop.name,
'int_name': stop.int_name,
'lat': stop.center[1],
'lon': stop.center[0],
'osm_type': OSM_TYPES[stop.station.id[0]][1],
'osm_id': int(stop.station.id[1:]),
'id': uid(stop.id),
'entrances': [],
'exits': [],
}
for e_l, k in ((stop.entrances, 'entrances'), (stop.exits, 'exits')):
for e in e_l:
if e[0] == 'n':
st[k].append({
'osm_type': 'node',
'osm_id': int(e[1:]),
'lon': stop.centers[e][0],
'lat': stop.centers[e][1],
'distance': 60 + round(distance(
stop.centers[e], stop.center)*3.6/SPEED_TO_ENTRANCE)
})
if len(stop.entrances) + len(stop.exits) == 0:
if stop.platforms:
for pl in stop.platforms:
for n in platform_nodes[pl]:
for k in ('entrances', 'exits'):
st[k].append({
'osm_type': n['type'],
'osm_id': n['id'],
'lon': n['lon'],
'lat': n['lat'],
'distance': 60 + round(distance(
(n['lon'], n['lat']), stop.center)*3.6/SPEED_TO_ENTRANCE)
})
else:
for k in ('entrances', 'exits'):
st[k].append({
'osm_type': OSM_TYPES[stop.station.id[0]][1],
'osm_id': int(stop.station.id[1:]),
'lon': stop.centers[stop.id][0],
'lat': stop.centers[stop.id][1],
'distance': 60
})
m_stops.append(st)
c_transfers = []
for t_set in transfers:
t = list(t_set)
for t_first in range(len(t) - 1):
for t_second in range(t_first + 1, len(t)):
if t[t_first].id in stops and t[t_second].id in stops:
c_transfers.append([
uid(t[t_first].id),
uid(t[t_second].id),
30 + round(distance(t[t_first].center,
t[t_second].center)*3.6/SPEED_ON_TRANSFER)
])
if cache_name:
with open(cache_name, 'w', encoding='utf-8') as f:
json.dump(cache, f)
result = {
'stops': m_stops,
'transfers': c_transfers,
'networks': networks
}
return result

View file

@ -41,7 +41,7 @@ PYTHON=${PYTHON:-python3}
# This will fail if there is no python
"$PYTHON" --version > /dev/null
SUBWAYS_PATH="$(dirname "$0")/.."
[ ! -f "$SUBWAYS_PATH/mapsme_subways.py" ] && echo "Please clone the subways repo to $SUBWAYS_PATH" && exit 2
[ ! -f "$SUBWAYS_PATH/process_subways.py" ] && echo "Please clone the subways repo to $SUBWAYS_PATH" && exit 2
TMPDIR="${TMPDIR:-$SUBWAYS_PATH}"
# Downloading the latest version of the subways script
@ -71,7 +71,7 @@ QNODES="railway=station station=subway =light_rail =monorail railway=subway_entr
# Running the validation
VALIDATION="$TMPDIR/validation.json"
"$PYTHON" "$SUBWAYS_PATH/mapsme_subways.py" -q -x "$FILTERED_DATA" -l "$VALIDATION" ${MAPSME+-o "$MAPSME"} ${CITY+-c "$CITY"} ${DUMP+-d "$DUMP"} ${JSON+-j "$JSON"}
"$PYTHON" "$SUBWAYS_PATH/process_subways.py" -q -x "$FILTERED_DATA" -l "$VALIDATION" ${MAPSME+-o "$MAPSME"} ${CITY+-c "$CITY"} ${DUMP+-d "$DUMP"} ${JSON+-j "$JSON"}
rm "$FILTERED_DATA"
# Preparing HTML files