Add a couple more profile examples
This commit is contained in:
parent
1b97e96785
commit
7d8b7e8ccd
2 changed files with 182 additions and 0 deletions
78
profiles/rosinter.py
Normal file
78
profiles/rosinter.py
Normal file
|
@ -0,0 +1,78 @@
|
||||||
|
download_url = 'http://www.rosinter.ru/locator/RestaurantsFeed.aspx?city=all&location=&lang=ru&brand=all&cuisine=all&metro=&hasDelivery=&isCorporate='
|
||||||
|
source = 'Rosinter'
|
||||||
|
no_dataset_id = True
|
||||||
|
max_distance = 500
|
||||||
|
query = [('amenity', 'restaurant', 'cafe', 'bar', 'pub', 'fast_food')]
|
||||||
|
overpass_timeout = 1000
|
||||||
|
duplicate_distance = -1
|
||||||
|
nearest_points = 30
|
||||||
|
master_tags = ('name', 'phone', 'amenity')
|
||||||
|
|
||||||
|
types = {
|
||||||
|
# substr: osm_substr, amenity, cuisine
|
||||||
|
'Costa': ['costa', 'cafe', 'coffee_shop'],
|
||||||
|
'IL': [('patio', 'патио'), 'restaurant', 'italian'],
|
||||||
|
'TGI': [('tgi', 'friday'), 'restaurant', 'american'],
|
||||||
|
'Бар и': ['гриль', 'restaurant', 'american'],
|
||||||
|
'Макд': ['мак', 'fast_food', None],
|
||||||
|
'Раша': ['мама', 'fast_food', 'russian'],
|
||||||
|
'Планета': ['планета', 'restaurant', 'japanese'],
|
||||||
|
'Шика': ['шика', 'restaurant', 'asian'],
|
||||||
|
'Свои': ['сво', 'restaurant', None],
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
def matches(osmtags, ritags):
|
||||||
|
global types
|
||||||
|
rname = ritags['name']
|
||||||
|
name = osmtags.get('name', '').lower()
|
||||||
|
for k, v in types.items():
|
||||||
|
if k in rname:
|
||||||
|
if isinstance(v[0], str):
|
||||||
|
return v[0] in name
|
||||||
|
for n in v[0]:
|
||||||
|
if n in name:
|
||||||
|
return True
|
||||||
|
return False
|
||||||
|
logging.error('Unknown rname value: %s', rname)
|
||||||
|
return False
|
||||||
|
|
||||||
|
|
||||||
|
def dataset(f):
|
||||||
|
global types
|
||||||
|
from lxml import etree
|
||||||
|
root = etree.parse(f).getroot()
|
||||||
|
for el in root.find('Restaurants'):
|
||||||
|
rid = el.find('id').text
|
||||||
|
city = el.find('city').text
|
||||||
|
if city in ('Прага', 'Будапешт', 'Варшава', 'Баку', 'Рига'):
|
||||||
|
continue
|
||||||
|
brand = el.find('brand').text
|
||||||
|
if 'TGI' in brand:
|
||||||
|
brand = 'TGI Fridays'
|
||||||
|
elif 'СВОИ' in brand:
|
||||||
|
brand = 'Свои'
|
||||||
|
phone = el.find('telephone').text
|
||||||
|
if phone:
|
||||||
|
phone = phone.replace('(', '').replace(')', '')
|
||||||
|
website = el.find('siteurl').text
|
||||||
|
if website and 'il-patio' in website:
|
||||||
|
website = 'http://ilpatio.ru'
|
||||||
|
if 'Свои' in brand:
|
||||||
|
website = 'http://restoransvoi.by'
|
||||||
|
lat = float(el.find('latitude').text)
|
||||||
|
lon = float(el.find('longitude').text)
|
||||||
|
tags = {
|
||||||
|
'amenity': 'restaurant',
|
||||||
|
'name': brand,
|
||||||
|
'phone': phone,
|
||||||
|
'website': website,
|
||||||
|
}
|
||||||
|
address = el.find('address').text
|
||||||
|
for k, v in types.items():
|
||||||
|
if k in brand:
|
||||||
|
tags['amenity'] = v[1]
|
||||||
|
tags['cuisine'] = v[2]
|
||||||
|
yield SourcePoint(
|
||||||
|
rid, lat, lon, tags,
|
||||||
|
remarks='Обязательно подвиньте точку!\nАдрес: ' + str(address))
|
104
profiles/schocoladnitsa.py
Normal file
104
profiles/schocoladnitsa.py
Normal file
|
@ -0,0 +1,104 @@
|
||||||
|
download_url = 'http://new.shoko.ru/addresses/'
|
||||||
|
source = 'Шоколадница'
|
||||||
|
no_dataset_id = True
|
||||||
|
overpass_timeout = 600
|
||||||
|
max_distance = 250
|
||||||
|
max_request_boxes = 6
|
||||||
|
query = [('amenity',), ('name', '~Шоколадница')]
|
||||||
|
master_tags = ['amenity', 'name', 'name:ru', 'name:en', 'website', 'phone', 'opening_hours']
|
||||||
|
|
||||||
|
|
||||||
|
def dataset(fileobj):
|
||||||
|
def parse_oh(s):
|
||||||
|
if not s:
|
||||||
|
return None
|
||||||
|
olds = s
|
||||||
|
if s.strip().lower() == 'круглосуточно':
|
||||||
|
return '24/7'
|
||||||
|
trans = {
|
||||||
|
'будни': 'Mo-Fr',
|
||||||
|
'суббота': 'Sa',
|
||||||
|
'воскресенье': 'Su',
|
||||||
|
'ежедневно': 'Mo-Su',
|
||||||
|
'выходные': 'Sa-Su',
|
||||||
|
'восерсенье': 'Su',
|
||||||
|
'ежеденевно': 'Mo-Su',
|
||||||
|
'пн-чтивс': 'Mo-Th,Su',
|
||||||
|
'пн-чт,вс': 'Mo-Th,Su',
|
||||||
|
'пт.-сб': 'Fr-Sa',
|
||||||
|
'вск.-чт': 'Su-Th',
|
||||||
|
'смаяпооктябрь': 'May-Oct',
|
||||||
|
'ч.смаяпооктябрь': 'May-Oct',
|
||||||
|
'сентября': 'May-Sep',
|
||||||
|
}
|
||||||
|
weekdays = {'пн': 'Mo', 'вт': 'Tu', 'ср': 'We', 'чт': 'Th', 'пт': 'Fr', 'сб': 'Sa', 'вс': 'Su'}
|
||||||
|
if s == 'с 10 до 22' or s == 'с 10.00-22.00':
|
||||||
|
s = '10:00 - 22:00'
|
||||||
|
s = s.replace('круглосуточно', '00:00-24:00')
|
||||||
|
s = s.replace('23,', '23:00')
|
||||||
|
parts = []
|
||||||
|
for m in re.finditer(r'([а-яА-Я ,.:\(\)-]+?)?(?:\sс)?\s*(\d?\d[:.]\d\d)(?: до |[^\w\d]+)(\d\d[:.]\d\d)', s):
|
||||||
|
days = (m[1] or '').strip(' -.,:()').lower().replace(' ', '')
|
||||||
|
m2 = re.match(r'^([б-ч]{2})\s?[,и-]\s?([б-ч]{2})$', days)
|
||||||
|
if not days:
|
||||||
|
days = 'Mo-Su'
|
||||||
|
elif days in weekdays:
|
||||||
|
days = weekdays[days]
|
||||||
|
elif m2 and m2[1] in weekdays and m2[2] in weekdays:
|
||||||
|
days = weekdays[m2[1]] + '-' + weekdays[m2[2]]
|
||||||
|
else:
|
||||||
|
if days not in trans:
|
||||||
|
logging.warn('Unknown days: %s', days)
|
||||||
|
continue
|
||||||
|
days = trans[days]
|
||||||
|
parts.append('{} {:0>5}-{}'.format(days, m[2].replace('.', ':'), m[3].replace('.', ':')))
|
||||||
|
# logging.info('%s -> %s', olds, '; '.join(parts))
|
||||||
|
if parts:
|
||||||
|
return '; '.join(parts)
|
||||||
|
return None
|
||||||
|
|
||||||
|
from lxml import html
|
||||||
|
import re
|
||||||
|
import logging
|
||||||
|
import phonenumbers
|
||||||
|
h = html.fromstring(fileobj.read().decode('utf-8'))
|
||||||
|
markers = h.get_element_by_id('markers')
|
||||||
|
i = 0
|
||||||
|
for m in markers:
|
||||||
|
lat = m.get('data-lat')
|
||||||
|
lon = m.get('data-lng')
|
||||||
|
if not lat or not lon:
|
||||||
|
continue
|
||||||
|
oh = parse_oh(m.get('data-time'))
|
||||||
|
phone = m.get('data-phone')
|
||||||
|
if phone[:3] == '812':
|
||||||
|
phone = '+7' + phone
|
||||||
|
if ' 891' in phone:
|
||||||
|
phone = phone[:phone.index(' 891')]
|
||||||
|
if ' 8-91' in phone:
|
||||||
|
phone = phone[:phone.index(' 8-91')]
|
||||||
|
try:
|
||||||
|
if phone == 'отключен' or not phone:
|
||||||
|
phone = None
|
||||||
|
else:
|
||||||
|
parsed_phone = phonenumbers.parse(phone.replace(';', ',').split(',')[0], "RU")
|
||||||
|
except:
|
||||||
|
logging.info(phone)
|
||||||
|
raise
|
||||||
|
if phone is None:
|
||||||
|
fphone = None
|
||||||
|
else:
|
||||||
|
fphone = phonenumbers.format_number(
|
||||||
|
parsed_phone, phonenumbers.PhoneNumberFormat.INTERNATIONAL)
|
||||||
|
tags = {
|
||||||
|
'amenity': 'cafe',
|
||||||
|
'name': 'Шоколадница',
|
||||||
|
'name:ru': 'Шоколадница',
|
||||||
|
'name:en': 'Shokoladnitsa',
|
||||||
|
'website': 'http://shoko.ru',
|
||||||
|
'cuisine': 'coffee_shop',
|
||||||
|
'phone': fphone,
|
||||||
|
'opening_hours': oh
|
||||||
|
}
|
||||||
|
i += 1
|
||||||
|
yield SourcePoint(i, float(lat), float(lon), tags, remarks=m.get('data-title'))
|
Loading…
Add table
Reference in a new issue