diff --git a/tools/python/booking_hotels_quality.py b/tools/python/booking_hotels_quality.py index cd82adfd2d..7f7107c9c7 100755 --- a/tools/python/booking_hotels_quality.py +++ b/tools/python/booking_hotels_quality.py @@ -21,26 +21,22 @@ logging.basicConfig(level=logging.DEBUG, format='[%(asctime)s] %(levelname)s: %( def load_binary_list(path): - """ - Loads reference binary classifier output. - """ + """Loads reference binary classifier output. """ bits = [] with open(path, 'r') as fd: for line in fd: - if (not line.strip()) or line[0] == '#': + if (not line.strip()) or line.startswith('#'): continue - bits.append(1 if line[0] == 'y' else 0) + bits.append(1 if line.startswith('y') else 0) return bits def load_score_list(path): - """ - Loads list of matching scores. - """ + """Loads list of matching scores. """ scores = [] with open(path, 'r') as fd: for line in fd: - if (not line.strip()) or line[0] == '#': + if (not line.strip()) or line.startswith('#'): continue scores.append(float(re.search(r'result score: (\d*\.\d+)', line).group(1))) return scores diff --git a/tools/python/opentable_restaurants.py b/tools/python/opentable_restaurants.py new file mode 100755 index 0000000000..b4392827aa --- /dev/null +++ b/tools/python/opentable_restaurants.py @@ -0,0 +1,119 @@ +#! /usr/bin/env python2 +# coding: utf-8 + +from __future__ import print_function + +import argparse +import base64 +import copy +import json +import logging +import os +import sys +import urllib2 + +from datetime import datetime + +# Initialize logging. +logging.basicConfig(level=logging.DEBUG, format='[%(asctime)s] %(levelname)s: %(message)s') + +class OpentableDownloaderError(Exception): + pass + +class OpentableDownloader(object): + def __init__(self, login, password, opentable_filename, tsv_filename=None): + self.login = login + self.password = password + self.token = None + self.opentable_filename = opentable_filename + self.tsv_filename = tsv_filename + + # TODO(mgsergio): Check if toke is atual in functions. + self._get_token() + + def download(self): + headers = self._add_auth_header({'Content-Type': 'application/json'}) + url = 'https://platform.otqa.com/sync/listings' + + with open(self.opentable_filename, 'w') as f: + offset = 0 + while True: + request = urllib2.Request(url + '?offset={}'.format(offset), headers=headers) + logging.debug('Fetching data with headers %s from %s', + str(headers), request.get_full_url()) + resp = urllib2.urlopen(request) + # TODO(mgsergio): Handle exceptions + data = json.loads(resp.read()) + for rest in data['items']: + print(json.dumps(rest), file=f) + + total_items = int(data['total_items']) + offset = int(data['offset']) + items_count = len(data['items']) + + if total_items <= offset + items_count: + break + + offset += items_count + + def _get_token(self): + url = 'https://oauth-pp.opentable.com/api/v2/oauth/token?grant_type=client_credentials' + headers = self._add_auth_header({}) + request = urllib2.Request(url, headers=headers) + logging.debug('Fetching token with headers %s', str(headers)) + resp = urllib2.urlopen(request) + # TODO(mgsergio): Handle exceptions + if resp.getcode() != 200: + raise OpentableDownloaderError("Cant't get token. Response: {}".format(resp.read())) + self.token = json.loads(resp.read()) + logging.debug('Token is %s', self.token) + + def _add_auth_header(self, headers): + if self.token is None: + key = base64.b64encode('{}:{}'.format(self.login, self.password)) + headers['Authorization'] = 'Basic {}'.format(key) + else: + headers['Authorization'] = '{} {}'.format(self.token['token_type'], + self.token['access_token']) + return headers + + +def make_tsv(data_file, output_file): + for rest in data_file: + rest = json.loads(rest) + try: + address = ' '.join([rest['address'], rest['city'], rest['country']]) + except TypeError: + address = '' + row = '\t'.join(map(unicode, [rest['rid'], rest['latitude'], rest['longitude'], + rest['name'], address, rest['reservation_url'], + rest['phone_number']])) + print(row.encode('utf-8'), file=output_file) + + +if __name__ == '__main__': + parser = argparse.ArgumentParser(description='Downloads opentable data.') + parser.add_argument('-d', '--download', action='store_true', help='Download data') + parser.add_argument('--tsv', type=str, nargs='?', const='', + help='A file to put data into, stdout if value is empty ' + 'If ommited, no tsv data is generated') + parser.add_argument('--opentable_data', type=str, help='Path to opentable data file') + + # TODO(mgsergio): Allow config instead. + parser.add_argument('--client', required=True, help='Opentable client id') + parser.add_argument('--secrete', required=True, help="Opentable client's secrete") + + args = parser.parse_args(sys.argv[1:]) + + if args.download: + print('Downloading') + loader = OpentableDownloader(args.client, args.secrete, args.opentable_data) + loader.download() + if args.tsv is not None: + data = open(args.opentable_data) + tsv = open(args.tsv) if args.tsv else sys.stdout + try: + make_tsv(data, tsv) + finally: + data.close() + tsv.close()