/
local_options.py
130 lines (98 loc) · 4.37 KB
/
local_options.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
#!/usr/bin/env python
#
# Copyright 2014 Martin J Chorley
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import csv
from decorators import venue_response
from db_cache import MongoDBCache
from chain_decision import ChainDecider
from venue_searcher import VenueSearcher
class LocalComparison():
def __init__(self):
self.vs = VenueSearcher()
self.cd = ChainDecider()
self.db = MongoDBCache(db='fsqexp')
def get_venue_ids(self):
venues = []
# get all the venues from the database
db_venues = self.db.get_collection('venues').find(timeout=False)
# extract information needed for comparison
for v in db_venues:
# just work with venue information instead of whole response
if v.get('response'):
v = v['response']['venue']
venues.append(v['id'])
return venues
@venue_response
def local_comparison(self, venue, radius):
alt_chain_count = 0
chain_alternates = []
indie_alternates = []
alternates = self.vs.search_alternates(venue, radius)
for alternate in alternates:
v = self.vs.get_venue_json(alternate['id'])
if v is not None:
if v['id'] != venue['id']:
chain_id = self.cd.is_chain(v)
if chain_id is not None:
alt_chain_count += 1
chain_alternates.append(v)
else:
indie_alternates.append(v)
return chain_alternates, indie_alternates
if __name__ == '__main__':
distances = [50, 250, 500]
data_fields = ['venue_id', 'venue_name', 'chain']
for distance in distances:
data_fields.append('%d_indie_names' % distance)
data_fields.append('%d_indie_ids' % distance)
data_fields.append('%d_chain_names' % distance)
data_fields.append('%d_chain_ids' % distance)
with open('chain_indie_data.csv', 'w') as output_file:
writer = csv.DictWriter(output_file, data_fields)
writer.writeheader()
lc = LocalComparison()
venues = lc.get_venue_ids()
for venue in venues[0:1000]:
v = lc.vs.get_venue_json(venue)
data = dict.fromkeys(data_fields, "")
data['venue_id'] = v['id']
data['venue_name'] = v['name']
data['chain'] = lc.cd.is_chain(v)
print v['name']
for distance in distances:
c_a, i_a = lc.local_comparison(v, distance)
data['%d_chain_names' % distance] = []
data['%d_chain_ids' % distance] = []
data['%d_indie_names' % distance] = []
data['%d_indie_ids' % distance] = []
for alt in c_a:
if alt.get('response'):
data['%d_chain_names' % distance],append(alt['response']['venue']['name'])
data['%d_chain_ids' % distance],append(alt['response']['venue']['id'])
else:
if alt.get('name'):
data['%d_chain_names' % distance].append(alt['name'])
if alt.get('id'):
data['%d_chain_ids' % distance].append(alt['id'])
for alt in i_a:
if alt.get('response'):
data['%d_indie_names' % distance].append(alt['response']['venue']['name'])
data['%d_indie_ids' % distance].append(alt['response']['venue']['id'])
else:
if alt.get('name'):
data['%d_indie_names' % distance].append(alt['name'])
if alt.get('id'):
data['%d_indie_ids' % distance].append(alt['id'])
writer.writerow(data)