1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
|
import re
import urllib
from urlparse import urljoin
import mysql
from bs4 import BeautifulSoup as bs
import jfr_playoff.sql as p_sql
from jfr_playoff.dto import Match, Team
class MatchInfo(object):
    """Build the ``Match`` description of a single configured match.

    Team names, scores and progress are looked up in up to three sources,
    tried in this order: the tournament database, the HTML results page the
    match links to, and finally the static match configuration.

    ``info.running`` starts at 0, is set to -1 once the match is complete
    (this is the value that triggers winner/loser resolution) and to the
    number of boards played while the match is still in progress.
    """

    # Registry of match info objects keyed by match id.  It is shared by all
    # instances so that a match can look up the winner/loser of another one.
    matches = {}
    # Downloaded page bodies keyed by URL, shared by all instances so that
    # every page is fetched at most once.
    url_cache = {}

    def __init__(self, match_config, teams, database):
        """Store the inputs and initialise the match id, bracket and link.

        :param match_config: configuration mapping of this match; the keys
            read by this class are ``id``, ``teams`` and optionally ``link``,
            ``round``, ``table``, ``database``, ``score`` and ``running``.
        :param teams: sequence of team rows; the first item of each row is
            used as the team name and rows are addressed by 1-based number.
        :param database: object exposing ``fetch(db_name, sql, params)``,
            or ``None`` when no database is available.
        """
        self.config = match_config
        self.teams = teams
        self.database = database
        self.info = Match()
        self.__init_info()
        self.__fetch_match_link()

    def __has_database(self):
        """Tell whether a database lookup can be attempted for this match."""
        return self.database is not None and 'database' in self.config

    def __init_info(self):
        """Register the match and collect the matches that feed into it."""
        self.info.id = self.config['id']
        MatchInfo.matches[self.info.id] = self.info
        self.info.running = 0
        winner_matches = []
        loser_matches = []
        for i in range(0, 2):
            team_config = self.config['teams'][i]
            # Only mapping entries can reference other matches.  A plain
            # team name (or a list of names) must not be probed with ``in``:
            # for a string that is a substring test and would wrongly match
            # names containing "winner" or "loser".
            if not isinstance(team_config, dict):
                continue
            if 'winner' in team_config:
                winner_matches += team_config['winner']
            if 'loser' in team_config:
                loser_matches += team_config['loser']
        # De-duplicate match ids referenced by both sides.
        self.info.winner_matches = list(set(winner_matches))
        self.info.loser_matches = list(set(loser_matches))
        self.info.teams = []

    def __get_link(self, suffix):
        """Return the database link prefix joined with ``suffix``.

        :returns: the link, or ``None`` when no database is configured, the
            query fails or it yields no usable row.
        """
        if not self.__has_database():
            return None
        try:
            row = self.database.fetch(
                self.config['database'], p_sql.PREFIX, ())
        except mysql.connector.Error:
            return None
        if row is not None and len(row) > 0:
            return row[0] + suffix
        return None

    def __fetch_match_link(self):
        """Set the match link from ``link`` or derive it from ``round``."""
        if 'link' in self.config:
            self.info.link = self.config['link']
        elif 'round' in self.config:
            self.info.link = self.__get_link(
                'runda%d.html' % (self.config['round']))

    def __get_predefined_scores(self):
        """Read scores (and possibly team names) given in the configuration.

        ``score`` may be a mapping of team to score or a plain sequence of
        scores; at most the first two entries are used.  Mapping keys that
        parse as integers are treated as 1-based indexes into ``self.teams``,
        any other key is used as the team name itself.

        :returns: ``(scores_fetched, teams_fetched, teams)``.
        """
        teams = [Team(), Team()]
        if 'score' not in self.config:
            return False, False, teams
        scores = self.config['score']
        scores_by_team = isinstance(scores, dict)
        teams_fetched = False
        for i, entry in enumerate(scores):
            if i == 2:
                break
            if scores_by_team:
                teams[i].score = scores[entry]
                try:
                    teams[i].name = self.teams[int(entry) - 1][0]
                except ValueError:
                    # not a team number, so the key is the team name
                    teams[i].name = entry
                teams_fetched = True
            else:
                teams[i].score = entry
        return True, teams_fetched, teams

    def __get_db_teams(self, teams, fetch_scores):
        """Fill team names (and optionally scores) from the database.

        The score of each team is the sum of two result columns; the value
        in column 2 is credited to the first team when positive and its
        negation to the second team otherwise (presumably a carry-over --
        confirm against the ``MATCH_RESULTS`` query).
        """
        row = self.database.fetch(
            self.config['database'], p_sql.MATCH_RESULTS,
            (self.config['table'], self.config['round']))
        teams[0].name = row[0]
        teams[1].name = row[1]
        if fetch_scores:
            teams[0].score = row[3] + row[5]
            teams[1].score = row[4] + row[6]
            if row[2] > 0:
                teams[0].score += row[2]
            else:
                teams[1].score -= row[2]
        return teams

    def __fetch_url(self, url):
        """Return the body of ``url``, downloading it only on first use."""
        if url not in MatchInfo.url_cache:
            response = urllib.urlopen(url)
            try:
                MatchInfo.url_cache[url] = response.read()
            finally:
                # release the connection even if reading fails
                response.close()
        return MatchInfo.url_cache[url]

    def __find_table_row(self, url):
        """Find the results row of the configured table on the page ``url``.

        :returns: the first nested ``tr`` with a ``td.t1`` cell whose text
            equals the configured table number, or ``None`` when there is no
            such row or no URL to look at.
        """
        if url is None:
            # nothing to download; callers treat None as "row not found"
            return None
        html_content = bs(self.__fetch_url(url), 'lxml')
        table_label = str(self.config['table'])
        for row in html_content.select('tr tr'):
            for cell in row.select('td.t1'):
                if cell.text.strip() == table_label:
                    return row
        return None

    def __get_html_teams(self, teams, fetch_score):
        """Fill team names (and optionally scores) from the results page.

        Scores are only read and assigned when ``fetch_score`` is true, so
        that scores predefined in the configuration are not overwritten
        (the same contract as the database lookup).

        :raises ValueError: when the table row cannot be found or a score
            does not parse as a number.
        """
        row = self.__find_table_row(self.info.link)
        if row is None:
            raise ValueError('table row not found')
        scores = []
        if fetch_score:
            # the last td.bdc cell holds both scores as separate text nodes
            score_cell = row.select('td.bdc')[-1]
            scores = [
                float(text) for text
                in score_cell.contents
                if isinstance(text, unicode)]
        team_names = [[text for text in link.contents
                       if isinstance(text, unicode)][0].strip(u'\xa0')
                      for link in row.select('a[onmouseover]')]
        for i in range(0, 2):
            teams[i].name = team_names[i]
            if fetch_score:
                teams[i].score = scores[i]
        return teams

    def __get_config_teams(self, teams):
        """Fill team names from the static ``teams`` configuration.

        An entry may be a name, a list of names, or a mapping referring to
        winners/losers of other matches and to places in ``self.teams``.
        Candidates that are not known yet are rendered as ``??``; when no
        candidate is known at all the name is left empty.
        """
        for i in range(0, 2):
            team_config = self.config['teams'][i]
            if isinstance(team_config, basestring):
                teams[i].name = team_config
            elif isinstance(team_config, list):
                teams[i].name = '<br />'.join(team_config)
            else:
                candidates = []
                if 'winner' in team_config:
                    candidates += [
                        MatchInfo.matches[winner_match].winner
                        for winner_match in team_config['winner']]
                if 'loser' in team_config:
                    candidates += [
                        MatchInfo.matches[loser_match].loser
                        for loser_match in team_config['loser']]
                if 'place' in team_config:
                    candidates += [
                        self.teams[place - 1][0]
                        for place in team_config['place']]
                if any(team is not None for team in candidates):
                    teams[i].name = '<br />'.join([
                        team if team is not None
                        else '??' for team in candidates])
                else:
                    teams[i].name = ''
        return teams

    def __fetch_teams_with_scores(self):
        """Resolve teams and scores: config, then database, HTML, config.

        Predefined scores mark the match as complete unless the
        configuration provides an explicit ``running`` value.
        """
        (scores_fetched, teams_fetched,
         self.info.teams) = self.__get_predefined_scores()
        if scores_fetched:
            if 'running' in self.config:
                self.info.running = int(self.config['running'])
            else:
                self.info.running = -1
        if teams_fetched:
            return
        fetch_scores = not scores_fetched
        try:
            if self.__has_database():
                try:
                    self.info.teams = self.__get_db_teams(
                        self.info.teams, fetch_scores)
                    return
                except (mysql.connector.Error,
                        TypeError, IndexError, KeyError):
                    # database lookup failed, fall back to the HTML page
                    pass
            self.info.teams = self.__get_html_teams(
                self.info.teams, fetch_scores)
        except (TypeError, IndexError, KeyError, IOError, ValueError):
            # last resort: whatever the configuration says
            self.info.teams = self.__get_config_teams(self.info.teams)

    def __get_db_board_count(self):
        """Return ``(boards_played, boards_to_play)`` from the database.

        The towel count is added to the played boards whenever the match
        has any boards to play.
        """
        towels = self.database.fetch(
            self.config['database'], p_sql.TOWEL_COUNT,
            (self.config['table'], self.config['round']))
        row = [0 if r is None
               else r for r in
               self.database.fetch(
                   self.config['database'], p_sql.BOARD_COUNT,
                   (self.config['table'], self.config['round']))]
        boards_to_play = int(row[0])
        boards_played = max(int(row[1]), 0)
        if boards_to_play > 0:
            boards_played += int(towels[0])
        return boards_played, boards_to_play

    def __has_segment_link(self, cell):
        """Tell whether ``cell`` links to a segment page (``...NtN-N.htm``)."""
        return any(
            re.match(r'^.*\d+t\d+-\d+\.htm$', link['href'])
            for link in cell.select('a[href]'))

    def __has_towel_image(self, cell):
        """Tell whether ``cell`` contains the towel image."""
        return len(cell.select('img[alt="towel"]')) > 0

    def __has_running_board_count(self, cell):
        """Tell whether ``cell`` contains the "running..." image."""
        return len(cell.select('img[alt="running..."]')) > 0

    def __get_html_running_boards(self, cell):
        """Return the number held by the last text node of ``cell``."""
        return int(cell.contents[-1].strip())

    def __get_finished_info(self, cell):
        """Inspect the segment page linked from ``cell``.

        Rows containing an ``a.zb`` link are counted as boards; a board is
        considered played when its ``td.bdn``/``td.bde`` cells hold any text.

        :returns: ``(board_count, is_finished)``; ``(0, False)`` when the
            cell has no link or the segment page cannot be downloaded.
        """
        segment_link = cell.select('a[href]')
        if len(segment_link) == 0:
            return 0, False
        segment_url = re.sub(
            r'\.htm$', '.html',
            urljoin(self.info.link, segment_link[0]['href']))
        try:
            segment_content = bs(self.__fetch_url(segment_url), 'lxml')
        except IOError:
            return 0, False
        board_rows = [
            board_row for board_row in segment_content.find_all('tr')
            if len(board_row.select('a.zb')) > 0]
        board_count = len(board_rows)
        played_boards = 0
        for board_row in board_rows:
            result_cells = (
                board_row.select('td.bdn') + board_row.select('td.bde'))
            result_text = ''.join(
                [result_cell.text.strip() for result_cell in result_cells])
            if len(result_text) > 0:
                played_boards += 1
        return board_count, played_boards >= board_count

    def __get_html_board_count(self):
        """Return ``(boards_played, boards_to_play)`` from the results page.

        The segment length is taken from the first non-running segment page
        that lists any boards and is assumed to be the same for every
        segment of the match.

        :raises ValueError: when the table row, the segments or the segment
            length cannot be determined.
        """
        row = self.__find_table_row(self.info.link)
        if row is None:
            raise ValueError('table row not found')
        cells = row.select('td.bdc')
        segments = [cell for cell in cells if self.__has_segment_link(cell)]
        towels = [cell for cell in cells if self.__has_towel_image(cell)]
        if len(segments) == 0:
            if len(towels) > 0:
                return 1, 1  # entire match is toweled, so mark as finished
            raise ValueError('segments not found')
        running_segments = [
            cell for cell in row.select('td.bdca')
            if self.__has_running_board_count(cell)]
        running_boards = sum(
            [self.__get_html_running_boards(segment)
             for segment in running_segments])
        finished_segments = []
        boards_in_segment = None
        for segment in segments:
            if segment in running_segments:
                continue
            boards, is_finished = self.__get_finished_info(segment)
            if is_finished:
                finished_segments.append(segment)
            if boards_in_segment is None and boards > 0:
                boards_in_segment = boards
        if boards_in_segment is None:
            # Fail explicitly instead of through ``int * None``; the caller
            # handles both error types the same way.
            raise ValueError('segment board count not found')
        total_boards = (
            len(segments) + len(towels) + len(running_segments)
        ) * boards_in_segment
        played_boards = (
            len(towels) + len(finished_segments)
        ) * boards_in_segment + running_boards
        return played_boards, total_boards

    def __fetch_board_count(self):
        """Update ``info.running`` from the board counts, if available.

        The database is consulted first and the HTML page second.  When
        neither source yields a positive number of played boards the
        current ``running`` value is kept.
        """
        boards_played = 0
        boards_to_play = 0
        counted = False
        if self.__has_database():
            try:
                boards_played, boards_to_play = self.__get_db_board_count()
                counted = True
            except (mysql.connector.Error, TypeError, IndexError, KeyError):
                # database lookup failed, fall back to the HTML page
                pass
        if not counted:
            try:
                boards_played, boards_to_play = self.__get_html_board_count()
            except (TypeError, IndexError, KeyError, IOError, ValueError):
                # best effort only: progress simply stays unknown
                pass
        if boards_played > 0:
            if boards_played >= boards_to_play:
                self.info.running = -1
            else:
                self.info.running = boards_played

    def __determine_outcome(self):
        """Set winner and loser once the match is complete.

        The first team wins only with a strictly higher score; on equal
        scores the second team is recorded as the winner.
        """
        if self.info.running != -1:
            return
        first, second = self.info.teams[0], self.info.teams[1]
        if first.score > second.score:
            self.info.winner = first.name
            self.info.loser = second.name
        else:
            self.info.loser = first.name
            self.info.winner = second.name

    def __get_db_running_link(self, prefix, round_no):
        """Build the link to the current segment page using the database."""
        current_segment = int(
            self.database.fetch(
                self.config['database'], p_sql.CURRENT_SEGMENT, ())[0])
        return '%s%st%d-%d.html' % (
            prefix, round_no, self.config['table'], current_segment)

    def __get_html_running_link(self):
        """Return the absolute link found in the ``td.bdcg`` cell of the row.

        :raises ValueError: when the table row or the link is missing.
        """
        row = self.__find_table_row(self.info.link)
        if row is None:
            raise ValueError('table row not found')
        running_link = row.select('td.bdcg a[href]')
        if len(running_link) == 0:
            raise ValueError('running link not found')
        return urljoin(self.info.link, running_link[0]['href'])

    def __determine_running_link(self):
        """Point the match link at the segment currently being played.

        Only links of the form ``...runda<N>.html`` are rewritten; when
        neither the database nor the HTML page yields a segment link the
        current link is kept.
        """
        if self.info.link is None:
            return
        link_match = re.match(r'^(.*)runda(\d+)\.html$', self.info.link)
        if not link_match:
            return
        if self.__has_database():
            try:
                self.info.link = self.__get_db_running_link(
                    link_match.group(1), link_match.group(2))
                return
            except (mysql.connector.Error, TypeError, IndexError, KeyError):
                # database lookup failed, fall back to the HTML page
                pass
        try:
            self.info.link = self.__get_html_running_link()
        except (TypeError, IndexError, KeyError, IOError, ValueError):
            # best effort only: keep the round link
            pass

    def set_phase_link(self, phase_link):
        """Resolve the match link against the link of its phase.

        A missing link is replaced by ``phase_link``, the placeholder ``#``
        is kept as is and any other link is joined onto ``phase_link``.
        """
        if self.info.link is None:
            self.info.link = phase_link
        elif self.info.link != '#':
            self.info.link = urljoin(phase_link, self.info.link)

    def get_info(self):
        """Collect teams, progress, outcome and link; return the match."""
        self.__fetch_teams_with_scores()
        self.__fetch_board_count()
        self.__determine_outcome()
        if self.info.running > 0:
            self.__determine_running_link()
        return self.info
|