1 # -*- coding: utf-8 -*-
3 from gotovienna.BeautifulSoup import BeautifulSoup
4 #from urllib2 import urlopen
5 from urllib import quote_plus
6 from UrlOpener import urlopen
7 from datetime import time, datetime, timedelta
10 from errors import LineNotFoundError, StationNotFoundError
12 from cache import Stations
13 from time import sleep
15 from gotovienna import defaults
17 class Departure(dict):
18 def __init__(self, line, station, direction, time, lowfloor):
20 self['station'] = station
21 self['direction'] = direction
23 self['lowfloor'] = lowfloor
25 def __getitem__(self, *args, **kwargs):
26 if args[0] == 'ftime':
28 elif args[0] == 'deltatime':
29 return self.departure_deltatime
30 elif args[0] == 'atime':
31 return self.departure_time
32 return dict.__getitem__(self, *args, **kwargs)
35 def departure_time(self):
36 """ return time object of departure time
38 if type(self['time']) == time:
41 return (datetime.now() + timedelta(self['time'])).time()
44 def departure_deltatime(self):
45 """ return int representing minutes until departure
47 if type(self['time']) == int:
50 raise NotImplementedError()
54 if type(self['time']) == int:
55 return str(self['time'])
56 elif type(self['time']) == time:
57 return self['time'].strftime('%H:%M')
61 self._lines = cache.lines
63 def get_stations(self, name):
64 """ Get station by direction
65 {'Directionname': [('Station name', 'url')]}
67 if not name in self.lines:
73 bs = BeautifulSoup(urlopen(self.lines[name]))
74 tables = bs.findAll('table', {'class': 'text_10pix'})
76 dir = tables[i].div.contents[-1].strip()[6:-6]
79 for tr in tables[i].findAll('tr', {'onmouseout': 'obj_unhighlight(this);'}):
81 sta.append((tr.a.text, defaults.line_overview + tr.a['href']))
83 sta.append((tr.text.strip(' '), None))
91 """ Dictionary of Line names with url as value
94 bs = BeautifulSoup(urlopen(defaults.line_overview))
96 lines = bs.findAll('td', {'class': 'linie'})
100 href = defaults.line_overview + line.a['href']
102 self._lines[line.text] = href
104 self._lines[line.img['alt']] = href
108 def get_url_from_direction(self, line, direction, station):
109 stations = self.get_stations(line)
111 for stationname, url in stations.get(direction, []):
112 if stationname == station:
117 def get_departures_by_station(self, station):
118 """ Get list of Departures for one station
121 # TODO 1. Error handling
122 # TODO 2. more error handling
123 # TODO 3. ultimative error handling
126 bs = BeautifulSoup(urlopen(defaults.departures_by_station % quote_plus(station.encode('UTF-8'))))
128 li = bs.ul.findAll('li')
130 # Dirty workaround for ambiguous station
131 bs = BeautifulSoup(urlopen(defaults.qando + li[0].a['href']))
132 li = bs.ul.findAll('li')
137 if d.find('»') == -1:
140 direction = d.replace('»', '').strip()
141 if direction.startswith('NICHT EINSTEIGEN'):
145 for span in l.findAll('span'):
146 if span.text.isdigit():
148 elif span.text.find(':') >= 0:
149 tim = time(*map(int, span.text.split(':')))
151 print 'Warning: %s' % span.text
154 if span['class'] == 'departureBarrierFree':
159 dep.append(Departure(line, station, direction, tim, lowfloor))
162 print 'Warning: %s' % l
165 except AttributeError:
166 print 'Error while getting station %s' % station
171 def get_departures(self, url):
172 """ Get list of next departures as Departure object
175 #TODO parse line name and direction for station site parsing
178 # FIXME prevent from calling this method with None
179 print "ERROR empty url"
182 # open url for 90 min timeslot / get departure for next 90 min
184 tries = 2 # try a second time before return empty list
186 bs = BeautifulSoup(urlopen(url + "&departureSizeTimeSlot=90"))
188 lines = bs.find('form', {'name': 'mainform'}).table.findAll('tr')[1]
191 except AttributeError:
193 msg = bs.findAll('span', {'class': 'rot fett'})
194 if len(msg) > 0 and str(msg[0].text).find(u'technischen St') > 0:
195 print 'Temporary problem'
196 print '\n'.join(map(lambda x: x.text.replace(' ', ''), msg))
197 # FIXME Change to error message after fixing qml gui
205 if len(lines.findAll('td', {'class': 'info'})) > 0:
206 station = lines.span.text.replace(' ', '')
207 line = lines.findAll('span')[-1].text.replace(' ', '')
209 station = lines.td.span.text.replace(' ', '')
210 line = lines.find('td', {'align': 'right'}).span.text.replace(' ', '')
212 result_lines = bs.findAll('table')[-1].findAll('tr')
215 for tr in result_lines[1:]:
216 d = {'station': station}
217 th = tr.findAll('th')
220 #TODO replace with logger
221 print "[DEBUG] Unable to find th in:\n%s" % str(tr)
223 # underground site looks different -.-
226 d['direction'] = th[0].text.replace(' ', '')
230 print th[-1].find('img') and th[-1].img.has_key('alt')
231 d['lowfloor'] = th[-1].find('img') and th[-1].img.has_key('alt')
232 d['line'] = th[0].text.replace(' ', '')
233 d['direction'] = th[1].text.replace(' ', '')
236 tim = t.text.split(' ')
238 # print '[WARNING] Invalid time: %s' % time
239 # TODO: Issue a warning OR convert "HH:MM" format to countdown
244 if tim.find('rze...') >= 0:
247 # if time to next departure in cell convert to int
250 # check if time of next departure in cell
251 t = tim.strip(' ').split(':')
252 if len(t) == 2 and all(map(lambda x: x.isdigit(), t)):
257 #TODO replace with logger
258 print "[DEBUG] Invalid data:\n%s" % time
260 dep.append(Departure(**d))
# Line type identifiers. categorize_lines() indexes LINE_TYPE_NAMES with a
# line type, so the order of the names has to follow these values.
UBAHN = 0
TRAM = 1
BUS = 2
NIGHTLINE = 3
OTHER = 4

# Display names, positioned to match the identifiers above.
LINE_TYPE_NAMES = ['U-Bahn', 'Strassenbahn', 'Bus', 'Nightline', 'Andere']
def get_line_sort_key(name):
    """Build the key used to order line names

    The key is a tuple: first the non-digit characters of ``name`` (kept in
    their original order), then all digits of ``name`` read as one integer.
    A name that contains no digit at all gets 0 as its number.

    >>> get_line_sort_key('U6')
    ('U', 6)

    >>> get_line_sort_key('D')
    ('D', 0)

    >>> get_line_sort_key('59A')
    ('A', 59)
    """
    letters = []
    digits = []
    for char in name:
        if char.isdigit():
            digits.append(char)
        else:
            letters.append(char)

    # No digits at all: fall back to 0 so int() never sees an empty string.
    number = int(''.join(digits)) if digits else 0

    return (''.join(letters), number)
285 def get_line_type(name):
286 """Get the type of line for the given name
288 >>> get_line_type('U1')
290 >>> get_line_type('59A')
295 elif name.endswith('A') or name.endswith('B') and name[1].isdigit():
297 elif name.startswith('U'):
299 elif name.startswith('N'):
301 elif name in ('D', 'O', 'VRT', 'WLB'):
def categorize_lines(lines):
    """Group a list of line names by their line type

    Returns a list of ``(type name, line names)`` tuples. The groups are
    ordered by the value get_line_type() returned for them, and the names
    inside each group are ordered with get_line_sort_key(). A type that no
    given line belongs to does not show up in the result.

    >>> categorize_lines(['U4', 'U3', '59A'])
    [('U-Bahn', ['U3', 'U4']), ('Bus', ['59A'])]
    """
    by_type = collections.defaultdict(list)

    # Feed the names in plain sorted order: the per-group sort below is
    # stable, so names sharing a sort key keep this order.
    for name in sorted(lines):
        by_type[get_line_type(name)].append(name)

    result = []
    for line_type in sorted(by_type):
        group = by_type[line_type]
        group.sort(key=get_line_sort_key)
        result.append((LINE_TYPE_NAMES[line_type], group))

    return result