1 # -*- coding: utf-8 -*-
3 from gotovienna.BeautifulSoup import BeautifulSoup
4 from urllib2 import urlopen
5 from datetime import time
9 from gotovienna import defaults
16 def get_stations(self, name):
17 """ Get station by direction
18 {'Directionname': [('Station name', 'url')]}
20 if not self._stations.has_key(name):
23 if not self.lines.has_key(name):
26 bs = BeautifulSoup(urlopen(self.lines[name]))
27 tables = bs.findAll('table', {'class': 'text_10pix'})
29 dir = tables[i].div.contents[-1].strip(' ')
32 for tr in tables[i].findAll('tr', {'onmouseout': 'obj_unhighlight(this);'}):
34 sta.append((tr.a.text, defaults.line_overview + tr.a['href']))
36 sta.append((tr.text.strip(' '), None))
39 self._stations[name] = st
41 return self._stations[name]
45 """ Dictionary of Line names with url as value
48 bs = BeautifulSoup(urlopen(defaults.line_overview))
50 lines = bs.findAll('td', {'class': 'linie'})
54 href = defaults.line_overview + line.a['href']
56 self._lines[line.text] = href
58 self._lines[line.img['alt']] = href
62 def get_departures(self, url):
63 """ Get list of next departures
64 integer if time until next departure
65 time if time of next departure
68 #TODO parse line name and direction for station site parsing
71 # FIXME prevent from calling this method with None
74 bs = BeautifulSoup(urlopen(url))
75 result_lines = bs.findAll('table')[-1].findAll('tr')
78 for tr in result_lines[1:]:
81 #TODO replace with logger
82 print "[DEBUG] Unable to find th in:\n%s" % str(tr)
86 time = th[-2].text.split(' ')
88 #print 'Invalid time: %s' % time
89 # TODO: Issue a warning OR convert "HH:MM" format to countdown
94 if time.find('rze...') >= 0:
97 # if time to next departure in cell convert to int
100 # check if time of next departue in cell
101 t = time.strip(' ').split(':')
102 if len(t) == 2 and all(map(lambda x: x.isdigit(), t)):
107 #TODO replace with logger
108 print "[DEBUG] Invalid data:\n%s" % time
113 UBAHN, TRAM, BUS, NIGHTLINE, OTHER = range(5)
114 LINE_TYPE_NAMES = ['U-Bahn', 'Strassenbahn', 'Bus', 'Nightline', 'Andere']
116 def get_line_sort_key(name):
117 """Return a sort key for a line name
119 >>> get_line_sort_key('U6')
122 >>> get_line_sort_key('D')
125 >>> get_line_sort_key('59A')
128 txt = ''.join(x for x in name if not x.isdigit())
129 num = ''.join(x for x in name if x.isdigit()) or '0'
131 return (txt, int(num))
133 def get_line_type(name):
134 """Get the type of line for the given name
136 >>> get_line_type('U1')
138 >>> get_line_type('59A')
143 elif name.endswith('A') or name.endswith('B') and name[1].isdigit():
145 elif name.startswith('U'):
147 elif name.startswith('N'):
149 elif name in ('D', 'O', 'VRT', 'WLB'):
154 def categorize_lines(lines):
155 """Return a categorized version of a list of line names
157 >>> categorize_lines(['U4', 'U3', '59A'])
158 [('U-Bahn', ['U3', 'U4']), ('Bus', ['59A'])]
160 categorized_lines = collections.defaultdict(list)
162 for line in sorted(lines):
163 line_type = get_line_type(line)
164 categorized_lines[line_type].append(line)
166 for lines in categorized_lines.values():
167 lines.sort(key=get_line_sort_key)
169 return [(LINE_TYPE_NAMES[key], categorized_lines[key])
170 for key in sorted(categorized_lines)]