weboob-devel/modules/transilien/pages.py
Romain Bignon d61e15cf84 rename things related to browsers
weboob.tools.browser -> weboob.deprecated.browser
weboob.tools.parsers -> weboob.deprecated.browser.parsers
weboob.tools.mech -> weboob.deprecated.mech
weboob.browser2 -> weboob.browser
weboob.core.exceptions -> weboob.exceptions

Also, the new tree for browser2 is:

weboob.browser: import weboob.browser.browsers.* and weboob.browser.url.*
weboob.browser.browsers: all browsers (including PagesBrowser and LoginBrowser)
weboob.browser.url: the URL class
weboob.browser.profiles: all Profile classes
weboob.browser.sessions: WeboobSession and FuturesSession
weboob.browser.cookies: that's a cookies thing
weboob.browser.pages: all Page and derivated classes, and Form class
weboob.browser.exceptions: specific browser exceptions
weboob.browser.elements: AbstractElement classes, and 'method' decorator
weboob.browser.filters.*: all filters
2014-10-07 00:30:07 +02:00

176 lines
6.7 KiB
Python

# -*- coding: utf-8 -*-
# Copyright(C) 2010-2011 Julien Hébert, Romain Bignon
# Copyright(C) 2014 Benjamin Carton
#
# This file is part of weboob.
#
# weboob is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# weboob is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Affero General Public License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with weboob. If not, see <http://www.gnu.org/licenses/>.
import re
from weboob.browser.pages import JsonPage, HTMLPage
from weboob.browser.elements import TableElement, ItemElement, ListElement, method
from weboob.capabilities.travel import Station, Departure, RoadStep
from weboob.capabilities import NotAvailable
from weboob.browser.filters.standard import CleanText, TableCell, Filter, DateTime, Env, Regexp, Duration
from weboob.browser.filters.json import Dict
from weboob.browser.filters.html import Link
from weboob.tools.date import LinearDateGuesser
class DictElement(ListElement):
def find_elements(self):
if self.item_xpath is not None:
for el in self.el.get(self.item_xpath):
yield el
else:
yield self.el
class RoadMapDuration(Duration):
regexp = re.compile(r'(?P<mn>\d+)')
kwargs = {'minutes': 'mn'}
class DepartureTypeFilter(Filter):
def filter(self, el):
result = []
for img in el[0].getiterator(tag='img'):
result.append(img.attrib['alt'])
return u' '.join(result)
class Child(Filter):
def filter(self, el):
return list(el[0].iterchildren())
class RoadMapPage(HTMLPage):
def request_roadmap(self, station, arrival, arrival_date):
form = self.get_form('//form[@id="cRechercheItineraire"]')
form['depart'] = station
form['arrivee'] = arrival
form.submit()
def get_roadmap(self):
for step in self.doc.xpath('//table[@class="trajet_etapes"]/tr[@class="etape"]'):
roadstep = RoadStep()
roadstep.line = '%s %s' % (DepartureTypeFilter(step.xpath('./td[@class="moyen"]'))(self),
CleanText('./td[@class="moyen"]')(step))
roadstep.start_time = DateTime(CleanText('./th/span[@class="depart"]'),
LinearDateGuesser())(step)
roadstep.end_time = DateTime(CleanText('./th/span[@class="depart"]/following-sibling::span'),
LinearDateGuesser())(step)
roadstep.departure = CleanText('./td[@class="arret"]/p/strong')(step)
roadstep.arrival = CleanText('./td[@class="arret"]/p/following-sibling::p/strong')(step)
roadstep.duration = RoadMapDuration(CleanText('./td[@class="time"]'))(step)
yield roadstep
class HorairesPage(HTMLPage):
def get_departures(self, station, arrival, date):
for table in self.doc.xpath('//table[@class="trajet_horaires trajet_etapes"]'):
lignes = table.xpath('./tr[@class="ligne"]/th')
arrives = table.xpath('./tr[@class="arrivee"]/td')
departs = table.xpath('./tr[@class="depart"]/td')
items = zip(lignes, arrives, departs)
for item in items:
departure = Departure()
departure.id = Regexp(Link('./div/a'), '.*?vehicleJourneyExternalCode=(.*?)&.*?')(item[1])
departure.departure_station = station
departure.arrival_station = arrival
hour, minute = CleanText('./div/a')(item[1]).split('h')
departure.time = date.replace(hour=int(hour), minute=int(minute))
hour, minute = CleanText('./div/a')(item[2]).split('h')
departure.arrival_time = date.replace(hour=int(hour), minute=int(minute))
departure.information = CleanText('.')(item[0])
departure.type = DepartureTypeFilter(item)(self)
yield departure
class StationsPage(JsonPage):
@method
class get_stations(DictElement):
item_xpath = 'gares'
class item(ItemElement):
klass = Station
def condition(self):
if self.env['only_station']:
return Dict('entryPointType')(self.el) == 'StopArea' and Dict('reseau')(self.el)[0]
return True
obj_name = CleanText(Dict('gare'))
obj_id = CleanText(Dict('gare'), replace=[(' ', '-')])
class DeparturesPage2(HTMLPage):
def get_potential_arrivals(self):
arrivals = {}
for el in self.doc.xpath('//select[@id="gare_arrive_ambigu"]/option'):
arrivals[el.text] = el.attrib['value']
return arrivals
def get_station_id(self):
form = self.get_form('//form[@id="cfichehoraire"]')
return form['departExternalCode']
def init_departure(self, station):
form = self.get_form('//form[@id="cfichehoraire"]')
form['depart'] = station
form.submit()
def get_departures(self, arrival, date):
form = self.get_form('//form[@id="cfichehoraire"]')
form['arrive'] = arrival
if date:
form['jourHoraire'] = date.day
form['moiHoraire'] = '%s|%s' % (date.month, date.year)
form['heureHoraire'] = date.hour
form['minuteHoraire'] = date.minute
self.logger.debug(form)
form.submit()
class DeparturesPage(HTMLPage):
@method
class get_departures(TableElement):
head_xpath = u'//table[@class="etat_trafic"][1]/thead/tr/th[@scope="col"]/text()'
item_xpath = u'//table[@class="etat_trafic"]/tr'
col_type = u'Ligne'
col_info = u'Nom du train'
col_time = u'Heure de départ'
col_arrival = u'Destination'
col_plateform = u'Voie/quai'
col_id = u'Gares desservies'
class item(ItemElement):
klass = Departure
def condition(self):
return len(self.el.xpath('./td')) >= 6
obj_time = TableCell('time') & CleanText & DateTime | NotAvailable
obj_type = DepartureTypeFilter(TableCell('type'))
obj_departure_station = CleanText(Env('station'))
obj_arrival_station = CleanText(TableCell('arrival'))
obj_information = TableCell('time') & CleanText & Regexp(pattern='([^\d:]+)') | u''
obj_plateform = CleanText(TableCell('plateform'))
obj_id = Regexp(Link(Child(TableCell('id'))), '.*?numeroTrain=(.*?)&.*?')