From 0c04db0b185754bde339c209450027a7d2fa5fb1 Mon Sep 17 00:00:00 2001 From: Juke Date: Mon, 14 Mar 2011 00:58:50 +0100 Subject: [PATCH] fix buildbot fail on inrockstv (closes #544) --- weboob/backends/inrocks/browser.py | 5 ++- weboob/backends/inrocks/pages/inrockstv.py | 36 ++++++++++++++++++++++ 2 files changed, 40 insertions(+), 1 deletion(-) create mode 100644 weboob/backends/inrocks/pages/inrockstv.py diff --git a/weboob/backends/inrocks/browser.py b/weboob/backends/inrocks/browser.py index 78472d43..110b4d98 100644 --- a/weboob/backends/inrocks/browser.py +++ b/weboob/backends/inrocks/browser.py @@ -17,6 +17,7 @@ # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. from .pages.article import ArticlePage +from .pages.inrockstv import InrocksTvPage from weboob.tools.browser import BaseBrowser @@ -24,7 +25,9 @@ from weboob.tools.browser import BaseBrowser class NewspaperInrocksBrowser(BaseBrowser): "NewspaperInrocksBrowser class" PAGES = { - '.*': ArticlePage, + 'http://www.lesinrocks.com/actualite/.*': ArticlePage, + 'http://www.lesinrocks.com/inrockstv/.*': InrocksTvPage, + 'http://blogs.lesinrocks.com/.*': ArticlePage, } def is_logged(self): diff --git a/weboob/backends/inrocks/pages/inrockstv.py b/weboob/backends/inrocks/pages/inrockstv.py new file mode 100644 index 00000000..8ba686e4 --- /dev/null +++ b/weboob/backends/inrocks/pages/inrockstv.py @@ -0,0 +1,36 @@ +"ArticlePage object for inrocks" +# -*- coding: utf-8 -*- + +# Copyright(C) 2011 Julien Hebert +# +# This program is free software; you can redistribute it and/or modify +# it under the terms of the GNU General Public License as published by +# the Free Software Foundation, version 3 of the License. +# +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. 
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
+
+from weboob.tools.parsers.lxmlparser import select, SelectElementException
+from weboob.tools.genericArticle import GenericNewsPage, try_remove, \
+    try_remove_from_selector_list, \
+    drop_comments, NoneMainDiv
+
+
+class InrocksTvPage(GenericNewsPage):
+    """Page object for lesinrocks.com inrockstv pages."""
+    def on_loaded(self):
+        """Take the document root as main_div and set the element selectors."""
+        self.main_div = self.document.getroot()
+        self.element_body_selector = "span.infos"
+        self.element_author_selector = "div.name>span"
+        self.element_title_selector = "h2"
+
+    def get_body(self):
+        """Return parser.tostring() of the element from get_element_body()."""
+        return self.browser.parser.tostring(self.get_element_body())