bnporc: Add support for some broken messages
This commit is contained in:
parent
e7f6086916
commit
a84fde80e6
1 changed file with 8 additions and 3 deletions
|
|
@ -18,7 +18,7 @@
|
||||||
# along with weboob. If not, see <http://www.gnu.org/licenses/>.
|
# along with weboob. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
|
||||||
|
|
||||||
from weboob.tools.browser import BasePage
|
from weboob.tools.browser import BasePage, BrokenPageError
|
||||||
from weboob.capabilities.messages import Message, Thread
|
from weboob.capabilities.messages import Message, Thread
|
||||||
from weboob.capabilities.base import NotLoaded
|
from weboob.capabilities.base import NotLoaded
|
||||||
from weboob.tools.capabilities.messages.genericArticle import try_drop_tree
|
from weboob.tools.capabilities.messages.genericArticle import try_drop_tree
|
||||||
|
|
@ -70,8 +70,13 @@ class MessagePage(BasePage):
|
||||||
This page has a date, but it is less precise than the main list page,
|
This page has a date, but it is less precise than the main list page,
|
||||||
so we only use it for the message content.
|
so we only use it for the message content.
|
||||||
"""
|
"""
|
||||||
content = self.parser.select(self.document.getroot(),
|
try:
|
||||||
'div.txtMessage div.contenu', 1)
|
content = self.parser.select(self.document.getroot(),
|
||||||
|
'div.txtMessage div.contenu', 1)
|
||||||
|
except BrokenPageError:
|
||||||
|
# This happens with some old messages (2007)
|
||||||
|
content = self.parser.select(self.document.getroot(), 'div.txtMessage', 1)
|
||||||
|
|
||||||
content = make_links_absolute(content, self.url)
|
content = make_links_absolute(content, self.url)
|
||||||
try_drop_tree(self.parser, content, 'script')
|
try_drop_tree(self.parser, content, 'script')
|
||||||
return self.parser.tostring(content)
|
return self.parser.tostring(content)
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue