[inrocks] do not try to parse premium news pages
This commit is contained in:
parent
a85c73da34
commit
8f31594314
1 changed file with 9 additions and 8 deletions
|
|
@@ -28,7 +28,8 @@ class ArticlePage(GenericNewsPage):
|
||||||
"ArticlePage object for inrocks"
|
"ArticlePage object for inrocks"
|
||||||
|
|
||||||
def on_loaded(self):
|
def on_loaded(self):
|
||||||
self.main_div = self.document.getroot()
|
main = self.parser.select(self.document.getroot(), "div#content")
|
||||||
|
self.main_div = main[0] if len(main) else None
|
||||||
self.element_title_selector = "h1"
|
self.element_title_selector = "h1"
|
||||||
self.element_author_selector = "div.name>span"
|
self.element_author_selector = "div.name>span"
|
||||||
self.element_body_selector = "div.maincol"
|
self.element_body_selector = "div.maincol"
|
||||||
|
|
@@ -37,7 +38,7 @@ class ArticlePage(GenericNewsPage):
|
||||||
try:
|
try:
|
||||||
element_body = self.get_element_body()
|
element_body = self.get_element_body()
|
||||||
except NoneMainDiv:
|
except NoneMainDiv:
|
||||||
return None
|
return u'Ceci est un article payant'
|
||||||
else:
|
else:
|
||||||
div_header_element = self.parser.select(element_body, "div.header", 1)
|
div_header_element = self.parser.select(element_body, "div.header", 1)
|
||||||
element_detail = self.parser.select(element_body, "div.details", 1)
|
element_detail = self.parser.select(element_body, "div.details", 1)
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue