add url patterns and fix encoding issues
This commit is contained in:
parent
cdca302efd
commit
9cba3c63a0
1 changed file with 2 additions and 1 deletion
|
|
@@ -26,8 +26,9 @@ from .tools import id2url
|
||||||
|
|
||||||
class Newspaper20minutesBrowser(BaseBrowser):
|
class Newspaper20minutesBrowser(BaseBrowser):
|
||||||
"Newspaper20minutesBrowser class"
|
"Newspaper20minutesBrowser class"
|
||||||
|
ENCODING = None
|
||||||
PAGES = {
|
PAGES = {
|
||||||
'http://www.20minutes.fr/article/?.*': ArticlePage,
|
'http://www.20minutes.fr/(?!preums|ledirect).+/?.*': ArticlePage,
|
||||||
'http://www.20minutes.fr/ledirect/?.*': SimplePage,
|
'http://www.20minutes.fr/ledirect/?.*': SimplePage,
|
||||||
'http://www.20minutes.fr/preums/?.*': SimplePage
|
'http://www.20minutes.fr/preums/?.*': SimplePage
|
||||||
}
|
}
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue