[monster] improve page parsing

This commit is contained in:
Bezleputh 2015-02-23 09:38:01 +01:00 committed by Romain Bignon
commit 4d59d1f9ea
2 changed files with 5 additions and 5 deletions

View file

@@ -71,8 +71,8 @@ class AdvertPage(HTMLPage):
obj_id = Env('_id')
obj_url = BrowserURL('advert', _id=Env('_id'))
-obj_title = CleanText('//div[@id="jobcopy"]/h1[@itemprop="title"]')
-obj_description = CleanHTML('//div[@id="jobBodyContent"]')
+obj_title = CleanText('//div[@id="jobcopy"]/h1[@itemprop="title"]|//div[@itemprop="title"]/h1')
+obj_description = CleanHTML('//div[@id="jobBodyContent"]|//div[@itemprop="description"]')
obj_contract_type = Join('%s ', '//dd[starts-with(@class, "multipledd")]')
obj_society_name = CleanText('//dd[@itemprop="hiringOrganization"]')
obj_place = CleanText('//span[@itemprop="jobLocation"]')