# -*- coding: utf-8 -*- # Copyright(C) 2013 Bezleputh # # This file is part of weboob. # # weboob is free software: you can redistribute it and/or modify # it under the terms of the GNU Affero General Public License as published by # the Free Software Foundation, either version 3 of the License, or # (at your option) any later version. # # weboob is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU Affero General Public License for more details. # # You should have received a copy of the GNU Affero General Public License # along with weboob. If not, see . from weboob.tools.browser import BasePage import dateutil.parser from .job import PopolemploiJobAdvert __all__ = ['SearchPage', 'AdvertPage'] class SearchPage(BasePage): def iter_job_adverts(self): rows = self.document.getroot().xpath('//table[@class="definition-table ordered"]/tbody/tr') for row in rows: advert = self.create_job_advert(row) if advert: yield advert def create_job_advert(self, row): a = self.parser.select(row, 'td[@headers="offre"]/a', 1, method='xpath') _id = u'%s' % (a.attrib['href'][-7:]) if _id: advert = PopolemploiJobAdvert(_id) advert.contract_type = u'%s' % self.parser.select(row, 'td[@headers="contrat"]', 1, method='xpath').text advert.title = u'%s' % a.text_content().strip() society = self.parser.select(row, 'td/div/p/span[@class="company"]', method='xpath') if society: advert.society_name = society[0].text advert.place = u'%s' % self.parser.select(row, 'td[@headers="lieu"]', 1, method='xpath').text_content() date = self.parser.select(row, 'td[@headers="dateEmission"]', 1, method='xpath') advert.publication_date = dateutil.parser.parse(date.text).date() return advert class AdvertPage(BasePage): def get_job_advert(self, url, advert): content = self.document.getroot().xpath('//div[@class="block-content"]/div')[0] if not advert: _id = self.parser.select(content, 'ul/li/ul/li/div[@class="value"]/span', 1, method='xpath').text advert = PopolemploiJobAdvert(_id) print url advert.title = u'%s' % self.parser.select(content, 'h4', 1, method='xpath').text.strip() advert.job_name = u'%s' % self.parser.select(content, 'h4', 1, method='xpath').text.strip() advert.description = u'%s' % self.parser.select(content, 'p[@itemprop="description"]', 1, method='xpath').text society_name = self.parser.select(content, 'div[@class="vcard"]/p[@class="title"]/span', method='xpath') if society_name: advert.society_name = u'%s' % society_name[0].text advert.url = url advert.place = u'%s' % self.parser.select(content, 'ul/li/div[@class="value"]/ul/li[@itemprop="addressRegion"]', 1, method='xpath').text.strip() advert.contract_type = u'%s' % self.parser.select(content, 'ul/li/div[@class="value"]/span[@itemprop="employmentType"]', 1, method='xpath').text.strip() advert.experience = u'%s' % self.parser.select(content, 'ul/li/div[@class="value"]/span[@itemprop="experienceRequirements"]', 1, method='xpath').text.strip() advert.formation = u'%s' % self.parser.select(content, 'ul/li/div[@class="value"]/span[@itemprop="qualifications"]', 1, method='xpath').text.strip() advert.pay = u'%s' % self.parser.select(content, 'ul/li/div[@class="value"]/span[@itemprop="baseSalary"]', 1, method='xpath').text.strip() return advert