fix double with hidden photos finder
This commit is contained in:
parent
384280c0df
commit
fb01c73028
1 changed files with 11 additions and 7 deletions
|
|
@ -273,13 +273,6 @@ class ProfilePage(PageBase):
|
||||||
if m:
|
if m:
|
||||||
self.photos.append(dict(url=re.sub(u'thumb[0-2]_', u'image', div.getAttribute('background')),
|
self.photos.append(dict(url=re.sub(u'thumb[0-2]_', u'image', div.getAttribute('background')),
|
||||||
hidden=False))
|
hidden=False))
|
||||||
photo_regex = re.compile('(?P<base_url>http://.+\.adopteunmec\.com/.+/)image(?P<id>.+)\.jpg')
|
|
||||||
photo_max_id = max(int(photo_regex.match(photo['url']).groupdict()['id']) for photo in self.photos)
|
|
||||||
base_url = photo_regex.match(self.photos[0]['url']).groupdict()['base_url']
|
|
||||||
for id in xrange(1, photo_max_id + 1):
|
|
||||||
url = '%simage%s.jpg' % (base_url, id)
|
|
||||||
if not url in [photo['url'] for photo in self.photos]:
|
|
||||||
self.photos.append(dict(url=url, hidden=True))
|
|
||||||
if div.hasAttribute('width') and str(div.getAttribute('width')) == '226':
|
if div.hasAttribute('width') and str(div.getAttribute('width')) == '226':
|
||||||
trs = div.getElementsByTagName('tr')
|
trs = div.getElementsByTagName('tr')
|
||||||
for tr in trs:
|
for tr in trs:
|
||||||
|
|
@ -317,6 +310,17 @@ class ProfilePage(PageBase):
|
||||||
if self.id:
|
if self.id:
|
||||||
break
|
break
|
||||||
|
|
||||||
|
if len(self.photos) == 0:
|
||||||
|
return
|
||||||
|
|
||||||
|
# find hidden photos.
|
||||||
|
photo_regex = re.compile('(?P<base_url>http://.+\.adopteunmec\.com/.+/)image(?P<id>.+)\.jpg')
|
||||||
|
photo_max_id = max(int(photo_regex.match(photo['url']).groupdict()['id']) for photo in self.photos)
|
||||||
|
base_url = photo_regex.match(self.photos[0]['url']).groupdict()['base_url']
|
||||||
|
for id in xrange(1, photo_max_id + 1):
|
||||||
|
if not url in [photo['url'] for photo in self.photos]:
|
||||||
|
self.photos.append(dict(url=url, hidden=True))
|
||||||
|
|
||||||
def parse_description(self, div):
|
def parse_description(self, div):
|
||||||
# look for description
|
# look for description
|
||||||
|
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue