@@ 1431-1457 (lines=27) @@ | ||
1428 | } |
|
1429 | ||
1430 | ||
class ButterSafe(GenericListableComic):
    """Class to retrieve Butter Safe comics.

    Comics are discovered through the links of the site's ``archive/`` page
    whose href has the form ``<url>/<number>/<number>/<number>/<rest>``; the
    three numbers are read as year, month and day.
    """
    name = 'butter'
    long_name = 'ButterSafe'
    url = 'http://buttersafe.com'
    get_url_from_archive_element = get_href
    # The site URL is escaped so that its '.' only matches a literal dot, and
    # each date component requires at least one digit so that the int()
    # conversion in get_comic_info can never receive an empty string.
    comic_link_re = re.compile(
        '^%s/([0-9]+)/([0-9]+)/([0-9]+)/.*' % re.escape(url))

    @classmethod
    def get_archive_elements(cls):
        """Get the archive links to the comics, in reverse page order."""
        archive_url = urljoin_wrapper(cls.url, 'archive/')
        archive_soup = get_soup_at_url(archive_url)
        return reversed(archive_soup.find_all('a', href=cls.comic_link_re))

    @classmethod
    def get_comic_info(cls, soup, link):
        """Get information about a particular comics.

        soup is the parsed page of the comic and link is the archive
        element it was reached from. Returns a dict with the keys 'title',
        'day', 'month', 'year' and 'img' (a one-element list holding the
        comic image source).
        """
        url = cls.get_url_from_archive_element(link)
        title = link.string
        # The publication date is taken from the URL itself.
        year, month, day = (int(s) for s in cls.comic_link_re.match(url).groups())
        img = soup.find('div', id='comic').find('img')
        # Sanity check: the image found on the page is expected to be
        # labelled with the title shown in the archive.
        assert img['alt'] == title
        return {
            'title': title,
            'day': day,
            'month': month,
            'year': year,
            'img': [img['src']],
        }
|
1459 | ||
1460 | ||
@@ 2427-2451 (lines=25) @@ | ||
2424 | } |
|
2425 | ||
2426 | ||
class JuliasDrawings(GenericListableComic):
    """Class to retrieve Julia's Drawings."""
    name = 'julia'
    long_name = "Julia's Drawings"
    url = 'https://drawings.jvns.ca'
    get_url_from_archive_element = get_href

    @classmethod
    def get_archive_elements(cls):
        """Get the links found in the 'drawings' div of the main page, reversed."""
        main_page = get_soup_at_url(cls.url)
        drawings = main_page.find('div', class_='drawings')
        return reversed(drawings.find_all('a'))

    @classmethod
    def get_comic_info(cls, soup, archive_elt):
        """Collect title, images and publication date from a drawing page."""
        # Only the first 10 characters (the "%Y-%m-%d" part) of the
        # published-time metadata are parsed.
        published = soup.find('meta', property='og:article:published_time')
        post_date = string_to_date(published['content'][:10], "%Y-%m-%d")
        title = soup.find('h3', class_='p-post-title').string
        content = soup.find('section', class_='post-content')
        # Image sources are joined with the site URL.
        img_urls = [
            urljoin_wrapper(cls.url, tag['src'])
            for tag in content.find_all('img')
        ]
        return {
            'title': title,
            'img': img_urls,
            'month': post_date.month,
            'year': post_date.year,
            'day': post_date.day,
        }
|
2453 | ||
2454 | ||
@@ 1497-1519 (lines=23) @@ | ||
1494 | last_date = comic_date |
|
1495 | ||
1496 | ||
class AbstruseGoose(GenericListableComic):
    """Class to retrieve AbstruseGoose Comics.

    Comics are discovered through the links of the site's ``archive`` page
    whose href is ``<url>/<number>``; that number is used as the comic
    number.
    """
    name = 'abstruse'
    long_name = 'Abstruse Goose'
    url = 'http://abstrusegoose.com'
    get_url_from_archive_element = get_href
    # The site URL is escaped so that its '.' only matches a literal dot.
    # At least one digit is required so that a bare '<url>/' link is not
    # mistaken for a comic (int('') would raise in get_comic_info).
    comic_url_re = re.compile('^%s/([0-9]+)$' % re.escape(url))
    comic_img_re = re.compile('^%s/strips/.*' % re.escape(url))

    @classmethod
    def get_archive_elements(cls):
        """Get the archive links to the comics, in page order."""
        archive_url = urljoin_wrapper(cls.url, 'archive')
        return get_soup_at_url(archive_url).find_all('a', href=cls.comic_url_re)

    @classmethod
    def get_comic_info(cls, soup, archive_elt):
        """Get information about a particular comics.

        soup is the parsed page of the comic and archive_elt is the archive
        element it was reached from. Returns a dict with the keys 'num',
        'title' and 'img' (the sources of every image on the page whose
        src matches comic_img_re).
        """
        comic_url = cls.get_url_from_archive_element(archive_elt)
        num = int(cls.comic_url_re.match(comic_url).group(1))
        imgs = soup.find_all('img', src=cls.comic_img_re)
        return {
            'num': num,
            'title': archive_elt.string,
            'img': [i['src'] for i in imgs],
        }
|
1521 | ||
1522 |