@@ 2999-3035 (lines=37) @@ | ||
2996 | 'short_url': short_url, |
|
2997 | 'num': num, |
|
2998 | 'img': [i['src'] for i in imgs], |
|
2999 | 'month': day.month, |
|
3000 | 'year': day.year, |
|
3001 | 'day': day.day, |
|
3002 | 'title': title, |
|
3003 | 'tags': tags, |
|
3004 | 'alt': alt, |
|
3005 | 'author': author, |
|
3006 | } |
|
3007 | ||
3008 | ||
class SystemComic(GenericNavigableComic):
    """Retriever for the System Comic webcomic."""

    name = 'system'
    long_name = 'System Comic'
    url = 'http://www.systemcomic.com'
    get_navi_link = get_a_rel_next

    @classmethod
    def get_first_comic_link(cls):
        """Return the anchor found inside the 'first' list item of the home page."""
        home_page = get_soup_at_url(cls.url)
        first_item = home_page.find('li', class_='first')
        return first_item.find('a')

    @classmethod
    def get_comic_info(cls, soup, link):
        """Build the info dictionary describing the comic held in `soup`.

        Title and description are read from the Open Graph meta tags, the
        date from the `datetime` attribute of the first `time` tag and the
        image URLs from the `img` tags of the first `figure` tag.
        """
        info = {
            'title': soup.find('meta', property='og:title')['content'],
            'description': soup.find('meta', property='og:description')['content'],
        }
        published = string_to_date(soup.find('time')["datetime"], "%Y-%m-%d")
        pictures = soup.find('figure').find_all('img')
        # Keys are added in the same order as the historical dict literal.
        info['day'] = published.day
        info['month'] = published.month
        info['year'] = published.year
        info['img'] = [picture['src'] for picture in pictures]
        return info
3037 | ||
3038 | ||
@@ 782-816 (lines=35) @@ | ||
779 | get_navi_link = get_link_rel_next |
|
780 | get_url_from_link = join_cls_url_to_href |
|
781 | ||
@classmethod
def get_comic_info(cls, soup, link):
    """Get information about a particular comics.

    The comic number is parsed from the page's `shortlink` URL, which is
    expected to look like `<cls.url>/?p=<num>`. The two titles come from
    the `alt` and `title` attributes of the single image found in the
    `div` whose id is `comic`.

    Returns a dict with the keys 'short_url', 'title', 'title2', 'img'
    and 'num'.

    Raises AttributeError when the short URL does not start with the
    expected prefix (the regexp does not match) and AssertionError when
    the comic container does not hold exactly one image.
    """
    # The base URL is escaped so that its dots (and any other regexp
    # metacharacters) are matched literally instead of as wildcards.
    short_url_re = re.compile('^%s/\\?p=([0-9]*)' % re.escape(cls.url))
    short_url = cls.get_url_from_link(soup.find('link', rel='shortlink'))
    num = int(short_url_re.match(short_url).groups()[0])
    imgs = soup.find('div', id='comic').find_all('img')
    # Sanity check on the page layout: exactly one image is expected.
    assert len(imgs) == 1, imgs
    title = imgs[0]['alt']
    title2 = imgs[0]['title']
    return {
        'short_url': short_url,
        'title': title,
        'title2': title2,
        'img': [urljoin_wrapper(cls.url, i['src']) for i in imgs],
        'num': num,
    }
799 | ||
800 | ||
801 | class Garfield(GenericNavigableComic): |
|
802 | """Class to retrieve Garfield comics.""" |
|
803 | # Also on http://www.gocomics.com/garfield |
|
804 | name = 'garfield' |
|
805 | long_name = 'Garfield' |
|
806 | url = 'https://garfield.com' |
|
807 | _categories = ('GARFIELD', ) |
|
808 | get_first_comic_link = simulate_first_link |
|
809 | first_url = 'https://garfield.com/comic/1978/06/19' |
|
810 | ||
@classmethod
def get_navi_link(cls, last_soup, next_):
    """Return the navigation arrow anchor: right for next, left for previous."""
    if next_:
        arrow_class = 'comic-arrow-right'
    else:
        arrow_class = 'comic-arrow-left'
    return last_soup.find('a', class_=arrow_class)
815 | ||
816 | @classmethod |
|
817 | def get_comic_info(cls, soup, link): |
|
818 | """Get information about a particular comics.""" |
|
819 | url = cls.get_url_from_link(link) |