|
@@ 2223-2242 (lines=20) @@
|
| 2220 |
|
name = 'anythingcomic' |
| 2221 |
|
long_name = 'Anything Comic' |
| 2222 |
|
url = 'http://www.anythingcomic.com' |
| 2223 |
|
|
| 2224 |
|
@classmethod |
| 2225 |
|
def get_archive_elements(cls): |
| 2226 |
|
archive_url = urljoin_wrapper(cls.url, 'archive/') |
| 2227 |
|
# The first 2 <tr>'s do not correspond to comics |
| 2228 |
|
return get_soup_at_url(archive_url).find('table', id='chapter_table').find_all('tr')[2:] |
| 2229 |
|
|
| 2230 |
|
@classmethod |
| 2231 |
|
def get_url_from_archive_element(cls, tr): |
| 2232 |
|
"""Get url corresponding to an archive element.""" |
| 2233 |
|
td_num, td_comic, td_date, _ = tr.find_all('td') |
| 2234 |
|
link = td_comic.find('a') |
| 2235 |
|
return urljoin_wrapper(cls.url, link['href']) |
| 2236 |
|
|
| 2237 |
|
@classmethod |
| 2238 |
|
def get_comic_info(cls, soup, tr): |
| 2239 |
|
"""Get information about a particular comics.""" |
| 2240 |
|
td_num, td_comic, td_date, _ = tr.find_all('td') |
| 2241 |
|
num = int(td_num.string) |
| 2242 |
|
link = td_comic.find('a') |
| 2243 |
|
title = link.string |
| 2244 |
|
imgs = soup.find_all('img', id='comic_image') |
| 2245 |
|
date_str = td_date.string |
|
@@ 1914-1932 (lines=19) @@
|
| 1911 |
|
|
| 1912 |
|
class InvisibleBread(GenericListableComic): |
| 1913 |
|
"""Class to retrieve Invisible Bread comics.""" |
| 1914 |
|
# Also on http://www.gocomics.com/invisible-bread |
| 1915 |
|
name = 'invisiblebread' |
| 1916 |
|
long_name = 'Invisible Bread' |
| 1917 |
|
url = 'http://invisiblebread.com' |
| 1918 |
|
|
| 1919 |
|
@classmethod |
| 1920 |
|
def get_archive_elements(cls): |
| 1921 |
|
archive_url = urljoin_wrapper(cls.url, 'archives/') |
| 1922 |
|
return reversed(get_soup_at_url(archive_url).find_all('td', class_='archive-title')) |
| 1923 |
|
|
| 1924 |
|
@classmethod |
| 1925 |
|
def get_url_from_archive_element(cls, td): |
| 1926 |
|
return td.find('a')['href'] |
| 1927 |
|
|
| 1928 |
|
@classmethod |
| 1929 |
|
def get_comic_info(cls, soup, td): |
| 1930 |
|
"""Get information about a particular comics.""" |
| 1931 |
|
url = cls.get_url_from_archive_element(td) |
| 1932 |
|
title = td.find('a').string |
| 1933 |
|
month_and_day = td.previous_sibling.string |
| 1934 |
|
link_re = re.compile('^%s/([0-9]+)/' % cls.url) |
| 1935 |
|
year = link_re.match(url).groups()[0] |