Code Duplication - SylvainDe/ComicBookMaker - Measure and Improve Code Quality continuously with Scrutinizer

Code Duplication Length = 22-26 lines in 6 locations

comics.py 6 locations


        }


class LinsEditions(GenericNavigableComic):
    """Retriever for the L.I.N.S. Editions comics."""
    # Also on http://linscomics.tumblr.com
    # Now on https://warandpeas.com
    name = 'lins'
    long_name = 'L.I.N.S. Editions'
    url = 'https://linsedition.com'
    _categories = ('LINS', )
    get_navi_link = get_link_rel_next
    get_first_comic_link = simulate_first_link
    first_url = 'https://linsedition.com/2011/09/07/l-i-n-s/'

    @classmethod
    def get_comic_info(cls, soup, link):
        """Build the info dictionary for a single comic page.

        The title, the image URLs and the publication date are all read
        from ``<meta>`` tags found in ``soup``; ``link`` is not used.
        """
        title_tag = soup.find('meta', property='og:title')
        comic_title = title_tag['content']
        image_tags = soup.find_all('meta', property='og:image')
        published_tag = soup.find('meta', property='article:published_time')
        # Only the first 10 characters (the "YYYY-MM-DD" part) are parsed.
        published = string_to_date(published_tag['content'][:10], "%Y-%m-%d")
        info = {'title': comic_title}
        info['img'] = [tag['content'] for tag in image_tags]
        info['month'] = published.month
        info['year'] = published.year
        info['day'] = published.day
        return info



        return []


class ExtraFabulousComics(GenericNavigableComic):
    """Class to retrieve Extra Fabulous Comics."""
    name = 'efc'
    long_name = 'Extra Fabulous Comics'
    url = 'http://extrafabulouscomics.com'
    get_first_comic_link = get_a_navi_navifirst
    get_navi_link = get_link_rel_next

    @classmethod
    def get_comic_info(cls, soup, link):
        """Get information about a particular comics.

        Args:
            soup: parsed comic page; must provide ``find`` and ``find_all``.
            link: navigation link that led to the page (unused here).

        Returns:
            A dict with the keys 'title', 'img' (list of image URLs),
            'month', 'year', 'day' and 'prefix' (the title followed by '-').
        """
        # The site URL is escaped so that its '.' characters are matched
        # literally instead of acting as "any character" in the pattern.
        img_src_re = re.compile('^%s/wp-content/uploads/' % re.escape(cls.url))
        imgs = soup.find_all('img', src=img_src_re)
        title = soup.find('meta', property='og:title')['content']
        # Keep only the leading "YYYY-MM-DD" part of the published timestamp.
        date_str = soup.find('meta', property='article:published_time')['content'][:10]
        day = string_to_date(date_str, "%Y-%m-%d")
        return {
            'title': title,
            'img': [i['src'] for i in imgs],
            'month': day.month,
            'year': day.year,
            'day': day.day,
            'prefix': title + '-'
        }



        }


class GenericLeMondeBlog(GenericNavigableComic):
    """Shared base for comics hosted on Le Monde blogs."""
    _categories = ('LEMONDE', 'FRANCAIS')
    get_navi_link = get_link_rel_next
    get_first_comic_link = simulate_first_link
    # Placeholder value; no concrete first URL is defined on this class.
    first_url = NotImplemented

    @classmethod
    def get_comic_info(cls, soup, link):
        """Build the info dictionary for a single blog post.

        Reads the short link, the title, the entry date (parsed with the
        "fr_FR.utf8" locale argument) and the images from ``soup``;
        ``link`` is not used.
        """
        shortlink_tag = soup.find('link', rel='shortlink')
        short_url = shortlink_tag['href']
        post_title = soup.find('meta', property='og:title')['content']
        date_span = soup.find("span", class_="entry-date")
        posted = string_to_date(date_span.string, "%d %B %Y", "fr_FR.utf8")
        image_tags = soup.find_all('meta', property='og:image')
        # Each image address goes through convert_iri_to_plain_ascii_uri.
        image_urls = [
            convert_iri_to_plain_ascii_uri(tag['content'])
            for tag in image_tags
        ]
        return {
            'title': post_title,
            'url2': short_url,
            'img': image_urls,
            'month': posted.month,
            'year': posted.year,
            'day': posted.day,
        }



        }


class SafelyEndangered(GenericNavigableComic):
    """Retriever for the Safely Endangered comics."""
    # Also on http://tumblr.safelyendangered.com
    name = 'endangered'
    long_name = 'Safely Endangered'
    url = 'http://www.safelyendangered.com'
    get_navi_link = get_link_rel_next
    get_first_comic_link = simulate_first_link
    first_url = 'http://www.safelyendangered.com/comic/ignored/'

    @classmethod
    def get_comic_info(cls, soup, link):
        """Build the info dictionary for a single comic page.

        The title and date come from the post header elements, the images
        from the ``div`` whose id is 'comic'; ``link`` is not used.
        """
        post_title = soup.find('h2', class_='post-title').string
        date_span = soup.find('span', class_='post-date')
        posted = string_to_date(date_span.string, '%B %d, %Y')
        comic_div = soup.find('div', id='comic')
        pictures = comic_div.find_all('img')
        # The alternative text of the first image is used for the comic.
        alt_text = pictures[0]['alt']
        # Sanity check: every image has matching 'alt' and 'title' values.
        assert all(pic['alt'] == pic['title'] for pic in pictures)
        sources = [pic['src'] for pic in pictures]
        return {
            'day': posted.day,
            'month': posted.month,
            'year': posted.year,
            'img': sources,
            'title': post_title,
            'alt': alt_text,
        }



        }


class MyExtraLife(GenericNavigableComic):
    """Retriever for the My Extra Life comics."""
    name = 'extralife'
    long_name = 'My Extra Life'
    url = 'http://www.myextralife.com'
    get_navi_link = get_link_rel_next

    @classmethod
    def get_first_comic_link(cls):
        """Return the "first comic" anchor found on the page at ``cls.url``."""
        home_page = get_soup_at_url(cls.url)
        return home_page.find('a', class_='comic_nav_link first_comic_link')

    @classmethod
    def get_comic_info(cls, soup, link):
        """Build the info dictionary for a single comic page.

        Title, date and images are read from elements of ``soup`` selected
        by their CSS class; ``link`` is not used.
        """
        comic_title = soup.find("h1", class_="comic_title").string
        date_span = soup.find("span", class_="comic_date")
        posted = string_to_date(date_span.string, "%B %d, %Y")
        pictures = soup.find_all("img", class_="comic")
        # Sanity check: 'alt' and 'title' of every image equal the title.
        assert all(
            pic['alt'] == pic['title'] == comic_title for pic in pictures
        )
        # Images whose 'src' value is empty are left out.
        sources = [pic['src'] for pic in pictures if pic["src"]]
        return {
            'title': comic_title,
            'img': sources,
            'day': posted.day,
            'month': posted.month,
            'year': posted.year
        }



        }


class MarketoonistComics(GenericNavigableComic):
    """Retriever for the Marketoonist comics."""
    name = 'marketoonist'
    long_name = 'Marketoonist'
    url = 'https://marketoonist.com/cartoons'
    get_first_comic_link = simulate_first_link
    get_navi_link = get_link_rel_next
    first_url = 'https://marketoonist.com/2002/10/the-8-types-of-brand-managers-2.html'

    @classmethod
    def get_comic_info(cls, soup, link):
        """Build the info dictionary for a single comic page.

        The image URLs, the publication date and the title are all read
        from ``<meta>`` tags found in ``soup``; ``link`` is not used.
        """
        image_tags = soup.find_all('meta', property='og:image')
        published_tag = soup.find('meta', property='article:published_time')
        # Only the first 10 characters (the "YYYY-MM-DD" part) are parsed.
        iso_day = published_tag['content'][:10]
        published = string_to_date(iso_day, "%Y-%m-%d")
        comic_title = soup.find('meta', property='og:title')['content']
        image_urls = [tag['content'] for tag in image_tags]
        return {
            'img': image_urls,
            'day': published.day,
            'month': published.month,
            'year': published.year,
            'title': comic_title,
        }



		@@ 2282-2306 (lines=25) @@
2279		}
2280
2281
2282		class LinsEditions(GenericNavigableComic):
2283		"""Class to retrieve L.I.N.S. Editions comics."""
2284		# Also on http://linscomics.tumblr.com
2285		# Now on https://warandpeas.com
2286		name = 'lins'
2287		long_name = 'L.I.N.S. Editions'
2288		url = 'https://linsedition.com'
2289		_categories = ('LINS', )
2290		get_navi_link = get_link_rel_next
2291		get_first_comic_link = simulate_first_link
2292		first_url = 'https://linsedition.com/2011/09/07/l-i-n-s/'
2293
2294		@classmethod
2295		def get_comic_info(cls, soup, link):
2296		"""Get information about a particular comics."""
2297		title = soup.find('meta', property='og:title')['content']
2298		imgs = soup.find_all('meta', property='og:image')
2299		date_str = soup.find('meta', property='article:published_time')['content'][:10]
2300		day = string_to_date(date_str, "%Y-%m-%d")
2301		return {
2302		'title': title,
2303		'img': [i['content'] for i in imgs],
2304		'month': day.month,
2305		'year': day.year,
2306		'day': day.day,
2307		}
2308
2309
		@@ 349-371 (lines=23) @@
346		return []
347
348
349		class ExtraFabulousComics(GenericNavigableComic):
350		"""Class to retrieve Extra Fabulous Comics."""
351		name = 'efc'
352		long_name = 'Extra Fabulous Comics'
353		url = 'http://extrafabulouscomics.com'
354		get_first_comic_link = get_a_navi_navifirst
355		get_navi_link = get_link_rel_next
356
357		@classmethod
358		def get_comic_info(cls, soup, link):
359		"""Get information about a particular comics."""
360		img_src_re = re.compile('^%s/wp-content/uploads/' % cls.url)
361		imgs = soup.find_all('img', src=img_src_re)
362		title = soup.find('meta', property='og:title')['content']
363		date_str = soup.find('meta', property='article:published_time')['content'][:10]
364		day = string_to_date(date_str, "%Y-%m-%d")
365		return {
366		'title': title,
367		'img': [i['src'] for i in imgs],
368		'month': day.month,
369		'year': day.year,
370		'day': day.day,
371		'prefix': title + '-'
372		}
373
374
		@@ 375-396 (lines=22) @@
372		}
373
374
375		class GenericLeMondeBlog(GenericNavigableComic):
376		"""Generic class to retrieve comics from Le Monde blogs."""
377		_categories = ('LEMONDE', 'FRANCAIS')
378		get_navi_link = get_link_rel_next
379		get_first_comic_link = simulate_first_link
380		first_url = NotImplemented
381
382		@classmethod
383		def get_comic_info(cls, soup, link):
384		"""Get information about a particular comics."""
385		url2 = soup.find('link', rel='shortlink')['href']
386		title = soup.find('meta', property='og:title')['content']
387		date_str = soup.find("span", class_="entry-date").string
388		day = string_to_date(date_str, "%d %B %Y", "fr_FR.utf8")
389		imgs = soup.find_all('meta', property='og:image')
390		return {
391		'title': title,
392		'url2': url2,
393		'img': [convert_iri_to_plain_ascii_uri(i['content']) for i in imgs],
394		'month': day.month,
395		'year': day.year,
396		'day': day.day,
397		}
398
399
		@@ 1809-1834 (lines=26) @@
1806		}
1807
1808
1809		class SafelyEndangered(GenericNavigableComic):
1810		"""Class to retrieve Safely Endangered comics."""
1811		# Also on http://tumblr.safelyendangered.com
1812		name = 'endangered'
1813		long_name = 'Safely Endangered'
1814		url = 'http://www.safelyendangered.com'
1815		get_navi_link = get_link_rel_next
1816		get_first_comic_link = simulate_first_link
1817		first_url = 'http://www.safelyendangered.com/comic/ignored/'
1818
1819		@classmethod
1820		def get_comic_info(cls, soup, link):
1821		"""Get information about a particular comics."""
1822		title = soup.find('h2', class_='post-title').string
1823		date_str = soup.find('span', class_='post-date').string
1824		day = string_to_date(date_str, '%B %d, %Y')
1825		imgs = soup.find('div', id='comic').find_all('img')
1826		alt = imgs[0]['alt']
1827		assert all(i['alt'] == i['title'] for i in imgs)
1828		return {
1829		'day': day.day,
1830		'month': day.month,
1831		'year': day.year,
1832		'img': [i['src'] for i in imgs],
1833		'title': title,
1834		'alt': alt,
1835		}
1836
1837
		@@ 919-944 (lines=26) @@
916		}
917
918
919		class MyExtraLife(GenericNavigableComic):
920		"""Class to retrieve My Extra Life comics."""
921		name = 'extralife'
922		long_name = 'My Extra Life'
923		url = 'http://www.myextralife.com'
924		get_navi_link = get_link_rel_next
925
926		@classmethod
927		def get_first_comic_link(cls):
928		"""Get link to first comics."""
929		return get_soup_at_url(cls.url).find('a', class_='comic_nav_link first_comic_link')
930
931		@classmethod
932		def get_comic_info(cls, soup, link):
933		"""Get information about a particular comics."""
934		title = soup.find("h1", class_="comic_title").string
935		date_str = soup.find("span", class_="comic_date").string
936		day = string_to_date(date_str, "%B %d, %Y")
937		imgs = soup.find_all("img", class_="comic")
938		assert all(i['alt'] == i['title'] == title for i in imgs)
939		return {
940		'title': title,
941		'img': [i['src'] for i in imgs if i["src"]],
942		'day': day.day,
943		'month': day.month,
944		'year': day.year
945		}
946
947
		@@ 3191-3212 (lines=22) @@
3188		}
3189
3190
3191		class MarketoonistComics(GenericNavigableComic):
3192		"""Class to retrieve Marketoonist Comics."""
3193		name = 'marketoonist'
3194		long_name = 'Marketoonist'
3195		url = 'https://marketoonist.com/cartoons'
3196		get_first_comic_link = simulate_first_link
3197		get_navi_link = get_link_rel_next
3198		first_url = 'https://marketoonist.com/2002/10/the-8-types-of-brand-managers-2.html'
3199
3200		@classmethod
3201		def get_comic_info(cls, soup, link):
3202		"""Get information about a particular comics."""
3203		imgs = soup.find_all('meta', property='og:image')
3204		date_str = soup.find('meta', property='article:published_time')['content'][:10]
3205		day = string_to_date(date_str, "%Y-%m-%d")
3206		title = soup.find('meta', property='og:title')['content']
3207		return {
3208		'img': [i['content'] for i in imgs],
3209		'day': day.day,
3210		'month': day.month,
3211		'year': day.year,
3212		'title': title,
3213		}
3214
3215

SylvainDe / ComicBookMaker

Code Duplication Length = 22-26 lines in 6 locations

comics.py 6 locations