Code Duplication - SylvainDe/ComicBookMaker - Measure and Improve Code Quality continuously with Scrutinizer

Code Duplication Length = 22-27 lines in 4 locations

comics.py 4 locations




class ButterSafe(GenericListableComic):
    """Retriever for the Butter Safe webcomic.

    Comics are enumerated from the site's archive page; the date of each
    comic is read from the three numeric components of its URL.
    """
    name = 'butter'
    long_name = 'ButterSafe'
    url = 'http://buttersafe.com'
    get_url_from_archive_element = get_href
    # The three captured groups are consumed as (year, month, day).
    comic_link_re = re.compile('^%s/([0-9]*)/([0-9]*)/([0-9]*)/.*' % url)

    @classmethod
    def get_archive_elements(cls):
        """Return the archive page's comic links, in reversed page order."""
        archive_soup = get_soup_at_url(urljoin_wrapper(cls.url, 'archive/'))
        comic_links = archive_soup.find_all('a', href=cls.comic_link_re)
        return reversed(comic_links)

    @classmethod
    def get_comic_info(cls, soup, link):
        """Build the info dictionary for a single comic.

        `soup` is the parsed comic page and `link` the archive element that
        pointed to it. The title comes from the link text, the date from the
        comic URL and the image from the first <img> inside div#comic.
        """
        comic_url = cls.get_url_from_archive_element(link)
        title = link.string
        date_match = cls.comic_link_re.match(comic_url)
        year, month, day = map(int, date_match.groups())
        comic_div = soup.find('div', id='comic')
        img = comic_div.find('img')
        # Sanity check: the image alt text is expected to repeat the title.
        assert img['alt'] == title
        info = {
            'title': title,
            'day': day,
            'month': month,
            'year': year,
            'img': [img['src']],
        }
        return info


class CalvinAndHobbes(GenericComic):



class AbstruseGoose(GenericListableComic):
    """Retriever for the Abstruse Goose webcomic.

    Comics are enumerated from the site's archive page; each comic is
    identified by the number that ends its URL.
    """
    name = 'abstruse'
    long_name = 'Abstruse Goose'
    url = 'http://abstrusegoose.com'
    get_url_from_archive_element = get_href
    # The captured group of a comic page URL is used as the comic number.
    comic_url_re = re.compile('^%s/([0-9]*)$' % url)
    # Pattern used to pick the comic's <img> by its src attribute.
    comic_img_re = re.compile('^%s/strips/.*' % url)

    @classmethod
    def get_archive_elements(cls):
        """Return every archive-page link whose href is a comic URL."""
        archive_soup = get_soup_at_url(urljoin_wrapper(cls.url, 'archive'))
        return archive_soup.find_all('a', href=cls.comic_url_re)

    @classmethod
    def get_comic_info(cls, soup, archive_elt):
        """Build the info dictionary for a single comic.

        `soup` is the parsed comic page and `archive_elt` the archive link
        that pointed to it. The number comes from the comic URL, the title
        from the link text and the image from the first <img> whose src
        matches `comic_img_re`.
        """
        page_url = cls.get_url_from_archive_element(archive_elt)
        number_match = cls.comic_url_re.match(page_url)
        num = int(number_match.group(1))
        title = archive_elt.string
        strip_img = soup.find('img', src=cls.comic_img_re)
        return {
            'num': num,
            'title': title,
            'img': [strip_img['src']]
        }


class PhDComics(GenericNavigableComic):

    @classmethod
    def get_first_comic_link(cls):
        """Return the anchor titled "First" found on the page at cls.url."""
        landing_soup = get_soup_at_url(cls.url)
        return landing_soup.find('a', title="First")

    @classmethod
    def get_navi_link(cls, last_soup, next_):
        """Return the navigation anchor found in `last_soup`.

        Looks for the anchor titled 'Next' when `next_` is truthy and the
        one titled 'Previous' otherwise.
        """
        if next_:
            wanted_title = 'Next'
        else:
            wanted_title = 'Previous'
        return last_soup.find('a', title=wanted_title)

    @classmethod
    def get_comic_info(cls, soup, link):
        """Build the info dictionary for the comic page parsed in `soup`.

        The title is the text of the first <h1>, the date is parsed from
        span.date using the "%B %d, %Y" format, and the images are the
        <img> tags in div.comic selected with empty alt and title.
        The `link` argument is not used here.
        """
        heading = soup.find('h1')
        title = heading.string
        date_span = soup.find('span', class_='date')
        published = string_to_date(date_span.string.strip(), "%B %d, %Y")
        comic_div = soup.find('div', class_='comic')
        img_tags = comic_div.find_all('img', alt='', title='')
        img_urls = [tag['src'] for tag in img_tags]
        return {
            'title': title,
            'img': img_urls,
            'month': published.month,
            'year': published.year,
            'day': published.day,
        }


class ChuckleADuck(GenericNavigableComic):
    """Class to retrieve Chuckle-A-Duck comics."""
    name = 'chuckleaduck'
    long_name = 'Chuckle-A-duck'

            'year': day.year
        }


class PerryBibleFellowship(GenericListableComic):  # Is now navigable too
    """Retriever for the Perry Bible Fellowship webcomic.

    Comics are enumerated from the thumbnail links on the site's home page.
    """
    name = 'pbf'
    long_name = 'Perry Bible Fellowship'
    url = 'http://pbfcomics.com'
    get_url_from_archive_element = join_cls_url_to_href

    @classmethod
    def get_archive_elements(cls):
        """Return the links inside div#all_thumbnails, in reversed page order."""
        home_soup = get_soup_at_url(cls.url)
        thumbnail_links = home_soup.find('div', id='all_thumbnails').find_all('a')
        return reversed(thumbnail_links)

    @classmethod
    def get_comic_info(cls, soup, link):
        """Build the info dictionary for a single comic.

        Name and image URL are both read from the page's Open Graph <meta>
        tags (og:title and og:image). The `link` argument is not used here.
        """
        comic_name = soup.find('meta', property='og:title')['content']
        image_metas = soup.find_all('meta', property='og:image')
        # Exactly one og:image tag is expected per comic page.
        assert len(image_metas) == 1
        img_urls = [meta['content'] for meta in image_metas]
        return {
            'name': comic_name,
            'img': img_urls,
        }


		@@ 1387-1413 (lines=27) @@
1384
1385
1386		class ButterSafe(GenericListableComic):
1387		"""Class to retrieve Butter Safe comics."""
1388		name = 'butter'
1389		long_name = 'ButterSafe'
1390		url = 'http://buttersafe.com'
1391		get_url_from_archive_element = get_href
1392		comic_link_re = re.compile('^%s/([0-9]*)/([0-9]*)/([0-9]*)/.*' % url)
1393
1394		@classmethod
1395		def get_archive_elements(cls):
1396		archive_url = urljoin_wrapper(cls.url, 'archive/')
1397		return reversed(get_soup_at_url(archive_url).find_all('a', href=cls.comic_link_re))
1398
1399		@classmethod
1400		def get_comic_info(cls, soup, link):
1401		"""Get information about a particular comics."""
1402		url = cls.get_url_from_archive_element(link)
1403		title = link.string
1404		year, month, day = [int(s) for s in cls.comic_link_re.match(url).groups()]
1405		img = soup.find('div', id='comic').find('img')
1406		assert img['alt'] == title
1407		return {
1408		'title': title,
1409		'day': day,
1410		'month': month,
1411		'year': year,
1412		'img': [img['src']],
1413		}
1414
1415
1416		class CalvinAndHobbes(GenericComic):
		@@ 1453-1474 (lines=22) @@
1450
1451
1452		class AbstruseGoose(GenericListableComic):
1453		"""Class to retrieve AbstruseGoose Comics."""
1454		name = 'abstruse'
1455		long_name = 'Abstruse Goose'
1456		url = 'http://abstrusegoose.com'
1457		get_url_from_archive_element = get_href
1458		comic_url_re = re.compile('^%s/([0-9]*)$' % url)
1459		comic_img_re = re.compile('^%s/strips/.*' % url)
1460
1461		@classmethod
1462		def get_archive_elements(cls):
1463		archive_url = urljoin_wrapper(cls.url, 'archive')
1464		return get_soup_at_url(archive_url).find_all('a', href=cls.comic_url_re)
1465
1466		@classmethod
1467		def get_comic_info(cls, soup, archive_elt):
1468		comic_url = cls.get_url_from_archive_element(archive_elt)
1469		num = int(cls.comic_url_re.match(comic_url).groups()[0])
1470		return {
1471		'num': num,
1472		'title': archive_elt.string,
1473		'img': [soup.find('img', src=cls.comic_img_re)['src']]
1474		}
1475
1476
1477		class PhDComics(GenericNavigableComic):
		@@ 2063-2086 (lines=24) @@
2060		@classmethod
2061		def get_first_comic_link(cls):
2062		"""Get link to first comics."""
2063		return get_soup_at_url(cls.url).find('a', title="First")
2064
2065		@classmethod
2066		def get_navi_link(cls, last_soup, next_):
2067		"""Get link to next or previous comic."""
2068		return last_soup.find('a', title='Next' if next_ else 'Previous')
2069
2070		@classmethod
2071		def get_comic_info(cls, soup, link):
2072		"""Get information about a particular comics."""
2073		title = soup.find('h1').string
2074		date_str = soup.find('span', class_='date').string.strip()
2075		day = string_to_date(date_str, "%B %d, %Y")
2076		imgs = soup.find('div', class_='comic').find_all('img', alt='', title='')
2077		return {
2078		'title': title,
2079		'img': [i['src'] for i in imgs],
2080		'month': day.month,
2081		'year': day.year,
2082		'day': day.day,
2083		}
2084
2085
2086		class ChuckleADuck(GenericNavigableComic):
2087		"""Class to retrieve Chuckle-A-Duck comics."""
2088		name = 'chuckleaduck'
2089		long_name = 'Chuckle-A-duck'
		@@ 1048-1069 (lines=22) @@
1045		'year': day.year
1046		}
1047
1048
1049		class PerryBibleFellowship(GenericListableComic): # Is now navigable too
1050		"""Class to retrieve Perry Bible Fellowship comics."""
1051		name = 'pbf'
1052		long_name = 'Perry Bible Fellowship'
1053		url = 'http://pbfcomics.com'
1054		get_url_from_archive_element = join_cls_url_to_href
1055
1056		@classmethod
1057		def get_archive_elements(cls):
1058		soup = get_soup_at_url(cls.url)
1059		thumbnails = soup.find('div', id='all_thumbnails')
1060		return reversed(thumbnails.find_all('a'))
1061
1062		@classmethod
1063		def get_comic_info(cls, soup, link):
1064		"""Get information about a particular comics."""
1065		name = soup.find('meta', property='og:title')['content']
1066		imgs = soup.find_all('meta', property='og:image')
1067		assert len(imgs) == 1
1068		return {
1069		'name': name,
1070		'img': [i['content'] for i in imgs],
1071		}
1072

SylvainDe / ComicBookMaker

Code Duplication Length = 22-27 lines in 4 locations

comics.py 4 locations