Code Duplication - SylvainDe/ComicBookMaker - Measure and Improve Code Quality continuously with Scrutinizer

Code Duplication Length = 16-20 lines in 3 locations

comics.py 3 locations


    # Bind get_first_comic_link to simulate_first_link, which is defined outside this excerpt.
    get_first_comic_link = simulate_first_link
    # NOTE(review): presumably the URL that simulate_first_link relies on -- confirm against its definition.
    first_url = 'http://respawncomic.com/comic/c0001/'

    @classmethod
    def get_comic_info(cls, soup, link):
        """Collect title, author, publication date and image URLs of a comic.

        Everything is read from tags of the parsed page `soup`; `link` is
        not used. The result is a dict with the keys 'title', 'author',
        'day', 'month', 'year' and 'img', where 'img' lists the 'og:image'
        URLs of the page minus the ones in the exclusion set below.
        """
        comic_title = soup.find('meta', property='og:title')['content']
        author_tag = soup.find('meta', attrs={'name': 'shareaholic:article_author_name'})
        comic_author = author_tag['content']
        published_tag = soup.find('meta', attrs={'name': 'shareaholic:article_published_time'})
        # Only the first 10 characters are kept so the value fits "%Y-%m-%d".
        published = string_to_date(published_tag['content'][:10], "%Y-%m-%d")
        image_tags = soup.find_all('meta', property='og:image')
        # 'og:image' URLs that must not be reported as images of the comic.
        excluded_urls = {
            'http://respawncomic.com/wp-content/uploads/2016/03/site/HAROLD2.png',
            'http://respawncomic.com/wp-content/uploads/2016/03/site/DEVA.png'
        }
        info = {
            'title': comic_title,
            'author': comic_author,
            'day': published.day,
            'month': published.month,
            'year': published.year,
        }
        info['img'] = [
            tag['content']
            for tag in image_tags
            if tag['content'] not in excluded_urls
        ]
        return info



    # Both attributes are bound to helpers defined outside this excerpt.
    get_first_comic_link = get_a_comicnavbase_comicnavfirst
    get_navi_link = get_a_rel_next

    @classmethod
    def get_comic_info(cls, soup, link):
        """Collect images, title, author, description and date of a comic.

        Everything is read from tags of the parsed page `soup`; `link` is
        not used. The result is a dict with the keys 'img', 'title',
        'author', 'desc', 'day', 'month' and 'year'. 'desc' is an empty
        string when the page has no 'og:description' meta tag.
        """
        comic_title = soup.find('meta', property='og:title')['content']
        description_tag = soup.find('meta', property='og:description')
        if description_tag:
            description = description_tag['content']
        else:
            description = ""
        author_tag = soup.find('meta', attrs={'name': 'shareaholic:article_author_name'})
        comic_author = author_tag['content']
        published_tag = soup.find('meta', attrs={'name': 'shareaholic:article_published_time'})
        # Only the first 10 characters are kept so the value fits "%Y-%m-%d".
        published = string_to_date(published_tag['content'][:10], "%Y-%m-%d")
        image_tags = soup.find_all('meta', property='og:image')
        info = {'img': [tag['content'] for tag in image_tags]}
        info['title'] = comic_title
        info['author'] = comic_author
        info['desc'] = description
        info['day'] = published.day
        info['month'] = published.month
        info['year'] = published.year
        return info



        li = last_soup.find('li', class_='prev' if next_ else 'next')
        return li.find('a') if li else None

    @classmethod
    def get_comic_info(cls, soup, link):
        """Collect short URL, title, images and publication date of a comic.

        Everything is read from tags of the parsed page `soup`; `link` is
        not used. The result is a dict with the keys 'short_url', 'title',
        'img', 'day', 'month' and 'year'.
        """
        shortlink_tag = soup.find('link', rel='shortlink')
        shortlink = shortlink_tag['href']
        title_tag = soup.find('meta', attrs={'name': 'twitter:title'})
        comic_title = title_tag['content']
        image_tags = soup.find_all('meta', property='og:image')
        date_tag = soup.find('span', property='dc:date')
        # Only the first 10 characters are kept so the value fits "%Y-%m-%d".
        published = string_to_date(date_tag['content'][:10], "%Y-%m-%d")
        info = {'short_url': shortlink, 'title': comic_title}
        info['img'] = [tag['content'] for tag in image_tags]
        info['day'] = published.day
        info['month'] = published.month
        info['year'] = published.year
        return info



		@@ 1756-1775 (lines=20) @@
1753		get_first_comic_link = simulate_first_link
1754		first_url = 'http://respawncomic.com/comic/c0001/'
1755
1756		@classmethod
1757		def get_comic_info(cls, soup, link):
1758		"""Get information about a particular comics."""
1759		title = soup.find('meta', property='og:title')['content']
1760		author = soup.find('meta', attrs={'name': 'shareaholic:article_author_name'})['content']
1761		date_str = soup.find('meta', attrs={'name': 'shareaholic:article_published_time'})['content']
1762		date_str = date_str[:10]
1763		day = string_to_date(date_str, "%Y-%m-%d")
1764		imgs = soup.find_all('meta', property='og:image')
1765		skip_imgs = {
1766		'http://respawncomic.com/wp-content/uploads/2016/03/site/HAROLD2.png',
1767		'http://respawncomic.com/wp-content/uploads/2016/03/site/DEVA.png'
1768		}
1769		return {
1770		'title': title,
1771		'author': author,
1772		'day': day.day,
1773		'month': day.month,
1774		'year': day.year,
1775		'img': [i['content'] for i in imgs if i['content'] not in skip_imgs],
1776		}
1777
1778
		@@ 1002-1020 (lines=19) @@
999		get_first_comic_link = get_a_comicnavbase_comicnavfirst
1000		get_navi_link = get_a_rel_next
1001
1002		@classmethod
1003		def get_comic_info(cls, soup, link):
1004		"""Get information about a particular comics."""
1005		title = soup.find('meta', property='og:title')['content']
1006		metadesc = soup.find('meta', property='og:description')
1007		desc = metadesc['content'] if metadesc else ""
1008		author = soup.find('meta', attrs={'name': 'shareaholic:article_author_name'})['content']
1009		date_str = soup.find('meta', attrs={'name': 'shareaholic:article_published_time'})['content']
1010		date_str = date_str[:10]
1011		day = string_to_date(date_str, "%Y-%m-%d")
1012		imgs = soup.find_all('meta', property='og:image')
1013		return {
1014		'img': [i['content'] for i in imgs],
1015		'title': title,
1016		'author': author,
1017		'desc': desc,
1018		'day': day.day,
1019		'month': day.month,
1020		'year': day.year
1021		}
1022
1023
		@@ 501-516 (lines=16) @@
498		li = last_soup.find('li', class_='prev' if next_ else 'next')
499		return li.find('a') if li else None
500
501		@classmethod
502		def get_comic_info(cls, soup, link):
503		"""Get information about a particular comics."""
504		short_url = soup.find('link', rel='shortlink')['href']
505		title = soup.find('meta', attrs={'name': 'twitter:title'})['content']
506		imgs = soup.find_all('meta', property='og:image')
507		date_str = soup.find('span', property='dc:date')['content']
508		date_str = date_str[:10]
509		day = string_to_date(date_str, "%Y-%m-%d")
510		return {
511		'short_url': short_url,
512		'title': title,
513		'img': [i['content'] for i in imgs],
514		'day': day.day,
515		'month': day.month,
516		'year': day.year,
517		}
518
519

SylvainDe / ComicBookMaker

Code Duplication Length = 16-20 lines in 3 locations

comics.py 3 locations