Code Duplication    Length = 18-21 lines in 5 locations

tests/test_stemmer.py 5 locations

@@ 542-562 (lines=21) @@
539
        self.assertEqual(sb_german('über'), 'uber')
540
        self.assertEqual(sb_german('ueber'), 'ueb')
541
542
    def test_sb_dutch_snowball(self):
        """Test abydos.stemmer.sb_dutch (Snowball testset).

        Expected stems are read from the Snowball Dutch corpus file; the
        test cases are from
        http://snowball.tartarus.org/algorithms/dutch/diffs.txt
        """
        # the empty string must stem to the empty string
        self.assertEqual(sb_dutch(''), '')

        # compare every word/stem pair listed in the Snowball Dutch corpus
        corpus_path = TESTDIR+'/corpora/snowball_dutch.csv'
        with codecs.open(corpus_path, encoding='utf-8') as corpus:
            # the first line of the file is discarded (presumably a header)
            next(corpus)
            for row in corpus:
                if row[0] == '#':
                    # rows beginning with '#' are not test cases
                    continue
                fields = row.strip().split(',')
                word, expected = fields[0], fields[1]
                # the expected stem is lowercased before comparison
                self.assertEqual(sb_dutch(word), expected.lower())

        # missed branch test case, checked in addition to the corpus
        self.assertEqual(sb_dutch('zondulielijk'), 'zondulie')
563
564
    def test_sb_norwegian_snowball(self):
565
        """Test abydos.stemmer.sb_norwegian (Snowball testset).
@@ 469-489 (lines=21) @@
466
    abydos.stemmer.sb_danish
467
    """
468
469
    def test_sb_german_snowball(self):
        """Test abydos.stemmer.sb_german (Snowball testset).

        Expected stems are read from the Snowball German corpus file; the
        test cases are from
        http://snowball.tartarus.org/algorithms/german/diffs.txt
        """
        # the empty string must stem to the empty string
        self.assertEqual(sb_german(''), '')

        # compare every word/stem pair listed in the Snowball German corpus
        corpus_path = TESTDIR+'/corpora/snowball_german.csv'
        with codecs.open(corpus_path, encoding='utf-8') as corpus:
            # the first line of the file is discarded (presumably a header)
            next(corpus)
            for row in corpus:
                if row[0] == '#':
                    # rows beginning with '#' are not test cases
                    continue
                fields = row.strip().split(',')
                word, expected = fields[0], fields[1]
                # the expected stem is lowercased before comparison
                self.assertEqual(sb_german(word), expected.lower())

        # missed branch test case, checked in addition to the corpus
        self.assertEqual(sb_german('ikeit'), 'ikeit')
490
491
    def test_sb_german_snowball_alt(self):
492
        """Test abydos.stemmer.sb_german (alternate vowels)."""
@@ 602-619 (lines=18) @@
599
                    word, stem = line[0], line[1]
600
                    self.assertEqual(sb_swedish(word), stem.lower())
601
602
    def test_sb_danish_snowball(self):
        """Test abydos.stemmer.sb_danish (Snowball testset).

        Expected stems are read from the Snowball Danish corpus file; the
        test cases are from
        http://snowball.tartarus.org/algorithms/danish/diffs.txt
        """
        # the empty string must stem to the empty string
        self.assertEqual(sb_danish(''), '')

        # compare every word/stem pair listed in the Snowball Danish corpus
        corpus_path = TESTDIR+'/corpora/snowball_danish.csv'
        with codecs.open(corpus_path, encoding='utf-8') as corpus:
            # the first line of the file is discarded (presumably a header)
            next(corpus)
            for row in corpus:
                if row[0] == '#':
                    # rows beginning with '#' are not test cases
                    continue
                fields = row.strip().split(',')
                word, expected = fields[0], fields[1]
                # the expected stem is lowercased before comparison
                self.assertEqual(sb_danish(word), expected.lower())
620
621
622
class CLEFTestCases(unittest.TestCase):
@@ 583-600 (lines=18) @@
580
                    word, stem = line[0], line[1]
581
                    self.assertEqual(sb_norwegian(word), stem.lower())
582
583
    def test_sb_swedish_snowball(self):
        """Test abydos.stemmer.sb_swedish (Snowball testset).

        Expected stems are read from the Snowball Swedish corpus file; the
        test cases are from
        http://snowball.tartarus.org/algorithms/swedish/diffs.txt
        """
        # the empty string must stem to the empty string
        self.assertEqual(sb_swedish(''), '')

        # compare every word/stem pair listed in the Snowball Swedish corpus
        corpus_path = TESTDIR+'/corpora/snowball_swedish.csv'
        with codecs.open(corpus_path, encoding='utf-8') as corpus:
            # the first line of the file is discarded (presumably a header)
            next(corpus)
            for row in corpus:
                if row[0] == '#':
                    # rows beginning with '#' are not test cases
                    continue
                fields = row.strip().split(',')
                word, expected = fields[0], fields[1]
                # the expected stem is lowercased before comparison
                self.assertEqual(sb_swedish(word), expected.lower())
601
602
    def test_sb_danish_snowball(self):
603
        """Test abydos.stemmer.sb_danish (Snowball testset).
@@ 564-581 (lines=18) @@
561
        # missed branch test cases
562
        self.assertEqual(sb_dutch('zondulielijk'), 'zondulie')
563
564
    def test_sb_norwegian_snowball(self):
        """Test abydos.stemmer.sb_norwegian (Snowball testset).

        Expected stems are read from the Snowball Norwegian corpus file; the
        test cases are from
        http://snowball.tartarus.org/algorithms/norwegian/diffs.txt
        """
        # the empty string must stem to the empty string
        self.assertEqual(sb_norwegian(''), '')

        # compare every word/stem pair listed in the Snowball Norwegian corpus
        corpus_path = TESTDIR+'/corpora/snowball_norwegian.csv'
        with codecs.open(corpus_path, encoding='utf-8') as corpus:
            # the first line of the file is discarded (presumably a header)
            next(corpus)
            for row in corpus:
                if row[0] == '#':
                    # rows beginning with '#' are not test cases
                    continue
                fields = row.strip().split(',')
                word, expected = fields[0], fields[1]
                # the expected stem is lowercased before comparison
                self.assertEqual(sb_norwegian(word), expected.lower())
582
583
    def test_sb_swedish_snowball(self):
584
        """Test abydos.stemmer.sb_swedish (Snowball testset).