forked from OpenNMT/OpenNMT-py
Random sampling scores (OpenNMT#1285)
* In random sampling, make scores be score of EOS.
Showing 4 changed files with 365 additions and 13 deletions.
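The change is easiest to see in miniature. The sketch below mirrors the assertion pattern of test_returns_correct_scores_deterministic in the new test file: once a sequence emits EOS, its reported score is the temperature-scaled log-probability of EOS at that step, not a running cumulative score. The constructor argument names in the comments are inferred from how these tests call RandomSampling; they are not confirmed by this diff.

import torch
from onmt.translate.random_sampling import RandomSampling

temp = 3.
eos_idx = 2
dist = torch.log_softmax(torch.tensor([6., 1.]), dim=0)
# Inferred arg order (an assumption, from usage in the tests below):
# pad, bos, eos, batch_size, device, min_length, block_ngram_repeat,
# exclusion_tokens, return_attention, max_length, sampling_temp,
# keep_topk, memory_lengths.
samp = RandomSampling(
    0, 1, 2, 1, torch.device("cpu"), 0,
    False, set(), False, 30, temp, 1,
    torch.randint(0, 30, (1,)))
word_probs = torch.full((1, 100), -float('inf'))
word_probs[0, eos_idx] = dist[0]  # EOS is the only finite-score option
samp.advance(word_probs, torch.randn(1, 1, 53))
assert samp.is_finished[0].eq(1).all()
samp.update_finished()
# After this commit, the finished sequence's score is the EOS
# log-probability divided by the sampling temperature:
assert samp.scores[0] == [dist[0] / temp]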
@@ -0,0 +1,313 @@
import unittest

import torch

from onmt.translate.random_sampling import RandomSampling


class TestRandomSampling(unittest.TestCase):
    BATCH_SZ = 3
    INP_SEQ_LEN = 53
    DEAD_SCORE = -1e20

    BLOCKED_SCORE = -10e20

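    # NOTE: RandomSampling is constructed positionally throughout these
    # tests. From usage, the arguments appear to be: pad, bos, eos,
    # batch_size, device, min_length, block_ngram_repeat, exclusion_tokens,
    # return_attention, max_length, sampling_temp, keep_topk,
    # memory_lengths. (Inferred from this diff, not a documented signature.)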
    def test_advance_with_repeats_gets_blocked(self):
        n_words = 100
        repeat_idx = 47
        ngram_repeat = 3
        for batch_sz in [1, 3]:
            samp = RandomSampling(
                0, 1, 2, batch_sz, torch.device("cpu"), 0, ngram_repeat,
                set(), False, 30, 1., 5, torch.randint(0, 30, (batch_sz,)))
            for i in range(ngram_repeat + 4):
                # predict repeat_idx over and over again
                word_probs = torch.full(
                    (batch_sz, n_words), -float('inf'))
                word_probs[:, repeat_idx] = 0
                attns = torch.randn(1, batch_sz, 53)
                samp.advance(word_probs, attns)
                if i <= ngram_repeat:
                    expected_scores = torch.zeros((batch_sz, 1))
                    self.assertTrue(samp.topk_scores.equal(expected_scores))
                else:
                    self.assertTrue(
                        samp.topk_scores.equal(
                            torch.tensor(self.BLOCKED_SCORE)
                            .repeat(batch_sz, 1)))

    def test_advance_with_some_repeats_gets_blocked(self):
        # batch 0 and 7 will repeat, the rest will advance
        n_words = 100
        repeat_idx = 47
        other_repeat_idx = 12
        ngram_repeat = 3
        for batch_sz in [1, 3, 13]:
            samp = RandomSampling(
                0, 1, 2, batch_sz, torch.device("cpu"), 0, ngram_repeat,
                set(), False, 30, 1., 5, torch.randint(0, 30, (batch_sz,)))
            for i in range(ngram_repeat + 4):
                word_probs = torch.full(
                    (batch_sz, n_words), -float('inf'))
                # predict the same thing in batch 0 and 7 every step
                word_probs[0, repeat_idx] = 0
                if batch_sz > 7:
                    word_probs[7, other_repeat_idx] = 0
                # push around what the other batches predict
                word_probs[1:7, repeat_idx + i] = 0
                if batch_sz > 7:
                    word_probs[8:, repeat_idx + i] = 0
                attns = torch.randn(1, batch_sz, 53)
                samp.advance(word_probs, attns)
                if i <= ngram_repeat:
                    self.assertFalse(
                        samp.topk_scores.eq(
                            self.BLOCKED_SCORE).any())
                else:
                    # now batch 0 and 7 die
                    self.assertTrue(samp.topk_scores[0].eq(self.BLOCKED_SCORE))
                    if batch_sz > 7:
                        self.assertTrue(samp.topk_scores[7].eq(
                            self.BLOCKED_SCORE))
                    self.assertFalse(
                        samp.topk_scores[1:7].eq(
                            self.BLOCKED_SCORE).any())
                    if batch_sz > 7:
                        self.assertFalse(
                            samp.topk_scores[8:].eq(
                                self.BLOCKED_SCORE).any())

    def test_repeating_excluded_index_does_not_die(self):
        # batch 0 will repeat the excluded idx, batch 1 will repeat
        n_words = 100
        repeat_idx = 47  # will be repeated and should be blocked
        repeat_idx_ignored = 7  # will be repeated and should not be blocked
        ngram_repeat = 3
        for batch_sz in [1, 3, 17]:
            samp = RandomSampling(
                0, 1, 2, batch_sz, torch.device("cpu"), 0, ngram_repeat,
                {repeat_idx_ignored}, False, 30, 1., 5,
                torch.randint(0, 30, (batch_sz,)))
            for i in range(ngram_repeat + 4):
                word_probs = torch.full(
                    (batch_sz, n_words), -float('inf'))
                word_probs[0, repeat_idx_ignored] = 0
                if batch_sz > 1:
                    word_probs[1, repeat_idx] = 0
                    word_probs[2:, repeat_idx + i] = 0
                attns = torch.randn(1, batch_sz, 53)
                samp.advance(word_probs, attns)
                if i <= ngram_repeat:
                    self.assertFalse(samp.topk_scores.eq(
                        self.BLOCKED_SCORE).any())
                else:
                    # now batch 1 dies
                    self.assertFalse(samp.topk_scores[0].eq(
                        self.BLOCKED_SCORE).any())
                    if batch_sz > 1:
                        self.assertTrue(samp.topk_scores[1].eq(
                            self.BLOCKED_SCORE).all())
                        self.assertFalse(samp.topk_scores[2:].eq(
                            self.BLOCKED_SCORE).any())

    def test_doesnt_predict_eos_if_shorter_than_min_len(self):
        # batch 0 will always predict EOS. The other batches will predict
        # non-eos scores.
        for batch_sz in [1, 3]:
            n_words = 100
            _non_eos_idxs = [47]
            valid_score_dist = torch.log_softmax(torch.tensor(
                [6., 5.]), dim=0)
            min_length = 5
            eos_idx = 2
            lengths = torch.randint(0, 30, (batch_sz,))
            samp = RandomSampling(
                0, 1, 2, batch_sz, torch.device("cpu"), min_length,
                False, set(), False, 30, 1., 1, lengths)
            all_attns = []
            for i in range(min_length + 4):
                word_probs = torch.full(
                    (batch_sz, n_words), -float('inf'))
                # "best" prediction is eos - that should be blocked
                word_probs[0, eos_idx] = valid_score_dist[0]
                # include at least one prediction OTHER than EOS
                # that is greater than -1e20
                word_probs[0, _non_eos_idxs[0]] = valid_score_dist[1]
                word_probs[1:, _non_eos_idxs[0] + i] = 0

                attns = torch.randn(1, batch_sz, 53)
                all_attns.append(attns)
                samp.advance(word_probs, attns)
                if i < min_length:
                    self.assertTrue(
                        samp.topk_scores[0].allclose(valid_score_dist[1]))
                    self.assertTrue(
                        samp.topk_scores[1:].eq(0).all())
                elif i == min_length:
                    # now batch 0 has ended and no others have
                    self.assertTrue(samp.is_finished[0, :].eq(1).all())
                    self.assertTrue(samp.is_finished[1:, :].eq(0).all())
                else:  # i > min_length
                    break

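    # The two tests below exercise the behavior this commit introduces:
    # a finished sequence's reported score is the temperature-scaled
    # log-probability of EOS on the step it finished, collected into
    # samp.scores by update_finished().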
    def test_returns_correct_scores_deterministic(self):
        for batch_sz in [1, 13]:
            for temp in [1., 3.]:
                n_words = 100
                _non_eos_idxs = [47, 51, 13, 88, 99]
                valid_score_dist_1 = torch.log_softmax(torch.tensor(
                    [6., 5., 4., 3., 2., 1.]), dim=0)
                valid_score_dist_2 = torch.log_softmax(torch.tensor(
                    [6., 1.]), dim=0)
                eos_idx = 2
                lengths = torch.randint(0, 30, (batch_sz,))
                samp = RandomSampling(
                    0, 1, 2, batch_sz, torch.device("cpu"), 0,
                    False, set(), False, 30, temp, 1, lengths)

                # initial step
                i = 0
                word_probs = torch.full(
                    (batch_sz, n_words), -float('inf'))
                # batch 0 dies on step 0
                word_probs[0, eos_idx] = valid_score_dist_1[0]
                # include at least one prediction OTHER than EOS
                # that is greater than -1e20
                word_probs[0, _non_eos_idxs] = valid_score_dist_1[1:]
                word_probs[1:, _non_eos_idxs[0] + i] = 0

                attns = torch.randn(1, batch_sz, 53)
                samp.advance(word_probs, attns)
                self.assertTrue(samp.is_finished[0].eq(1).all())
                samp.update_finished()
                self.assertEqual(
                    samp.scores[0], [valid_score_dist_1[0] / temp])
                if batch_sz == 1:
                    self.assertTrue(samp.done)
                    continue
                else:
                    self.assertFalse(samp.done)

                # step 2
                i = 1
                word_probs = torch.full(
                    (batch_sz - 1, n_words), -float('inf'))
                # (old) batch 8 dies on step 1
                word_probs[7, eos_idx] = valid_score_dist_2[0]
                word_probs[0:7, _non_eos_idxs[:2]] = valid_score_dist_2
                word_probs[8:, _non_eos_idxs[:2]] = valid_score_dist_2

                attns = torch.randn(1, batch_sz - 1, 53)
                samp.advance(word_probs, attns)

                self.assertTrue(samp.is_finished[7].eq(1).all())
                samp.update_finished()
                self.assertEqual(
                    samp.scores[8], [valid_score_dist_2[0] / temp])

                # step 3
                i = 2
                word_probs = torch.full(
                    (batch_sz - 2, n_words), -float('inf'))
                # everything dies
                word_probs[:, eos_idx] = 0

                attns = torch.randn(1, batch_sz - 2, 53)
                samp.advance(word_probs, attns)

                self.assertTrue(samp.is_finished.eq(1).all())
                samp.update_finished()
                for b in range(batch_sz):
                    if b != 0 and b != 8:
                        self.assertEqual(samp.scores[b], [0])
                self.assertTrue(samp.done)

    def test_returns_correct_scores_non_deterministic(self):
        for batch_sz in [1, 13]:
            for temp in [1., 3.]:
                n_words = 100
                _non_eos_idxs = [47, 51, 13, 88, 99]
                valid_score_dist_1 = torch.log_softmax(torch.tensor(
                    [6., 5., 4., 3., 2., 1.]), dim=0)
                valid_score_dist_2 = torch.log_softmax(torch.tensor(
                    [6., 1.]), dim=0)
                eos_idx = 2
                lengths = torch.randint(0, 30, (batch_sz,))
                samp = RandomSampling(
                    0, 1, 2, batch_sz, torch.device("cpu"), 0,
                    False, set(), False, 30, temp, 2, lengths)

                # initial step
                i = 0
                for _ in range(100):
                    word_probs = torch.full(
                        (batch_sz, n_words), -float('inf'))
                    # batch 0 dies on step 0
                    word_probs[0, eos_idx] = valid_score_dist_1[0]
                    # include at least one prediction OTHER than EOS
                    # that is greater than -1e20
                    word_probs[0, _non_eos_idxs] = valid_score_dist_1[1:]
                    word_probs[1:, _non_eos_idxs[0] + i] = 0

                    attns = torch.randn(1, batch_sz, 53)
                    samp.advance(word_probs, attns)
                    if samp.is_finished[0].eq(1).all():
                        break
                else:
                    self.fail("Batch 0 never ended (very unlikely but maybe "
                              "due to stochasticity). If so, please increase "
                              "the range of the for-loop.")
                samp.update_finished()
                self.assertEqual(
                    samp.scores[0], [valid_score_dist_1[0] / temp])
                if batch_sz == 1:
                    self.assertTrue(samp.done)
                    continue
                else:
                    self.assertFalse(samp.done)

                # step 2
                i = 1
                for _ in range(100):
                    word_probs = torch.full(
                        (batch_sz - 1, n_words), -float('inf'))
                    # (old) batch 8 dies on step 1
                    word_probs[7, eos_idx] = valid_score_dist_2[0]
                    word_probs[0:7, _non_eos_idxs[:2]] = valid_score_dist_2
                    word_probs[8:, _non_eos_idxs[:2]] = valid_score_dist_2

                    attns = torch.randn(1, batch_sz - 1, 53)
                    samp.advance(word_probs, attns)
                    if samp.is_finished[7].eq(1).all():
                        break
                else:
                    self.fail("Batch 8 never ended (very unlikely but maybe "
                              "due to stochasticity). If so, please increase "
                              "the range of the for-loop.")

                samp.update_finished()
                self.assertEqual(
                    samp.scores[8], [valid_score_dist_2[0] / temp])

                # step 3
                i = 2
                for _ in range(250):
                    word_probs = torch.full(
                        (samp.alive_seq.shape[0], n_words), -float('inf'))
                    # everything dies
                    word_probs[:, eos_idx] = 0

                    attns = torch.randn(1, samp.alive_seq.shape[0], 53)
                    samp.advance(word_probs, attns)
                    if samp.is_finished.any():
                        samp.update_finished()
                    if samp.is_finished.eq(1).all():
                        break
                else:
                    self.fail("All batches never ended (very unlikely but "
                              "maybe due to stochasticity). If so, please "
                              "increase the range of the for-loop.")

                for b in range(batch_sz):
                    if b != 0 and b != 8:
                        self.assertEqual(samp.scores[b], [0])
                self.assertTrue(samp.done)