Ratan1 committed
Commit 9618094 · 1 Parent(s): aad62f1
Files changed (2):
  1. inference/beam_search.py +17 -7
  2. inference/translate.py +6 -6
inference/beam_search.py CHANGED

@@ -15,11 +15,11 @@ class BeamSearch:
     """Beam search decoder for transformer models"""
 
     def __init__(self, beam_size: int = 4, length_penalty: float = 0.6,
-                 coverage_penalty: float = 0.0, no_repeat_ngram_size: int = 0):
+                 coverage_penalty: float = 0.0, no_repeat_ngram_size: int = 3):
         self.beam_size = beam_size
         self.length_penalty = length_penalty
         self.coverage_penalty = coverage_penalty
-        self.no_repeat_ngram_size = no_repeat_ngram_size
+        self.no_repeat_ngram_size = no_repeat_ngram_size  # Changed default from 0 to 3
 
     def search(self, model, src: torch.Tensor, max_length: int = 100,
                bos_id: int = 2, eos_id: int = 3, pad_id: int = 0) -> List[List[int]]:
@@ -51,7 +51,11 @@ class BeamSearch:
         all_candidates = []
 
         for batch_idx in range(batch_size):
-            # Skip if all beams are finished
+            # NEW: Stop if the BEST beam (first one after sorting) is finished
+            if beams[batch_idx] and beams[batch_idx][0].finished:
+                continue
+
+            # Also skip if all beams are finished
             if all(hyp.finished for hyp in beams[batch_idx]):
                 continue
 
@@ -98,19 +102,21 @@ class BeamSearch:
                 for token_rank, (token_log_prob, token_id) in enumerate(
                         zip(beam_log_probs, beam_indices_local)):
 
+                    new_tokens = hypothesis.tokens + [token_id.item()]
+
                     # Apply no-repeat penalty
-                    if self._has_repeated_ngram(hypothesis.tokens + [token_id.item()]):
+                    if self._has_repeated_ngram(new_tokens):
                         continue
 
                     new_log_prob = hypothesis.log_prob + token_log_prob.item()
 
                     # Apply length penalty
-                    score = self._apply_length_penalty(new_log_prob, len(hypothesis.tokens) + 1)
+                    score = self._apply_length_penalty(new_log_prob, len(new_tokens))
 
                     candidates.append((
                         score,
                         BeamHypothesis(
-                            tokens=hypothesis.tokens + [token_id.item()],
+                            tokens=new_tokens,
                             log_prob=new_log_prob,
                             finished=(token_id.item() == eos_id)
                         )
@@ -123,6 +129,10 @@ class BeamSearch:
             for score, hypothesis in candidates[:self.beam_size]:
                 new_beams.append(hypothesis)
 
+            # If we have no candidates, keep the old beams
+            if not new_beams:
+                new_beams = beams[batch_idx]
+
             beams[batch_idx] = new_beams
 
         # Extract best sequences
@@ -202,4 +212,4 @@ class GreedyDecoder:
                 tokens = tokens[:eos_idx + 1]
             results.append(tokens)
 
-        return results
+        return results
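The changed hunks call two helpers, _has_repeated_ngram and _apply_length_penalty, whose bodies lie outside this diff. Below is a minimal sketch of how such helpers are commonly written, assuming standard n-gram blocking and the GNMT-style length normalization suggested by the length_penalty=0.6 default; the standalone function signatures are illustrative, not the file's actual methods.

from typing import List

def _has_repeated_ngram(tokens: List[int], no_repeat_ngram_size: int = 3) -> bool:
    """Return True if the trailing n-gram of tokens already appeared earlier (assumed blocking rule)."""
    n = no_repeat_ngram_size
    if n <= 0 or len(tokens) < n:
        return False  # blocking disabled, or sequence still shorter than one n-gram
    last_ngram = tuple(tokens[-n:])
    # Scan every earlier n-gram; a match means this candidate would repeat itself
    return any(tuple(tokens[i:i + n]) == last_ngram for i in range(len(tokens) - n))

def _apply_length_penalty(log_prob: float, length: int, alpha: float = 0.6) -> float:
    """GNMT-style normalization (assumed): score = log_prob / ((5 + length) / 6) ** alpha."""
    return log_prob / (((5.0 + length) / 6.0) ** alpha)

With the new no_repeat_ngram_size=3 default, any candidate token that would complete a trigram already present in the hypothesis is skipped before scoring, which is the usual remedy for the repetition loops this commit targets.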
inference/translate.py CHANGED

@@ -37,16 +37,16 @@ class Translator:
         self.eos_id = self.sp.eos_id()
         self.pad_id = self.sp.pad_id()
 
-        # Decoder
+        # Decoder - with no_repeat_ngram_size=3 to prevent repetition
         self.use_beam_search = use_beam_search
         if use_beam_search:
-            self.decoder = BeamSearch(beam_size=beam_size)
+            self.decoder = BeamSearch(beam_size=beam_size, no_repeat_ngram_size=3)
 
         logger.info(f"Translator initialized on {self.device}")
         logger.info(f"Vocab size: {self.sp.vocab_size()}")
         logger.info(f"Using {'beam search' if use_beam_search else 'greedy'} decoding")
 
-    def translate(self, text: str, max_length: int = 100) -> str:
+    def translate(self, text: str, max_length: int = 50) -> str:  # Changed default from 100 to 50
         """
         Translate a single text
 
@@ -93,7 +93,7 @@ class Translator:
 
         return translated_text
 
-    def translate_batch(self, texts: List[str], max_length: int = 100) -> List[str]:
+    def translate_batch(self, texts: List[str], max_length: int = 50) -> List[str]:  # Changed from 100 to 50
         """
         Translate multiple texts in batch
 
@@ -149,7 +149,7 @@ class Translator:
 
         return results
 
-    def translate_with_attention(self, text: str, max_length: int = 100) -> Tuple[str, torch.Tensor]:
+    def translate_with_attention(self, text: str, max_length: int = 50) -> Tuple[str, torch.Tensor]:
         """
         Translate and return attention weights
 
@@ -253,4 +253,4 @@ if __name__ == "__main__":
     checkpoint_path = sys.argv[1]
     tokenizer_path = sys.argv[2]
 
-    interactive_translation(checkpoint_path, tokenizer_path)
+    interactive_translation(checkpoint_path, tokenizer_path)
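For context, a hedged usage sketch of how the new defaults play out end to end. The Translator constructor signature is an assumption (a checkpoint path and a SentencePiece model path, in the order interactive_translation receives them, plus the use_beam_search and beam_size options that appear in this diff); the file paths are placeholders.

from inference.translate import Translator

# Hypothetical paths; substitute real checkpoint and tokenizer files
translator = Translator(
    "checkpoints/best_model.pt",
    "tokenizer/spm.model",
    use_beam_search=True,  # decoder becomes BeamSearch(beam_size=4, no_repeat_ngram_size=3)
    beam_size=4,
)

# max_length now defaults to 50 rather than 100
print(translator.translate("How are you today?"))

# The batch and attention variants share the same shorter default
print(translator.translate_batch(["Good morning.", "See you tomorrow."]))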