@@ -1342,6 +1342,7 @@ def __init__(self, tokenizer: Tokenizer, sample_begin: int):

    def apply(self, logits: paddle.Tensor, tokens: paddle.Tensor):
        if tokens.shape[1] == self.sample_begin:
+            logits.contiguous()
            logits[:, self.tokenizer.encode(" ").input_ids + [self.tokenizer.eot]] = (
                -np.inf
            )
@@ -1352,6 +1353,7 @@ def __init__(self, suppress_tokens: Sequence[int]):
        self.suppress_tokens = list(suppress_tokens)

    def apply(self, logits: paddle.Tensor, tokens: paddle.Tensor):
+        logits.contiguous()
        logits[:, self.suppress_tokens] = -np.inf

@@ -1369,6 +1371,7 @@ def __init__(
    def apply(self, logits: paddle.Tensor, tokens: paddle.Tensor):
        # suppress <|notimestamps|> which is handled by without_timestamps
        if self.tokenizer.no_timestamps is not None:
+            logits.contiguous()
            logits[:, self.tokenizer.no_timestamps] = -np.inf

        # timestamps have to appear in pairs, except directly before EOT; mask logits accordingly
@@ -1382,6 +1385,7 @@ def apply(self, logits: paddle.Tensor, tokens: paddle.Tensor):
            )

            if last_was_timestamp:
+                logits.contiguous()
                if penultimate_was_timestamp:  # has to be non-timestamp
                    logits[k, self.tokenizer.timestamp_begin :] = -np.inf
                else:  # cannot be normal text tokens
@@ -1395,6 +1399,7 @@ def apply(self, logits: paddle.Tensor, tokens: paddle.Tensor):
                last_allowed = (
                    self.tokenizer.timestamp_begin + self.max_initial_timestamp_index
                )
+                logits.contiguous()
                logits[:, last_allowed + 1 :] = -np.inf

        # if sum of probability over timestamps is above any other token, sample timestamp
@@ -1413,6 +1418,7 @@ def apply(self, logits: paddle.Tensor, tokens: paddle.Tensor):
                    logprobs[k, : self.tokenizer.timestamp_begin]
                )
                if timestamp_logprob > max_text_token_logprob:
+                    logits.contiguous()
                    logits[k, : self.tokenizer.timestamp_begin] = -np.inf
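For context (not part of the commit): every hunk above inserts a logits.contiguous() call immediately before an in-place slice assignment that masks token scores with -np.inf. Below is a minimal sketch of that suppression pattern, assuming a PaddlePaddle version that provides paddle.Tensor.contiguous(); the tensor shape and the masked index range are illustrative only, and the sketch assigns the result of contiguous() back, since the method returns a tensor.

import numpy as np
import paddle

# (batch, vocab) decoder scores; shape is illustrative only
logits = paddle.randn([2, 10])

# ensure a contiguous memory layout before the in-place slice write
logits = logits.contiguous()

# suppress tokens 5.. by masking their scores with -inf
logits[:, 5:] = -np.inf

# after softmax, the masked tokens receive no probability mass
probs = paddle.nn.functional.softmax(logits, axis=-1)
print(float(probs[:, 5:].sum()))  # ~0.0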