[API Compatibility] add torch.nn.utils.rnn.pad_sequence and torch.nn.utils.rnn.unpad_sequence -part (#826)

Manfredss · web-flow · commit 1628c71637f9 · 2026-02-15T17:42:39.000+08:00
Add paconvert API mappings and tests for torch.nn.utils.rnn.pad_sequence and torch.nn.utils.rnn.unpad_sequence
diff --git a/paconvert/api_mapping.json b/paconvert/api_mapping.json
@@ -10284,6 +10284,12 @@
   "torch.nn.utils.vector_to_parameters": {
     "Matcher": "ChangePrefixMatcher"
   },
+  "torch.nn.utils.rnn.pad_sequence": {
+    "Matcher": "ChangePrefixMatcher"
+  },
+  "torch.nn.utils.rnn.unpad_sequence": {
+    "Matcher": "ChangePrefixMatcher"
+  },
   "torch.nn.utils.weight_norm": {
     "Matcher": "GenericMatcher",
     "paddle_api": "paddle.nn.utils.weight_norm",
diff --git a/tests/test_nn_utils_rnn_pad_sequence.py b/tests/test_nn_utils_rnn_pad_sequence.py
@@ -0,0 +1,188 @@
+# Copyright (c) 2023 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import textwrap
+
+from apibase import APIBase
+
+obj = APIBase("torch.nn.utils.rnn.pad_sequence")
+
+
+def test_case_1():
+    """Pad three 1-D float tensors (lengths 3, 2, 1) with default arguments."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0])
+        b = torch.tensor([4.0, 5.0])
+        c = torch.tensor([6.0])
+        result = pad_sequence([a, b, c])
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_2():
+    """Pad three 1-D float tensors with batch_first=True given by keyword."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0])
+        b = torch.tensor([4.0, 5.0])
+        c = torch.tensor([6.0])
+        result = pad_sequence([a, b, c], batch_first=True)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_3():
+    """Pad two 1-D float tensors with padding_value=-1.0 given by keyword."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0])
+        b = torch.tensor([4.0, 5.0])
+        result = pad_sequence([a, b], padding_value=-1.0)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_4():
+    """Pass the sequence list, True and -1.0 as three positional arguments."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0])
+        b = torch.tensor([4.0, 5.0])
+        result = pad_sequence([a, b], True, -1.0)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_5():
+    """Pass sequences, batch_first and padding_value all by keyword."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0])
+        b = torch.tensor([4.0, 5.0])
+        result = pad_sequence(sequences=[a, b], batch_first=True, padding_value=0.0)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_6():
+    """Pass keywords in the order padding_value, batch_first, sequences."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0])
+        b = torch.tensor([4.0, 5.0])
+        result = pad_sequence(padding_value=2.0, batch_first=False, sequences=[a, b])
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_7():
+    """Pad 2-D inputs with 3 rows and 1 row (2 columns each), batch first."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence
+        a = torch.tensor([[1.0, 2.0], [3.0, 4.0], [5.0, 6.0]])
+        b = torch.tensor([[7.0, 8.0]])
+        result = pad_sequence([a, b], batch_first=True, padding_value=0.0)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_8():
+    """Call pad_sequence via its fully qualified torch.nn.utils.rnn path."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        a = torch.tensor([1.0, 2.0, 3.0])
+        b = torch.tensor([4.0, 5.0])
+        result = torch.nn.utils.rnn.pad_sequence([a, b], batch_first=True)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_9():
+    """Pad two sequences that already have equal length (3), batch first."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0])
+        b = torch.tensor([4.0, 5.0, 6.0])
+        result = pad_sequence([a, b], batch_first=True)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_10():
+    """Pad integer tensors with batch_first=False and integer padding 0."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence
+        a = torch.tensor([1, 2, 3, 4])
+        b = torch.tensor([5, 6])
+        result = pad_sequence([a, b], batch_first=False, padding_value=0)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_11():
+    """Pad lengths 4, 2, 3 with batch_first=False and padding_value=-100.0."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0, 4.0])
+        b = torch.tensor([5.0, 6.0])
+        c = torch.tensor([7.0, 8.0, 9.0])
+        result = pad_sequence([a, b, c], batch_first=False, padding_value=-100.0)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_12():
+    """Pad a list holding a single sequence, using default arguments."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0])
+        result = pad_sequence([a])
+        """
+    )
+    obj.run(torch_snippet, ["result"])
diff --git a/tests/test_nn_utils_rnn_unpad_sequence.py b/tests/test_nn_utils_rnn_unpad_sequence.py
@@ -0,0 +1,196 @@
+# Copyright (c) 2023 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import textwrap
+
+from apibase import APIBase
+
+obj = APIBase("torch.nn.utils.rnn.unpad_sequence")
+
+
+def test_case_1():
+    """Unpad a batch-first padded tensor of three sequences, lengths [3, 2, 1]."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence, unpad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0])
+        b = torch.tensor([4.0, 5.0])
+        c = torch.tensor([6.0])
+        padded = pad_sequence([a, b, c], batch_first=True)
+        lengths = torch.tensor([3, 2, 1])
+        result = unpad_sequence(padded, lengths, batch_first=True)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_2():
+    """Pad and unpad two sequences with batch_first=False given explicitly."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence, unpad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0])
+        b = torch.tensor([4.0, 5.0])
+        padded = pad_sequence([a, b], batch_first=False)
+        lengths = torch.tensor([3, 2])
+        result = unpad_sequence(padded, lengths, batch_first=False)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_3():
+    """Pass the padded tensor, lengths and True as positional arguments."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence, unpad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0])
+        b = torch.tensor([4.0, 5.0])
+        padded = pad_sequence([a, b], True)
+        lengths = torch.tensor([3, 2])
+        result = unpad_sequence(padded, lengths, True)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_4():
+    """Pass padded_sequences, lengths and batch_first all by keyword."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence, unpad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0])
+        b = torch.tensor([4.0, 5.0])
+        padded = pad_sequence([a, b], batch_first=True)
+        lengths = torch.tensor([3, 2])
+        result = unpad_sequence(padded_sequences=padded, lengths=lengths, batch_first=True)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_5():
+    """Pass keywords in the order batch_first, lengths, padded_sequences."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence, unpad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0])
+        b = torch.tensor([4.0, 5.0])
+        padded = pad_sequence([a, b], batch_first=True)
+        lengths = torch.tensor([3, 2])
+        result = unpad_sequence(batch_first=True, lengths=lengths, padded_sequences=padded)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_6():
+    """Omit batch_first in both the pad_sequence and unpad_sequence calls."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence, unpad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0])
+        b = torch.tensor([4.0, 5.0])
+        padded = pad_sequence([a, b])
+        lengths = torch.tensor([3, 2])
+        result = unpad_sequence(padded, lengths)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_7():
+    """Unpad batch-first padded 2-D inputs (3 rows and 1 row), lengths [3, 1]."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence, unpad_sequence
+        a = torch.tensor([[1.0, 2.0], [3.0, 4.0], [5.0, 6.0]])
+        b = torch.tensor([[7.0, 8.0]])
+        padded = pad_sequence([a, b], batch_first=True)
+        lengths = torch.tensor([3, 1])
+        result = unpad_sequence(padded, lengths, batch_first=True)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_8():
+    """Call unpad_sequence via its fully qualified torch.nn.utils.rnn path."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0])
+        b = torch.tensor([4.0, 5.0])
+        padded = pad_sequence([a, b], batch_first=True)
+        lengths = torch.tensor([3, 2])
+        result = torch.nn.utils.rnn.unpad_sequence(padded, lengths, batch_first=True)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_9():
+    """Unpad a batch-first batch that holds one sequence of length 3."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence, unpad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0])
+        padded = pad_sequence([a], batch_first=True)
+        lengths = torch.tensor([3])
+        result = unpad_sequence(padded, lengths, batch_first=True)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_10():
+    """Unpad integer tensors padded batch first, with lengths [4, 2]."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence, unpad_sequence
+        a = torch.tensor([1, 2, 3, 4])
+        b = torch.tensor([5, 6])
+        padded = pad_sequence([a, b], batch_first=True)
+        lengths = torch.tensor([4, 2])
+        result = unpad_sequence(padded, lengths, batch_first=True)
+        """
+    )
+    obj.run(torch_snippet, ["result"])
+
+
+def test_case_11():
+    """Unpad three sequences whose lengths [4, 2, 3] are not sorted."""
+    torch_snippet = textwrap.dedent(
+        """
+        import torch
+        from torch.nn.utils.rnn import pad_sequence, unpad_sequence
+        a = torch.tensor([1.0, 2.0, 3.0, 4.0])
+        b = torch.tensor([5.0, 6.0])
+        c = torch.tensor([7.0, 8.0, 9.0])
+        padded = pad_sequence([a, b, c], batch_first=True)
+        lengths = torch.tensor([4, 2, 3])
+        result = unpad_sequence(padded, lengths, batch_first=True)
+        """
+    )
+    obj.run(torch_snippet, ["result"])