Fix more inefficient PT operations (#37060)

* Fix inefficient operations
* Remove cpu() call
* Reorder detach()
* Reorder detach()
* tolist without detach
* item without detach
* Update src/transformers/models/rag/modeling_rag.py
  Co-authored-by: Joao Gante <joaofranciscocardosogante@gmail.com>
* Update tests/models/encodec/test_modeling_encodec.py
  Co-authored-by: Joao Gante <joaofranciscocardosogante@gmail.com>
* Use detach().cpu().numpy
* Revert some numpy operations
* More fixes

---------

Co-authored-by: Joao Gante <joaofranciscocardosogante@gmail.com>
2025-03-31 23:31:24 +08:00
parent a1e389e637
commit 786d9c5ed9
54 changed files with 106 additions and 104 deletions
--- a/tests/generation/test_beam_search.py
+++ b/tests/generation/test_beam_search.py
@@ -522,9 +522,9 @@ class ConstrainedBeamSearchTester:
        # set to same device. we don't care what device.

        if not isinstance(tensor_1, list):
-            tensor_1 = tensor_1.cpu().tolist()
+            tensor_1 = tensor_1.tolist()
        if not isinstance(tensor_2, list):
-            tensor_2 = tensor_2.cpu().tolist()
+            tensor_2 = tensor_2.tolist()

        in_order = len(tensor_1) <= len(tensor_2)
        longer = tensor_2 if in_order else tensor_1
--- a/tests/generation/test_utils.py
+++ b/tests/generation/test_utils.py
@@ -2595,9 +2595,9 @@ class GenerationTesterMixin:
        # set to same device. we don't care what device.

        if not isinstance(tensor_1, list):
-            tensor_1 = tensor_1.cpu().tolist()
+            tensor_1 = tensor_1.tolist()
        if not isinstance(tensor_2, list):
-            tensor_2 = tensor_2.cpu().tolist()
+            tensor_2 = tensor_2.tolist()

        in_order = len(tensor_1) <= len(tensor_2)
        longer = tensor_2 if in_order else tensor_1