From bb26534f55bbeff31427f31db39dfabd701c4600 Mon Sep 17 00:00:00 2001 From: Ubuntu Date: Fri, 6 Dec 2024 14:24:11 +0000 Subject: [PATCH] fix output_end in untilize_with_unpadding --- .../unit_tests/operations/test_to_layout_5D.py | 4 ++++ .../untilize_with_unpadding.cpp | 14 ++++++++++---- 2 files changed, 14 insertions(+), 4 deletions(-) diff --git a/tests/ttnn/unit_tests/operations/test_to_layout_5D.py b/tests/ttnn/unit_tests/operations/test_to_layout_5D.py index 6348810532e..7d19b72e857 100644 --- a/tests/ttnn/unit_tests/operations/test_to_layout_5D.py +++ b/tests/ttnn/unit_tests/operations/test_to_layout_5D.py @@ -1,3 +1,7 @@ +# SPDX-FileCopyrightText: © 2024 Tenstorrent Inc. + +# SPDX-License-Identifier: Apache-2.0 + import torch import ttnn import pytest diff --git a/ttnn/cpp/ttnn/operations/data_movement/untilize_with_unpadding/untilize_with_unpadding.cpp b/ttnn/cpp/ttnn/operations/data_movement/untilize_with_unpadding/untilize_with_unpadding.cpp index d8b355da498..0215c6869a5 100644 --- a/ttnn/cpp/ttnn/operations/data_movement/untilize_with_unpadding/untilize_with_unpadding.cpp +++ b/ttnn/cpp/ttnn/operations/data_movement/untilize_with_unpadding/untilize_with_unpadding.cpp @@ -65,15 +65,21 @@ ttnn::Tensor ExecuteUntilizeWithUnpadding::invoke( // MT: Currently only uint32 is moved to DST directly, fp32 is converted to fp16b bool fp32_dest_acc_en = input_tensor.get_dtype() == DataType::UINT32; - std::vector output_end; - for (auto index = 0; index < input_tensor.get_shape().rank(); ++index) { - output_end.push_back(input_tensor.get_shape()[index] - 1); + std::vector output_end_vector; + tt::tt_metal::LegacyShape output_end = tt::tt_metal::LegacyShape{}; + if (input_tensor.get_shape().rank() > 4) { + for (auto index = 0; index < input_tensor.get_shape().rank(); ++index) { + output_end_vector.push_back(input_tensor.get_shape()[index] - 1); + } + output_end = squeeze_output_shape(LegacyShape(output_end_vector)); + } else { + output_end = output_tensor_end; } auto base_untilize = [=](const ttnn::Tensor& input_tensor) { return operation::run( UntilizeWithUnpadding{ - squeeze_output_shape(LegacyShape(output_end)), + output_end, memory_config.value_or(input_tensor.memory_config()), use_multicore, use_pack_untilize,