tenstorrent · arakhmati · Jun 4, 2024 · May 30, 2024 · Jun 3, 2024
@@ -2,6 +2,8 @@
 
 # SPDX-License-Identifier: Apache-2.0
 
+import pytest
+
 import torch
 import ttnn
 import tt_lib
@@ -19,6 +21,7 @@
 from tests.ttnn.utils_for_testing import assert_with_pcc
 
 
+@pytest.mark.skip(reason="https://github.com/tenstorrent/tt-metal/issues/9076")
 @skip_for_wormhole_b0()
 def test_mistral_attention_inference(model_location_generator, device, reset_seeds):
     model_path = model_location_generator("mistral-7B-v0.1", model_subdir="Mistral")

diff --git a/tt_eager/tt_dnn/op_library/bmm/bmm_op.cpp b/tt_eager/tt_dnn/op_library/bmm/bmm_op.cpp
@@ -1041,7 +1041,7 @@ void Matmul::validate(
                 // subblock constraint
                 TT_FATAL(program_config.out_subblock_w == per_core_N || program_config.out_subblock_h == 1);
                 // tensor in1
-                TT_FATAL(input_tensor_b.memory_config().memory_layout == TensorMemoryLayout::INTERLEAVED);
+                TT_FATAL(input_tensor_b.memory_config().memory_layout == TensorMemoryLayout::WIDTH_SHARDED);
             } else if constexpr (std::is_same_v<ProgramConfigType, MatmulMultiCoreReuseMultiCastProgramConfig>) {
                 if (input_tensor_a.memory_config().is_sharded()) {
                     auto tensor_a_memory_layout = input_tensor_a.memory_config().memory_layout;

diff --git a/tt_eager/tt_dnn/op_library/operation.hpp b/tt_eager/tt_dnn/op_library/operation.hpp
@@ -528,9 +528,6 @@ struct DeviceOperation final {
                const Tensors& input_tensors,
                const OptionalConstTensors& optional_input_tensors,
                const OptionalTensors& optional_output_tensors) -> void {
-                if (ttnn::CONFIG.enable_fast_runtime_mode) {
-                    return;
-                }
                 const auto& operation = *reinterpret_cast<const std::decay_t<T>*>(&storage);
                 if constexpr (
                     (detail::implements_validate<T>() or

@@ -57,7 +57,7 @@ def validate(self, name):
             if self.enable_fast_runtime_mode:
                 if self.enable_logging:
                     logger.warning(
-                        "Running in fast runtime mode without logging. Please disable fast runtime mode if you want to enable logging."
+                        "Logging cannot be enabled in fast runtime mode. Please disable fast runtime mode if you want to enable logging."
                     )
 
         if name in {