diff --git a/tt_eager/tt_dnn/op_library/nlp_tms/nlp_tms.hpp b/tt_eager/tt_dnn/op_library/nlp_tms/nlp_tms.hpp index b8771e17f4a..9484ecce53e 100644 --- a/tt_eager/tt_dnn/op_library/nlp_tms/nlp_tms.hpp +++ b/tt_eager/tt_dnn/op_library/nlp_tms/nlp_tms.hpp @@ -151,7 +151,7 @@ inline std::vector nlp_create_qkv_heads_decode( Tensor(operation::get_workers_for_op_output({input_tensor})), Tensor(operation::get_workers_for_op_output({input_tensor}))}; operation::launch_op( - [num_heads, num_kv_heads, mem_config] (std::vector input_tensors, const std::vector>& optional_input_tensors) mutable -> std::vector { + [num_heads, num_kv_heads, mem_config] (std::vector input_tensors, const std::vector>& optional_input_tensors, const std::vector>& optional_output_tensors) mutable -> std::vector { const uint32_t num_kv_heads_val = num_kv_heads.value_or(num_heads); // Infer head_dim