Skip to content

Commit

Permalink
#8865: Additionally optimize binary override_runtime_arguments
Browse files Browse the repository at this point in the history
  • Loading branch information
nemanjagrujic committed Jul 25, 2024
1 parent 279ac04 commit d51728f
Showing 1 changed file with 1 addition and 3 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -185,7 +185,7 @@ BinaryDeviceOperation::BroadcastHeightAndWidthMultiCore::create(
num_tensor_tiles_per_core = num_tiles_per_core_group_2;
} else {
tt_metal::SetRuntimeArgs(program, binary_reader_kernel_id, core, std::vector<uint32_t>(7, 0));
tt_metal::SetRuntimeArgs(program, bcast_kernel_id, core, std::vector<uint32_t>(3, 0));
tt_metal::SetRuntimeArgs(program, bcast_kernel_id, core, {1, 1, 0});
tt_metal::SetRuntimeArgs(program, unary_writer_kernel_id, core, std::vector<uint32_t>(3, 0));
continue;
}
Expand Down Expand Up @@ -349,8 +349,6 @@ void BinaryDeviceOperation::BroadcastHeightAndWidthMultiCore::override_runtime_a
binary_reader_args[5] = num_tiles_read % HtWt;
binary_reader_args[6] = bnc1 ? 0 : num_tiles_read / HtWt;

bcast_kernel_args[0] = 1; // B
bcast_kernel_args[1] = 1; // Ht
bcast_kernel_args[2] = num_tensor_tiles_per_core; // Wt

unary_writer_args[0] = dst_buffer->address();
Expand Down

0 comments on commit d51728f

Please sign in to comment.