Skip to content

Commit

Permalink
test diff threshold
Browse files Browse the repository at this point in the history
  • Loading branch information
nardoTT committed Feb 19, 2025
1 parent 8c9f534 commit 23b5886
Show file tree
Hide file tree
Showing 4 changed files with 9 additions and 8 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -90,7 +90,7 @@ operation::ProgramWithCallbacks TilizeWithValPadding::create_program(
if (input_tensor_a.memory_config().is_sharded()) {
return detail::tilize_with_val_padding_multi_core_sharded(input_tensor_a, output_tensor, this->pad_value);
}
- if (!this->enough_space_height) {
+ if (!this->enough_space_height || this->enough_space_width) {
return detail::tilize_with_val_padding_multi_core_block_interleaved(
input_tensor_a, output_tensor, this->pad_value);
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -687,9 +687,9 @@ operation::ProgramWithCallbacks tilize_with_val_padding_multi_core_interleaved(
if (num_tiles_per_row > num_tiles_per_col) {
return tilize_with_val_padding_multi_core_col_interleaved(a, output, pad_value);
}
- if (num_tiles_per_col > threshold_row_block || num_tiles_per_row > num_tiles_per_col) {
- return tilize_with_val_padding_multi_core_block_interleaved(a, output, pad_value);
- }
+ // if (num_tiles_per_col > threshold_row_block || num_tiles_per_row > num_tiles_per_col) {
+ // return tilize_with_val_padding_multi_core_block_interleaved(a, output, pad_value);
+ // }
}

auto [ncores, all_cores, core_range, core_range_cliff, nblocks_per_core, nblocks_per_core_cliff] =
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -115,7 +115,7 @@ operation::ProgramWithCallbacks UntilizeWithUnpadding::create_program(
return detail::untilize_with_unpadding_single_core(
input_tensor_a, output_tensor, this->use_pack_untilize, this->fp32_dest_acc_en);
}
- if (!this->enough_space_height) {
+ if (!this->enough_space_height || !this->enough_space_width) {
return detail::untilize_with_unpadding_multi_core_block_interleaved(
input_tensor_a, output_tensor, this->use_pack_untilize, this->fp32_dest_acc_en);
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -675,9 +675,10 @@ operation::ProgramWithCallbacks untilize_with_unpadding_multi_core_interleaved(
if (num_tiles_per_row > num_tiles_per_col) {
return untilize_with_unpadding_multi_core_col_interleaved(a, output, use_pack_untilize, fp32_dest_acc_en);
}
- if (num_tiles_per_col > threshold_row_block || num_tiles_per_row > num_tiles_per_col) {
- return untilize_with_unpadding_multi_core_block_interleaved(a, output, use_pack_untilize, fp32_dest_acc_en);
- }
+ // if (num_tiles_per_col > threshold_row_block || num_tiles_per_row > num_tiles_per_col) {
+ // return untilize_with_unpadding_multi_core_block_interleaved(a, output, use_pack_untilize,
+ // fp32_dest_acc_en);
+ // }
}

auto [ncores, all_cores, core_range, core_range_cliff, nblocks_per_core, nblocks_per_core_cliff] =
Expand Down

0 comments on commit 23b5886

Please sign in to comment.