Skip to content

Commit

Permalink
undo breaking change in segmented radix sort config (#548)
Browse files: browse the repository at this point in the history
  • Loading branch information
nolmoonen committed Apr 9, 2024
1 parent 609ae19 commit 3178ba4
Show file tree
Hide file tree
Showing 8 changed files with 827 additions and 1,056 deletions.
1 change: 1 addition & 0 deletions benchmark/benchmark_device_segmented_radix_sort_keys.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -285,6 +285,7 @@ int main(int argc, char* argv[])
// Add benchmarks
std::vector<benchmark::internal::Benchmark*> benchmarks;
#ifdef BENCHMARK_CONFIG_TUNING
(void)min_size;
const int parallel_instance = parser.get<int>("parallel_instance");
const int parallel_instances = parser.get<int>("parallel_instances");
config_autotune_register::register_benchmark_subset(benchmarks,
Expand Down
25 changes: 12 additions & 13 deletions benchmark/benchmark_device_segmented_radix_sort_keys.parallel.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -291,16 +291,15 @@ struct device_segmented_radix_sort_benchmark_generator
rocprim::segmented_radix_sort_config<
LongBits,
ShortBits,
BlockSize,
ItemsPerThread,
EnableUnpartitionedWarpSort,
rocprim::kernel_config<BlockSize, ItemsPerThread>,
rocprim::WarpSortConfig<LogicalWarpSizeSmall / 2,
ItemsPerThread / 2,
BlockSize,
PartitioningThreshold,
LogicalWarpSizeSmall,
ItemsPerThread,
BlockSize>>>>());
BlockSize>,
EnableUnpartitionedWarpSort>>>());
}
};

Expand All @@ -321,15 +320,15 @@ struct device_segmented_radix_sort_benchmark_generator
}
else
{
storage.emplace_back(std::make_unique<device_segmented_radix_sort_benchmark<
Key,
rocprim::segmented_radix_sort_config<
LongBits,
ShortBits,
BlockSize,
ItemsPerThread,
EnableUnpartitionedWarpSort,
rocprim::DisabledWarpSortConfig>>>());
storage.emplace_back(
std::make_unique<device_segmented_radix_sort_benchmark<
Key,
rocprim::segmented_radix_sort_config<
LongBits,
ShortBits,
rocprim::kernel_config<BlockSize, ItemsPerThread>,
rocprim::DisabledWarpSortConfig,
EnableUnpartitionedWarpSort>>>());
}
}
};
Expand Down
1 change: 1 addition & 0 deletions benchmark/benchmark_device_segmented_radix_sort_pairs.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -309,6 +309,7 @@ int main(int argc, char* argv[])
// Add benchmarks
std::vector<benchmark::internal::Benchmark*> benchmarks;
#ifdef BENCHMARK_CONFIG_TUNING
(void)min_size;
const int parallel_instance = parser.get<int>("parallel_instance");
const int parallel_instances = parser.get<int>("parallel_instances");
config_autotune_register::register_benchmark_subset(benchmarks,
Expand Down
27 changes: 13 additions & 14 deletions benchmark/benchmark_device_segmented_radix_sort_pairs.parallel.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -330,16 +330,15 @@ struct device_segmented_radix_sort_benchmark_generator
rocprim::segmented_radix_sort_config<
LongBits,
ShortBits,
BlockSize,
ItemsPerThread,
EnableUnpartitionedWarpSort,
rocprim::kernel_config<BlockSize, ItemsPerThread>,
rocprim::WarpSortConfig<LogicalWarpSizeSmall / 2,
ItemsPerThread / 2,
BlockSize,
PartitioningThreshold,
LogicalWarpSizeSmall,
ItemsPerThread,
BlockSize>>>>());
BlockSize>,
EnableUnpartitionedWarpSort>>>());
}
};

Expand All @@ -360,16 +359,16 @@ struct device_segmented_radix_sort_benchmark_generator
}
else
{
storage.emplace_back(std::make_unique<device_segmented_radix_sort_benchmark<
Key,
Value,
rocprim::segmented_radix_sort_config<
LongBits,
ShortBits,
BlockSize,
ItemsPerThread,
EnableUnpartitionedWarpSort,
rocprim::DisabledWarpSortConfig>>>());
storage.emplace_back(
std::make_unique<device_segmented_radix_sort_benchmark<
Key,
Value,
rocprim::segmented_radix_sort_config<
LongBits,
ShortBits,
rocprim::kernel_config<BlockSize, ItemsPerThread>,
rocprim::DisabledWarpSortConfig,
EnableUnpartitionedWarpSort>>>());
}
}
};
Expand Down
Loading

0 comments on commit 3178ba4

Please sign in to comment.