Skip to content

Commit

Permalink
feat(ttm): add task level parallelism
Browse files Browse the repository at this point in the history
  • Loading branch information
bassoy committed Nov 22, 2024
1 parent fb3c0fa commit 32053ff
Show file tree
Hide file tree
Showing 3 changed files with 247 additions and 86 deletions.
2 changes: 2 additions & 0 deletions include/tlib/detail/tags.h
Original file line number Diff line number Diff line change
Expand Up @@ -25,13 +25,15 @@ namespace tlib::ttm::parallel_policy
// Tag types of the ttm parallel_policy namespace. Each one is an empty struct
// that carries no data; presumably they are used purely for compile-time
// selection of an execution strategy (confirm against the ttm overloads).
struct sequential_t {}; // sequential loops and sequential gemm
struct parallel_blas_t {}; // sequential loops presumably; multithreaded gemm
struct parallel_loop_t {}; // omp_for over the loops with single-threaded gemm
struct parallel_taskloop_t {}; // omp_task for each loop with single-threaded gemm
struct parallel_loop_blas_t {}; // omp_for over the loops with multi-threaded gemm
struct batched_gemm_t {}; // multithreaded batched gemm with collapsed loops
struct combined_t {}; // NOTE(review): undocumented in this view — presumably mixes/selects among the policies above; confirm

// One ready-made constant per policy tag type. Each is explicitly
// value-initialized with `{}` instead of relying on default-initialization
// of a const object.
inline constexpr sequential_t         sequential{};
inline constexpr parallel_blas_t      parallel_blas{};
inline constexpr parallel_loop_t      parallel_loop{};
inline constexpr parallel_taskloop_t  parallel_taskloop{};
inline constexpr parallel_loop_blas_t parallel_loop_blas{};
inline constexpr batched_gemm_t       batched_gemm{};
inline constexpr combined_t           combined{};
Expand Down
Loading

0 comments on commit 32053ff

Please sign in to comment.