diff --git a/_sources/api_for_sycl_kernels/random.rst b/_sources/api_for_sycl_kernels/random.rst index 9e82d86c7b..6e200cc01a 100644 --- a/_sources/api_for_sycl_kernels/random.rst +++ b/_sources/api_for_sycl_kernels/random.rst @@ -11,53 +11,79 @@ Random Number Engines --------------------- Random number engines use seed data as an entropy source to generate pseudo-random numbers. -|onedpl_short| provides several class templates for customized engines, they are defined in the header -````. - -============================== ========================================================================================================= -Engine Description -============================== ========================================================================================================= -``linear_congruential_engine`` Implements a linear congruential algorithm -``subtract_with_carry_engine`` Implements a subtract-with-carry algorithm -``discard_block_engine`` Implements a discard block adaptor -============================== ========================================================================================================= +|onedpl_short| provides several class templates for customizable engines, defined in the header +```` under the ``oneapi::dpl::`` namespace. + +=============================== ============================================ +Engine Description +=============================== ============================================ +``linear_congruential_engine`` Implements a linear congruential algorithm +``subtract_with_carry_engine`` Implements a subtract-with-carry algorithm +``discard_block_engine`` Implements a discard block adaptor +``experimental::philox_engine`` Implements a Philox algorithm +=============================== ============================================ Predefined Random Number Engines -------------------------------- -Predefined random number engines are instantiations of random number engines class templates. 
-The types below are defined in the header ```` under the ``oneapi::dpl::`` namespace. - -===================================================================== ========================================================================================================= -Type Description -===================================================================== ========================================================================================================= -``minstd_rand0`` ``oneapi::dpl::linear_congruential_engine`` -``minstd_rand`` ``oneapi::dpl::linear_congruential_engine`` -``ranlux24_base`` ``oneapi::dpl::subtract_with_carry_engine`` -``ranlux48_base`` ``oneapi::dpl::subtract_with_carry_engine`` -``ranlux24`` ``oneapi::dpl::discard_block_engine`` -``ranlux48`` ``oneapi::dpl::discard_block_engine`` -===================================================================== ========================================================================================================= - -The engines described below can efficiently generate vectors of random numbers. These types are -defined in the header ```` under the ``oneapi::dpl::`` namespace. 
- -===================================================================== ========================================================================================================= -Type Description -===================================================================== ========================================================================================================= -``template minstd_rand0_vec`` ``oneapi::dpl::linear_congruential_engine, 16807, 0, 2147483647>`` - minstd_rand0 for a vector generation case -``template minstd_rand_vec`` ``oneapi::dpl::linear_congruential_engine, 48271, 0, 2147483647>`` - minstd_rand for a vector generation case -``template ranlux24_base_vec`` ``oneapi::dpl::subtract_with_carry_engine, 24, 10, 24>`` - ranlux24_base for a vector generation case -``template ranlux48_base_vec`` ``oneapi::dpl::subtract_with_carry_engine, 48, 5, 12>`` - ranlux48_base for a vector generation case -``template ranlux24_vec`` ``oneapi::dpl::discard_block_engine, 223, 23>`` - ranlux24 for a vector generation case -``template ranlux48_vec`` ``oneapi::dpl::discard_block_engine, 389, 11>`` - ranlux48 for vector generation case -===================================================================== ========================================================================================================= +Predefined random number engines are instantiations of the random number engines class templates +with selected engine parameters. + +The types below are defined in the header ```` in the same namespaces as their +respective class templates. 
+ +================== ================================================================================= +Type Description +================== ================================================================================= +``minstd_rand0`` ``oneapi::dpl::linear_congruential_engine`` +``minstd_rand`` ``oneapi::dpl::linear_congruential_engine`` +``ranlux24_base`` ``oneapi::dpl::subtract_with_carry_engine`` +``ranlux48_base`` ``oneapi::dpl::subtract_with_carry_engine`` +``ranlux24`` ``oneapi::dpl::discard_block_engine`` +``ranlux48`` ``oneapi::dpl::discard_block_engine`` +``philox4x32`` ``oneapi::dpl::experimental::philox_engine`` +``philox4x64`` ``oneapi::dpl::experimental::philox_engine`` +================== ================================================================================= + +The following predefined engines can efficiently generate vectors of random numbers. +They differ from the scalar engines above by using ``sycl::vec`` as the data type, +while other engine parameters remain the same. + +================================================== =============================================================================================== +Type Description +================================================== =============================================================================================== +``template minstd_rand0_vec`` ``oneapi::dpl::linear_congruential_engine, 16807, 0, 2147483647>`` + + ``minstd_rand0`` that generates a vector. +-------------------------------------------------- ----------------------------------------------------------------------------------------------- +``template minstd_rand_vec`` ``oneapi::dpl::linear_congruential_engine, 48271, 0, 2147483647>`` + + ``minstd_rand`` that generates a vector. 
+-------------------------------------------------- ----------------------------------------------------------------------------------------------- +``template ranlux24_base_vec`` ``oneapi::dpl::subtract_with_carry_engine, 24, 10, 24>`` + + ``ranlux24_base`` that generates a vector. +-------------------------------------------------- ----------------------------------------------------------------------------------------------- +``template ranlux48_base_vec`` ``oneapi::dpl::subtract_with_carry_engine, 48, 5, 12>`` + + ``ranlux48_base`` that generates a vector. +-------------------------------------------------- ----------------------------------------------------------------------------------------------- +``template ranlux24_vec`` ``oneapi::dpl::discard_block_engine, 223, 23>`` + + ``ranlux24`` that generates a vector. +-------------------------------------------------- ----------------------------------------------------------------------------------------------- +``template ranlux48_vec`` ``oneapi::dpl::discard_block_engine, 389, 11>`` + + ``ranlux48`` that generates a vector. +-------------------------------------------------- ----------------------------------------------------------------------------------------------- +``template philox4x32_vec`` ``oneapi::dpl::experimental::philox_engine, 32, 4, 10, 0xCD9E8D57, 0x9E3779B9, 0xD2511F53, 0xBB67AE85>`` + + ``philox4x32`` that generates a vector. +-------------------------------------------------- ----------------------------------------------------------------------------------------------- +``template philox4x64_vec`` ``oneapi::dpl::experimental::philox_engine, 64, 4, 10, 0xCA5A826395121157, 0x9E3779B97F4A7C15, 0xD2E7470EE14C6C93, 0xBB67AE8584CAA73B>`` + + ``philox4x64`` that generates a vector. 
+================================================== =============================================================================================== Random Number Distributions --------------------------- @@ -66,9 +92,9 @@ Random number distributions process the output of random number engines in such resulting output is distributed according to a defined statistical probability density function. They are defined in the header ```` under the ``oneapi::dpl::`` namespace. -============================== ========================================================================================================= +============================== ============================================================================ Distribution Description -============================== ========================================================================================================= +============================== ============================================================================ ``uniform_int_distribution`` Produces integer values evenly distributed across a range ``uniform_real_distribution`` Produces real values evenly distributed across a range ``normal_distribution`` Produces real values according to the Normal (Gaussian) distribution @@ -79,7 +105,10 @@ Distribution Description ``lognormal_distribution`` Produces real values according to the Lognormal distribution ``extreme_value_distribution`` Produces real values according to the Extreme value (Gumbel) distribution ``cauchy_distribution`` Produces real values according to the Cauchy distribution -============================== ========================================================================================================= +============================== ============================================================================ + +.. 
note:: + ``bernoulli_distribution``, ``geometric_distribution``, and ``uniform_int_distribution`` can only be used on devices with FP64 support as they rely on double precision in their implementation (use ``sycl::aspect::fp64`` to check if the device supports FP64). Usage Model of |onedpl_short| Random Number Generation Functionality -------------------------------------------------------------------- diff --git a/_sources/api_for_sycl_kernels/tested_standard_cpp_api.rst b/_sources/api_for_sycl_kernels/tested_standard_cpp_api.rst index af87a010f9..cd7691bb60 100644 --- a/_sources/api_for_sycl_kernels/tested_standard_cpp_api.rst +++ b/_sources/api_for_sycl_kernels/tested_standard_cpp_api.rst @@ -463,9 +463,9 @@ C++ Standard API libstdc++ libc++ MSVC These tests were done for the following versions of the standard C++ library: ============================================= ============================================= -libstdc++(GNU) Provided with GCC*-7.5.0, GCC*-9.3.0 +libstdc++ (GNU) Provided with GCC*-7.5.0, GCC*-9.3.0 --------------------------------------------- --------------------------------------------- -libc++(LLVM) Provided with Clang*-11.0 +libc++ (LLVM) Provided with Clang*-11.0 --------------------------------------------- --------------------------------------------- Microsoft Visual C++* (MSVC) Standard Library Provided with Microsoft Visual Studio* 2017; Microsoft Visual Studio 2019; and Microsoft diff --git a/_sources/api_for_sycl_kernels/utility_function_object_classes.rst b/_sources/api_for_sycl_kernels/utility_function_object_classes.rst index b760041ebf..af1f368442 100644 --- a/_sources/api_for_sycl_kernels/utility_function_object_classes.rst +++ b/_sources/api_for_sycl_kernels/utility_function_object_classes.rst @@ -2,11 +2,11 @@ Utility Function Object Classes ################################## The definitions of the utility function objects are available through the -``oneapi/dpl/functional`` header. 
All function objects are implemented in the ``oneapi::dpl`` namespace.
+``<oneapi/dpl/functional>`` header. All function objects are implemented in the ``oneapi::dpl`` namespace.
 
-* ``identity``: A C++11 implementation of the C++20 ``std::identity`` function object type, where the operator() returns the
-  argument unchanged.
-* ``minimum``: A function object type where the operator() applies ``std::less`` to its arguments, then returns the
-  lesser argument unchanged.
-* ``maximum``: A function object type where the operator() applies ``std::greater`` to its arguments, then returns the
-  greater argument unchanged.
\ No newline at end of file
+* ``identity``: A function object type where the operator() returns the argument unchanged.
+  It is an implementation of ``std::identity`` that can be used prior to C++20.
+* ``minimum``: A function object type where the operator() applies ``std::less`` to its arguments,
+  then returns the lesser argument unchanged.
+* ``maximum``: A function object type where the operator() applies ``std::greater`` to its arguments,
+  then returns the greater argument unchanged.
\ No newline at end of file
diff --git a/_sources/api_for_sycl_kernels_main.rst b/_sources/api_for_sycl_kernels_main.rst
index 333f9e24c2..2a9aad44a7 100644
--- a/_sources/api_for_sycl_kernels_main.rst
+++ b/_sources/api_for_sycl_kernels_main.rst
@@ -1,5 +1,5 @@
-API for the SYCL* Kernels
-#########################
+API for SYCL* Kernels
+#####################
 
 |onedpl_long| (|onedpl_short|) includes the following APIs for SYCL* kernels:
 
@@ -13,9 +13,8 @@ API for SYCL* Kernels
 .. 
toctree:: :maxdepth: 2 :titlesonly: - :glob: :hidden: - api_for_sycl_kernels/random api_for_sycl_kernels/tested_standard_cpp_api - api_for_sycl_kernels/utility_function_object_classes \ No newline at end of file + api_for_sycl_kernels/random + api_for_sycl_kernels/utility_function_object_classes diff --git a/_sources/cmake_support.rst b/_sources/cmake_support.rst index 61eb16ef28..2d50cfa506 100644 --- a/_sources/cmake_support.rst +++ b/_sources/cmake_support.rst @@ -17,7 +17,10 @@ Requirements ============ The minimal supported CMake version for |onedpl_short| is 3.11 on Linux and 3.20 on Windows. -The supported `CMake Generator `_ for Linux is `Unix Makefiles `_ (default). In the Windows environment, the supported generator is `Ninja `_ as described in the `Intel® oneAPI DPC++/C++ Compiler Developer Guide and Reference `_ which may be specified via ``-GNinja``. +The supported `CMake Generator `_ +for Linux is `Unix Makefiles `_ (default). +In the Windows environment, the supported generator is `Ninja `_ +which may be specified via ``-GNinja`` as described in the |dpcpp_cmake_support|_. |onedpl_short| Backend Options ============================== diff --git a/_sources/dynamic_selection_api/auto_tune_policy.rst b/_sources/dynamic_selection_api/auto_tune_policy.rst index 4bdf3ea792..8ab8a2be46 100644 --- a/_sources/dynamic_selection_api/auto_tune_policy.rst +++ b/_sources/dynamic_selection_api/auto_tune_policy.rst @@ -1,248 +1,260 @@ -Auto-Tune Policy -################ - -The dynamic selection API is an experimental feature in the |onedpl_long| -(|onedpl_short|) that selects an *execution resource* based on a chosen -*selection policy*. There are several policies provided as part -of the API. Policies encapsulate the logic and any associated state needed -to make a selection. - -The auto-tune policy selects resources using runtime profiling. ``auto_tune_policy`` -is useful for determining which resource performs best -for a given kernel. 
The choice is made based on runtime performance -history, so this policy is only useful for kernels that have stable -performance. Initially, this policy acts like ``round_robin_policy``, -rotating through each resource (one or more times). Then, once it has -determined which resource is performing best, it uses that resource -thereafter. Optionally, a resampling interval can be set to return to -the profiling phase periodically. - -.. code:: cpp - - namespace oneapi::dpl::experimental { - - template - class auto_tune_policy { - public: - // useful types - using resource_type = typename Backend::resource_type; - using wait_type = typename Backend::wait_type; - - class selection_type { - public: - auto_tune_policy get_policy() const; - resource_type unwrap() const; - }; - - // constructors - auto_tune_policy(deferred_initialization_t); - auto_tune_policy(uint64_t resample_interval_in_milliseconds = 0); - auto_tune_policy(const std::vector& u, - uint64_t resample_interval_in_milliseconds = 0); - - // deferred initializer - void initialize(uint64_t resample_interval_in_milliseconds = 0); - void initialize(const std::vector& u, - uint64_t resample_interval_in_milliseconds = 0); - - // queries - auto get_resources() const; - auto get_submission_group(); - - // other implementation defined functions... - }; - - } - -This policy can be used with all the dynamic selection functions, such as ``select``, ``submit``, -and ``submit_and_wait``. It can also be used with ``policy_traits``. - -Example -------- - -In the following example, an ``auto_tune_policy`` is used to dynamically select between -two queues, a CPU queue and a GPU queue. - -.. 
code:: cpp - - #include - #include - #include - - namespace ex = oneapi::dpl::experimental; - - int main() { - std::vector r { sycl::queue{sycl::cpu_selector_v}, - sycl::queue{sycl::gpu_selector_v} }; - - const std::size_t N = 10000; - std::vector av(N, 0.0); - std::vector bv(N, 0.0); - std::vector cv(N, 0.0); - for (int i = 0; i < N; ++i) { - av[i] = bv[i] = i; - } - - ex::auto_tune_policy p{r}; // (1) - - { - sycl::buffer a_b(av); - sycl::buffer b_b(bv); - sycl::buffer c_b(cv); - - - for (int i = 0; i < 6; ++i) { - ex::submit_and_wait(p, [&](sycl::queue q) { // (2) - // (3) - std::cout << (q.get_device().is_cpu() ? "using cpu\n" : "using gpu\n"); - return q.submit([&](sycl::handler &h) { // (4) - sycl::accessor a_a(a_b, h, sycl::read_only); - sycl::accessor b_a(b_b, h, sycl::read_only); - sycl::accessor c_a(c_b, h, sycl::read_write); - h.parallel_for(N, [=](auto i) { c_a[i] = a_a[i] + b_a[i]; }); - }); - }); - }; - } - - for (int i = 0; i < N; ++i) { - if (cv[i] != 2*i) { - std::cout << "ERROR!\n"; - } - } - std::cout << "Done.\n"; - } - -The key points in this example are: - -#. An ``auto_tune_policy`` is constructed to select between the CPU and GPU. -#. ``submit_and_wait`` is invoked with the policy as the first argument. The selected queue will be passed to the user-provided function. -#. For clarity when run, the type of device is displayed. -#. The queue is used in function to perform and asynchronous offload. The SYCL event returned from the call to ``submit`` is returned. Returning an event is required for functions passed to ``submit`` and ``submit_and_wait``. - -Selection Algorithm -------------------- - -The selection algorithm for ``auto_tune_policy`` uses runtime profiling -to choose the best resource for the given function. A simplified, expository -implementation of the selection algorithm follows: - -.. 
code:: - - template - selection_type auto_tune_policy::select(Function&& f, Args&&...args) { - if (initialized_) { - auto k = make_task_key(f, args...); - auto tuner = get_tuner(k); - auto offset = tuner->get_resource_to_profile(); - if (offset == use_best) { - return selection_type {*this, tuner->best_resource_, tuner}; - } else { - auto r = resources_[offset]; - return selection{*this, r, tuner}; - } - } else { - throw std::logic_error(“selected called before initialization”); - } - } - -where ``make_task_key`` combines the inputs, including the function and its -arguments, into a key that uniquely identifies the user function that is being -profiled. ``tuner`` is the encapsulated logic for performing runtime profiling -and choosing the best option for a given key. When the call to ``get_resource_to_profile()`` -return ``use_best``, the tuner is not in the profiling phase, and so the previously -determined best resource is used. Otherwise, the resource at index ``offset`` -in the ``resources_`` vector is used and its resulting performance is profiled. -When an ``auto_tune_policy`` is initialized with a non-zero resample interval, -the policy will periodically return to the profiling phase base on the provided -interval value. - -Constructors ------------- - -``auto_tune_policy`` provides three constructors. - -.. list-table:: ``auto_tune_policy`` constructors - :widths: 50 50 - :header-rows: 1 - - * - Signature - - Description - * - ``auto_tune_policy(deferred_initialization_t);`` - - Defers initialization. An ``initialize`` function must be called prior to use. - * - ``auto_tune_policy(uint64_t resample_interval_in_milliseconds = 0);`` - - Initialized to use the default set of resources. An optional resampling interval can be provided. - * - ``auto_tune_policy(const std::vector& u, uint64_t resample_interval_in_milliseconds = 0);`` - - Overrides the default set of resources. An optional resampling interval can be provided. 
- -Deferred Initialization ------------------------ - -A ``auto_tune_policy`` that was constructed with deferred initialization must be -initialized by calling one its ``initialize`` member functions before it can be used -to select or submit. - -.. list-table:: ``auto_tune_policy`` constructors - :widths: 50 50 - :header-rows: 1 - - * - Signature - - Description - * - ``initialize(uint64_t resample_interval_in_milliseconds = 0);`` - - Initialize to use the default set of resources. An optional resampling interval can be provided. - * - ``initialize(const std::vector& u, uint64_t resample_interval_in_milliseconds = 0);`` - - Overrides the default set of resources. An optional resampling interval can be provided. - -Queries -------- - -A ``auto_tune_policy`` has ``get_resources`` and ``get_submission_group`` -member functions. - -.. list-table:: ``auto_tune_policy`` constructors - :widths: 50 50 - :header-rows: 1 - - * - Signature - - Description - * - ``std::vector get_resources();`` - - Returns the set of resources the policy is selecting from. - * - ``auto get_submission_group();`` - - Returns an object that can be used to wait for all active submissions. - -Reporting Requirements ----------------------- - -If a resource returned by ``select`` is used directly without calling -``submit`` or ``submit_and_wait``, it may be necessary to call ``report`` -to provide feedback to the policy. The ``auto_tune_policy`` tracks the -performance of submissions on each device via callbacks that report -the execution time. The instrumentation to report these events is included -in the implementations of ``submit`` and ``submit_and_wait``. However, if you -use ``select`` and then submit work directly to the selected resource, it -is necessary to explicitly report these events. - -.. list-table:: ``auto_tune_policy`` reporting requirements - :widths: 50 50 - :header-rows: 1 - - * - ``execution_info`` - - is reporting required? 
- * - ``task_submission`` - - No - * - ``task_completion`` - - No - * - ``task_time`` - - Yes - -In generic code, it is possible to perform compile-time checks to avoid -reporting overheads when reporting is not needed, while still writing -code that will work with any policy, as demonstrated below: - -.. code:: cpp - - auto s = select(my_policy); - if constexpr (report_info_v) - { - s.report(execution_info::task_submission); - } +Auto-Tune Policy +################ + +The dynamic selection API is an experimental feature in the |onedpl_long| +(|onedpl_short|) that selects an *execution resource* based on a chosen +*selection policy*. There are several policies provided as part +of the API. Policies encapsulate the logic and any associated state needed +to make a selection. + +The auto-tune policy selects resources using runtime profiling. ``auto_tune_policy`` +is useful for determining which resource performs best +for a given kernel. The choice is made based on runtime performance +history, so this policy is only useful for kernels that have stable +performance. Initially, this policy acts like ``round_robin_policy``, +rotating through each resource (one or more times). Then, once it has +determined which resource is performing best, it uses that resource +thereafter. Optionally, a resampling interval can be set to return to +the profiling phase periodically. + +.. 
code:: cpp
+
+    namespace oneapi::dpl::experimental {
+
+      template <typename Backend, typename... KeyArgs>
+      class auto_tune_policy {
+      public:
+        // useful types
+        using resource_type = typename Backend::resource_type;
+        using wait_type = typename Backend::wait_type;
+
+        class selection_type {
+        public:
+          auto_tune_policy get_policy() const;
+          resource_type unwrap() const;
+        };
+
+        // constructors
+        auto_tune_policy(deferred_initialization_t);
+        auto_tune_policy(uint64_t resample_interval_in_milliseconds = 0);
+        auto_tune_policy(const std::vector<resource_type>& u,
+                         uint64_t resample_interval_in_milliseconds = 0);
+
+        // deferred initializer
+        void initialize(uint64_t resample_interval_in_milliseconds = 0);
+        void initialize(const std::vector<resource_type>& u,
+                        uint64_t resample_interval_in_milliseconds = 0);
+
+        // queries
+        auto get_resources() const;
+        auto get_submission_group();
+
+        // other implementation defined functions...
+      };
+
+    }
+
+This policy can be used with all the dynamic selection functions, such as ``select``, ``submit``,
+and ``submit_and_wait``. It can also be used with ``policy_traits``.
+
+Example
+-------
+
+In the following example, an ``auto_tune_policy`` is used to dynamically select between
+two queues, a CPU queue and a GPU queue.
+
+.. code:: cpp
+
+    #include <oneapi/dpl/dynamic_selection>
+    #include <sycl/sycl.hpp>
+    #include <iostream>
+
+    namespace ex = oneapi::dpl::experimental;
+
+    int main() {
+      std::vector<sycl::queue> r { sycl::queue{sycl::cpu_selector_v},
+                                   sycl::queue{sycl::gpu_selector_v} };
+
+      const std::size_t N = 10000;
+      std::vector<float> av(N, 0.0);
+      std::vector<float> bv(N, 0.0);
+      std::vector<float> cv(N, 0.0);
+      for (int i = 0; i < N; ++i) {
+        av[i] = bv[i] = i;
+      }
+
+      ex::auto_tune_policy p{r}; // (1)
+
+      {
+        sycl::buffer a_b(av);
+        sycl::buffer b_b(bv);
+        sycl::buffer c_b(cv);
+
+        for (int i = 0; i < 6; ++i) {
+          ex::submit_and_wait(p, [&](sycl::queue q) { // (2)
+            // (3)
+            std::cout << (q.get_device().is_cpu() ? "using cpu\n" : "using gpu\n");
+            return q.submit([&](sycl::handler &h) { // (4)
+              sycl::accessor a_a(a_b, h, sycl::read_only);
+              sycl::accessor b_a(b_b, h, sycl::read_only);
+              sycl::accessor c_a(c_b, h, sycl::read_write);
+              h.parallel_for(N, [=](auto i) { c_a[i] = a_a[i] + b_a[i]; });
+            });
+          });
+        }
+      }
+
+      for (int i = 0; i < N; ++i) {
+        if (cv[i] != 2*i) {
+          std::cout << "ERROR!\n";
+        }
+      }
+      std::cout << "Done.\n";
+    }
+
+The key points in this example are:
+
+#. An ``auto_tune_policy`` is constructed to select between the CPU and GPU.
+#. ``submit_and_wait`` is invoked with the policy as the first argument. The selected queue will be passed to the user-provided function.
+#. For clarity when run, the type of device is displayed.
+#. The queue is used in a function to perform an asynchronous offload. The SYCL event returned from the call to ``submit`` is returned. Returning an event is required for functions passed to ``submit`` and ``submit_and_wait``.
+
+Selection Algorithm
+-------------------
+
+The selection algorithm for ``auto_tune_policy`` uses runtime profiling
+to choose the best resource for the given function. A simplified, expository
+implementation of the selection algorithm follows:
+
+.. code:: cpp
+
+    template <typename Function, typename... Args>
+    selection_type auto_tune_policy::select(Function&& f, Args&&... args) {
+      if (initialized_) {
+        auto k = make_task_key(f, args...);
+        auto tuner = get_tuner(k);
+        auto offset = tuner->get_resource_to_profile();
+        if (offset == use_best) {
+          return selection_type{*this, tuner->best_resource_, tuner};
+        } else {
+          auto r = resources_[offset];
+          return selection_type{*this, r, tuner};
+        }
+      } else {
+        throw std::logic_error("select called before initialization");
+      }
+    }
+
+where ``make_task_key`` combines the inputs, including the function and its
+arguments, into a key that uniquely identifies the user function that is being
+profiled. 
``tuner`` is the encapsulated logic for performing runtime profiling
+and choosing the best option for a given key. When the call to ``get_resource_to_profile()``
+returns ``use_best``, the tuner is not in the profiling phase, and so the previously
+determined best resource is used. Otherwise, the resource at index ``offset``
+in the ``resources_`` vector is used and its resulting performance is profiled.
+When an ``auto_tune_policy`` is initialized with a non-zero resample interval,
+the policy will periodically return to the profiling phase based on the provided
+interval value.
+
+Constructors
+------------
+
+``auto_tune_policy`` provides three constructors.
+
+.. list-table:: ``auto_tune_policy`` constructors
+   :widths: 50 50
+   :header-rows: 1
+
+   * - Signature
+     - Description
+   * - ``auto_tune_policy(deferred_initialization_t);``
+     - Defers initialization. An ``initialize`` function must be called prior to use.
+   * - ``auto_tune_policy(uint64_t resample_interval_in_milliseconds = 0);``
+     - Initialized to use the default set of resources. An optional resampling interval can be provided.
+   * - ``auto_tune_policy(const std::vector<resource_type>& u, uint64_t resample_interval_in_milliseconds = 0);``
+     - Overrides the default set of resources. An optional resampling interval can be provided.
+
+.. Note::
+
+   When initializing the ``auto_tune_policy`` with SYCL queues, constructing the queues with the
+   ``sycl::property::queue::enable_profiling`` property allows a more accurate determination of the
+   best-performing device to be made.
+
+Deferred Initialization
+-----------------------
+
+An ``auto_tune_policy`` that was constructed with deferred initialization must be
+initialized by calling one of its ``initialize`` member functions before it can be used
+to select or submit.
+
+.. 
list-table:: ``auto_tune_policy`` ``initialize`` functions
+   :widths: 50 50
+   :header-rows: 1
+
+   * - Signature
+     - Description
+   * - ``initialize(uint64_t resample_interval_in_milliseconds = 0);``
+     - Initializes to use the default set of resources. An optional resampling interval can be provided.
+   * - ``initialize(const std::vector<resource_type>& u, uint64_t resample_interval_in_milliseconds = 0);``
+     - Overrides the default set of resources. An optional resampling interval can be provided.
+
+.. Note::
+
+   When initializing the ``auto_tune_policy`` with SYCL queues, constructing the queues with the
+   ``sycl::property::queue::enable_profiling`` property allows a more accurate determination of the
+   best-performing device to be made.
+
+Queries
+-------
+
+An ``auto_tune_policy`` has ``get_resources`` and ``get_submission_group``
+member functions.
+
+.. list-table:: ``auto_tune_policy`` queries
+   :widths: 50 50
+   :header-rows: 1
+
+   * - Signature
+     - Description
+   * - ``std::vector<resource_type> get_resources();``
+     - Returns the set of resources the policy is selecting from.
+   * - ``auto get_submission_group();``
+     - Returns an object that can be used to wait for all active submissions.
+
+Reporting Requirements
+----------------------
+
+If a resource returned by ``select`` is used directly without calling
+``submit`` or ``submit_and_wait``, it may be necessary to call ``report``
+to provide feedback to the policy. The ``auto_tune_policy`` tracks the
+performance of submissions on each device via callbacks that report
+the execution time. The instrumentation to report these events is included
+in the implementations of ``submit`` and ``submit_and_wait``. However, if you
+use ``select`` and then submit work directly to the selected resource, it
+is necessary to explicitly report these events.
+
+.. list-table:: ``auto_tune_policy`` reporting requirements
+   :widths: 50 50
+   :header-rows: 1
+
+   * - ``execution_info``
+     - Is reporting required? 
+ * - ``task_submission`` + - No + * - ``task_completion`` + - No + * - ``task_time`` + - Yes + +In generic code, it is possible to perform compile-time checks to avoid +reporting overheads when reporting is not needed, while still writing +code that will work with any policy, as demonstrated below: + +.. code:: cpp + + auto s = select(my_policy); + if constexpr (report_info_v) + { + s.report(execution_info::task_submission); + } diff --git a/_sources/dynamic_selection_api/dynamic_load_policy.rst b/_sources/dynamic_selection_api/dynamic_load_policy.rst index ffd7dae485..93a1f6c482 100644 --- a/_sources/dynamic_selection_api/dynamic_load_policy.rst +++ b/_sources/dynamic_selection_api/dynamic_load_policy.rst @@ -1,231 +1,231 @@ -Dynamic Load Policy -################### - -The dynamic selection API is an experimental feature in the |onedpl_long| -(|onedpl_short|) that selects an *execution resource* based on a chosen -*selection policy*. There are several policies provided as part -of the API. Policies encapsulate the logic and any associated state needed -to make a selection. - -The dynamic load policy tracks the number of submissions currently submitted but not yet completed on each -resource and selects the resource that has the fewest unfinished submissions. -``dynamic_load_policy`` is useful for offloading kernels of varying cost to devices -of varying performance. A load-based assignment may achieve a good load balancing -by submitting tasks to a resource that completes work faster. - -.. 
code:: cpp - - namespace oneapi::dpl::experimental { - - template - class dynamic_load_policy { - public: - // useful types - using resource_type = typename Backend::resource_type; - using wait_type = typename Backend::wait_type; - - class selection_type { - public: - dynamic_load_policy get_policy() const; - resource_type unwrap() const; - }; - - // constructors - dynamic_load_policy(deferred_initialization_t); - dynamic_load_policy(); - dynamic_load_policy(const std::vector& u); - - // deferred initializer - void initialize(); - void initialize(const std::vector& u); - - // queries - auto get_resources() const; - auto get_submission_group(); - - // other implementation defined functions... - }; - - } - -This policy can be used with all the dynamic selection functions, such as ``select``, ``submit``, -and ``submit_and_wait``. It can also be used with ``policy_traits``. - -Example -------- - -The following example demonstrates a simple approach to send work to more than -one queue concurrently using ``dynamic_load_policy``. The policy selects the -resource with the fewest number of unfinished submissions. - -.. 
code:: cpp - - #include - #include - #include - - const std::size_t N = 10000; - namespace ex = oneapi::dpl::experimental; - - void f(sycl::handler& h, float* v); - void do_cpu_work(); - - int dynamic_load_example(std::vector& devices, - std::vector& usm_data) { - - ex::dynamic_load_policy p{devices}; // (1) - - auto num_devices = p.get_resources().size(); - auto num_arrays = usm_data.size(); - // (2) - auto submission_group_size = num_arrays; - - std::cout << "Running with " << num_devices << " queues\n" - << " " << num_arrays << " usm arrays\n" - << "Will perform " << submission_group_size << " concurrent offloads\n"; - - - for (int i = 0; i < 100; i+=submission_group_size) { // (3) - for (int j = 0; j < submission_group_size; ++j) { // (4) - ex::submit(p, [&](sycl::queue q) { // (5) - float *data = usm_data[j]; - return q.submit([=](sycl::handler &h) { // (6) - f(h, data); - }); - }); - do_cpu_work(); // (7) - } - ex::wait(p.get_submission_group()); // (8) - } - return 0; - } - -The key points in this example are: - -#. A ``dynamic_load_policy`` is constructed that selects from queues in the ``devices`` vector. -#. The total number of concurrent offloads, ``submission_group_size``, will be limited to the number of USM arrays. In this example, we allow multiple simultaneous offloads to the same queue. The only limitation is that there should be enough available vectors to support the concurrent executions. -#. The outer ``i``-loop iterates from 0 to 99, stepping by the ``submission_group_size``. This number of submissions will be offloaded concurrently. -#. The inner ``j``-loop iterates over ``submission_group_size`` submissions. -#. ``submit`` is used to select a queue and pass it to the user's function, but does not block until the event returned by that function completes. This provides the opportunity for concurrency across the submissions. -#. The queue is used in a function to perform an asynchronous offload. 
The SYCL event returned from the call to ``submit`` is returned. Returning an event is required for functions passed to ``submit`` and ``submit_and_wait``. -#. Some additional work is done between calls to ``submit``. ``dynamic_load_policy`` is most useful when there is time for work to complete on some devices before the next assignment is made. If all submissions are performed simultaneously, all devices will appear equally loaded, since the fast devices would have had no time to complete their work. -#. ``wait`` is called to block for all the concurrent ``submission_group_size`` submissions to complete. - -Selection Algorithm -------------------- - -The selection algorithm for ``dynamic_load_policy`` chooses the resource -that has the fewest number of unfinished offloads. The number of unfinished -offloads is the difference between the number of reported task submissions -and then number of reported task completions. This value is tracked for each -available resource. - -Simplified, expository implementation of the selection algorithm: - -.. code:: - - template - selection_type dynamic_load_policy::select(Args&& ...) { - if (initialized_) { - auto least_loaded_resource = find_least_loaded(resources_); - return selection_type{dynamic_load_policy(*this), least_loaded}; - } else { - throw std::logic_error("select called before initialialization"); - } - } - -where ``resources_`` is a container of resources, such as -``std::vector`` of ``sycl::queue``. The function ``find_least_loaded`` -iterates through the resources available to the policy and returns the -resource with the fewest number of unfinished offloads. - -Constructors ------------- - -``dynamic_load_policy`` provides three constructors. - -.. list-table:: ``dynamic_load_policy`` constructors - :widths: 50 50 - :header-rows: 1 - - * - Signature - - Description - * - ``dynamic_load_policy(deferred_initialization_t);`` - - Defers initialization. An ``initialize`` function must be called prior to use. 
- * - ``dynamic_load_policy();`` - - Initialized to use the default set of resources. - * - ``dynamic_load_policy(const std::vector& u);`` - - Overrides the default set of resources. - -Deferred Initialization ------------------------ - -A ``dynamic_load_policy`` that was constructed with deferred initialization must be -initialized by calling one of its ``initialize`` member functions before it can be used -to select or submit. - -.. list-table:: ``dynamic_load_policy`` constructors - :widths: 50 50 - :header-rows: 1 - - * - Signature - - Description - * - ``initialize();`` - - Initialize to use the default set of resources. - * - ``initialize(const std::vector& u);`` - - Overrides the default set of resources. - -Queries -------- - -A ``dynamic_load_policy`` has ``get_resources`` and ``get_submission_group`` -member functions. - -.. list-table:: ``dynamic_load_policy`` constructors - :widths: 50 50 - :header-rows: 1 - - * - Signature - - Description - * - ``std::vector get_resources();`` - - Returns the set of resources the policy is selecting from. - * - ``auto get_submission_group();`` - - Returns an object that can be used to wait for all active submissions. - -Reporting Requirements ----------------------- - -If a resource returned by ``select`` is used directly without calling -``submit`` or ``submit_and_wait``, it may be necessary to call ``report`` -to provide feedback to the policy. The ``dynamic_load_policy`` tracks the -number of outstanding submissions on each device via callbacks that report -when a submission is started, and when it is completed. The instrumentation -to report these events is included in the implementations of -``submit`` and ``submit_and_wait``. However, if you use ``select`` and then -submit work directly to the selected resource, it is necessary to explicitly -report these events. - -.. 
list-table:: ``dynamic_load_policy`` reporting requirements - :widths: 50 50 - :header-rows: 1 - - * - ``execution_info`` - - is reporting required? - * - ``task_submission`` - - Yes - * - ``task_completion`` - - Yes - * - ``task_time`` - - No - -In generic code, it is possible to perform compile-time checks to avoid -reporting overheads when reporting is not needed, while still writing -code that will work with any policy, as demonstrated below: - -.. code:: cpp - - auto s = select(my_policy); - if constexpr (report_info_v) - { - s.report(execution_info::task_submission); - } +Dynamic Load Policy +################### + +The dynamic selection API is an experimental feature in the |onedpl_long| +(|onedpl_short|) that selects an *execution resource* based on a chosen +*selection policy*. There are several policies provided as part +of the API. Policies encapsulate the logic and any associated state needed +to make a selection. + +The dynamic load policy tracks the number of submissions currently submitted but not yet completed on each +resource and selects the resource that has the fewest unfinished submissions. +``dynamic_load_policy`` is useful for offloading kernels of varying cost to devices +of varying performance. A load-based assignment may achieve a good load balancing +by submitting tasks to a resource that completes work faster. + +.. 
code:: cpp
+
+   namespace oneapi::dpl::experimental {
+
+     template <typename Backend>
+     class dynamic_load_policy {
+     public:
+       // useful types
+       using resource_type = typename Backend::resource_type;
+       using wait_type = typename Backend::wait_type;
+
+       class selection_type {
+       public:
+         dynamic_load_policy get_policy() const;
+         resource_type unwrap() const;
+       };
+
+       // constructors
+       dynamic_load_policy(deferred_initialization_t);
+       dynamic_load_policy();
+       dynamic_load_policy(const std::vector<resource_type>& u);
+
+       // deferred initializers
+       void initialize();
+       void initialize(const std::vector<resource_type>& u);
+
+       // queries
+       auto get_resources() const;
+       auto get_submission_group();
+
+       // other implementation defined functions...
+     };
+
+   }
+
+This policy can be used with all the dynamic selection functions, such as ``select``, ``submit``,
+and ``submit_and_wait``. It can also be used with ``policy_traits``.
+
+Example
+-------
+
+The following example demonstrates a simple approach to send work to more than
+one queue concurrently using ``dynamic_load_policy``. The policy selects the
+resource with the fewest number of unfinished submissions.
+
+..
code:: cpp
+
+   #include <oneapi/dpl/dynamic_selection>
+   #include <sycl/sycl.hpp>
+   #include <iostream>
+
+   const std::size_t N = 10000;
+   namespace ex = oneapi::dpl::experimental;
+
+   void f(sycl::handler& h, float* v);
+   void do_cpu_work();
+
+   int dynamic_load_example(std::vector<sycl::queue>& devices,
+                            std::vector<float*>& usm_data) {
+
+     ex::dynamic_load_policy p{devices}; // (1)
+
+     auto num_devices = p.get_resources().size();
+     auto num_arrays = usm_data.size();
+     // (2)
+     auto submission_group_size = num_arrays;
+
+     std::cout << "Running with " << num_devices << " queues\n"
+               << " " << num_arrays << " usm arrays\n"
+               << "Will perform " << submission_group_size << " concurrent offloads\n";
+
+     for (int i = 0; i < 100; i+=submission_group_size) { // (3)
+       for (int j = 0; j < submission_group_size; ++j) {  // (4)
+         ex::submit(p, [&](sycl::queue q) {               // (5)
+           float *data = usm_data[j];
+           return q.submit([=](sycl::handler &h) {        // (6)
+             f(h, data);
+           });
+         });
+         do_cpu_work();                                   // (7)
+       }
+       ex::wait(p.get_submission_group());                // (8)
+     }
+     return 0;
+   }
+
+The key points in this example are:
+
+#. A ``dynamic_load_policy`` is constructed that selects from queues in the ``devices`` vector.
+#. The total number of concurrent offloads, ``submission_group_size``, will be limited to the number of USM arrays. In this example, we allow multiple simultaneous offloads to the same queue. The only limitation is that there should be enough available vectors to support the concurrent executions.
+#. The outer ``i``-loop iterates from 0 to 99, stepping by the ``submission_group_size``. This number of submissions will be offloaded concurrently.
+#. The inner ``j``-loop iterates over ``submission_group_size`` submissions.
+#. ``submit`` is used to select a queue and pass it to the user's function, but does not block until the event returned by that function completes. This provides the opportunity for concurrency across the submissions.
+#. The queue is used in a function to perform an asynchronous offload.
The SYCL event returned from the call to ``submit`` is returned. Returning an event is required for functions passed to ``submit`` and ``submit_and_wait``.
+#. Some additional work is done between calls to ``submit``. ``dynamic_load_policy`` is most useful when there is time for work to complete on some devices before the next assignment is made. If all submissions are performed simultaneously, all devices will appear equally loaded, since the fast devices would have had no time to complete their work.
+#. ``wait`` is called to block for all the concurrent ``submission_group_size`` submissions to complete.
+
+Selection Algorithm
+-------------------
+
+The selection algorithm for ``dynamic_load_policy`` chooses the resource
+that has the fewest number of unfinished offloads. The number of unfinished
+offloads is the difference between the number of reported task submissions
+and the number of reported task completions. This value is tracked for each
+available resource.
+
+Simplified, expository implementation of the selection algorithm:
+
+.. code:: cpp
+
+   template <typename... Args>
+   selection_type dynamic_load_policy::select(Args&&...) {
+     if (initialized_) {
+       auto least_loaded_resource = find_least_loaded(resources_);
+       return selection_type{dynamic_load_policy(*this), least_loaded_resource};
+     } else {
+       throw std::logic_error("select called before initialization");
+     }
+   }
+
+where ``resources_`` is a container of resources, such as
+``std::vector`` of ``sycl::queue``. The function ``find_least_loaded``
+iterates through the resources available to the policy and returns the
+resource with the fewest number of unfinished offloads.
+
+Constructors
+------------
+
+``dynamic_load_policy`` provides three constructors.
+
+.. list-table:: ``dynamic_load_policy`` constructors
+   :widths: 50 50
+   :header-rows: 1
+
+   * - Signature
+     - Description
+   * - ``dynamic_load_policy(deferred_initialization_t);``
+     - Defers initialization. An ``initialize`` function must be called prior to use.
+   * - ``dynamic_load_policy();``
+     - Initializes to use the default set of resources.
+   * - ``dynamic_load_policy(const std::vector<resource_type>& u);``
+     - Overrides the default set of resources.
+
+Deferred Initialization
+-----------------------
+
+A ``dynamic_load_policy`` that was constructed with deferred initialization must be
+initialized by calling one of its ``initialize`` member functions before it can be used
+to select or submit.
+
+.. list-table:: ``dynamic_load_policy`` deferred initializers
+   :widths: 50 50
+   :header-rows: 1
+
+   * - Signature
+     - Description
+   * - ``initialize();``
+     - Initializes to use the default set of resources.
+   * - ``initialize(const std::vector<resource_type>& u);``
+     - Overrides the default set of resources.
+
+Queries
+-------
+
+A ``dynamic_load_policy`` has ``get_resources`` and ``get_submission_group``
+member functions.
+
+.. list-table:: ``dynamic_load_policy`` queries
+   :widths: 50 50
+   :header-rows: 1
+
+   * - Signature
+     - Description
+   * - ``std::vector<resource_type> get_resources();``
+     - Returns the set of resources the policy is selecting from.
+   * - ``auto get_submission_group();``
+     - Returns an object that can be used to wait for all active submissions.
+
+Reporting Requirements
+----------------------
+
+If a resource returned by ``select`` is used directly without calling
+``submit`` or ``submit_and_wait``, it may be necessary to call ``report``
+to provide feedback to the policy. The ``dynamic_load_policy`` tracks the
+number of outstanding submissions on each device via callbacks that report
+when a submission is started and when it is completed. The instrumentation
+to report these events is included in the implementations of
+``submit`` and ``submit_and_wait``. However, if you use ``select`` and then
+submit work directly to the selected resource, it is necessary to explicitly
+report these events.
+
+..
list-table:: ``dynamic_load_policy`` reporting requirements + :widths: 50 50 + :header-rows: 1 + + * - ``execution_info`` + - is reporting required? + * - ``task_submission`` + - Yes + * - ``task_completion`` + - Yes + * - ``task_time`` + - No + +In generic code, it is possible to perform compile-time checks to avoid +reporting overheads when reporting is not needed, while still writing +code that will work with any policy, as demonstrated below: + +.. code:: cpp + + auto s = select(my_policy); + if constexpr (report_info_v) + { + s.report(execution_info::task_submission); + } diff --git a/_sources/dynamic_selection_api/fixed_resource_policy.rst b/_sources/dynamic_selection_api/fixed_resource_policy.rst index eb2ceda028..664d9e0477 100644 --- a/_sources/dynamic_selection_api/fixed_resource_policy.rst +++ b/_sources/dynamic_selection_api/fixed_resource_policy.rst @@ -1,244 +1,244 @@ -Fixed-Resource Policy -##################### - -The dynamic selection API is an experimental feature in the |onedpl_long| -(|onedpl_short|) that selects an *execution resource* based on a chosen -*selection policy*. There are several policies provided as part -of the API. Policies encapsulate the logic and any associated state needed -to make a selection. - -The fixed-resource policy always returns the same resource selection. -``fixed_resource_policy`` is designed for two primary scenarios: - -#. debugging the use of dynamic selection -#. special casing a dynamic selection capable application for a specific resource when it is known to be best on that platform. - -.. 
code:: cpp - - namespace oneapi::dpl::experimental { - - template - class fixed_resource_policy { - public: - // useful types - using resource_type = typename Backend::resource_type; - using wait_type = typename Backend::wait_type; - - class selection_type { - public: - fixed_resource_policy get_policy() const; - resource_type unwrap() const; - }; - - // constructors - fixed_resource_policy(deferred_initialization_t); - fixed_resource_policy(std::size_t offset = 0); - fixed_resource_policy(const std::vector& u, - std::size_t offset = 0); - - // deferred initializers - void initialize(std::size_t offset = 0); - void initialize(const std::vector& u, - std::size_t offset = 0); - - // queries - auto get_resources() const; - auto get_submission_group(); - - // other implementation defined functions... - }; - - } - -This policy can be used with all the dynamic selection functions, such as ``select``, ``submit``, -and ``submit_and_wait``. It can also be used with ``policy_traits``. - - -Example -------- - -In the following example, a ``fixed_resource_policy`` is used when the code is -compiled so that it selects a specific device. When ``USE_CPU`` is defined at -compile-time, this example always uses the CPU queue. When ``USE_GPU`` is defined -at compile-time, it always uses the GPU queue. Otherwise, it uses an -``auto_tune_policy`` to dynamically select between these two queues. Such a scenario -could be used for debugging or simply to maintain the dynamic selection code even if -the best device to use is known for some subset of platforms. - -.. 
code:: cpp - - #include - #include - #include - - namespace ex = oneapi::dpl::experimental; - - int main() { - std::vector r { sycl::queue{sycl::cpu_selector_v}, - sycl::queue{sycl::gpu_selector_v} }; - - const std::size_t N = 10000; - std::vector av(N, 0.0); - std::vector bv(N, 0.0); - std::vector cv(N, 0.0); - for (int i = 0; i < N; ++i) { - av[i] = bv[i] = i; - } - - #if USE_CPU - ex::fixed_resource_policy p{r}; // (1) uses index 0 of r, the cpu - #elif USE_GPU - ex::fixed_resource_policy p{r, 1}; // (2) uses index 1 of r, the gpu - #else - ex::auto_tune_policy p{r}; - #endif - - { - sycl::buffer a_b(av); - sycl::buffer b_b(bv); - sycl::buffer c_b(cv); - - - for (int i = 0; i < 6; ++i) { - ex::submit_and_wait(p, [&](sycl::queue q) { // (3) - // (4) - std::cout << (q.get_device().is_cpu() ? "using cpu\n" : "using gpu\n"); - return q.submit([&](sycl::handler &h) { // (5) - sycl::accessor a_a(a_b, h, sycl::read_only); - sycl::accessor b_a(b_b, h, sycl::read_only); - sycl::accessor c_a(c_b, h, sycl::read_write); - h.parallel_for(N, [=](auto i) { c_a[i] = a_a[i] + b_a[i]; }); - }); - }); - }; - } - - for (int i = 0; i < N; ++i) { - if (cv[i] != 2*i) { - std::cout << "ERROR!\n"; - } - } - std::cout << "Done.\n"; - } - -The key points in this example are: - -#. If ``USE_CPU`` is defined, a ``fixed_resouce_policy`` is constructed that targets the CPU. -#. If ``USE_GPU`` is defined, a ``fixed_resouce_policy`` is constructed that targets the GPU. -#. ``submit_and_wait`` is invoked with the policy as the first argument. The selected queue will be passed to the user-provided function. -#. For clarity when run, the type of device is displayed. -#. The queue is used in a function to perform an asynchronous offload. The SYCL event returned from the call to ``submit`` is returned. Returning an event is required for functions passed to ``submit`` and ``submit_and_wait``. 
- -Selection Algorithm -------------------- - -The selection algorithm for ``fixed_resource_policy`` always returns -the same specific resource from its set of resources. The index of the -resource is set during construction or deferred initialization. - -Simplified, expository implementation of the selection algorithm: - -.. code:: - - template - selection_type fixed_resource_policy::select(Args&& ...) { - if (initialized_) { - return selection_type{*this, resources_[fixed_offset_]}; - } else { - throw std::logic_error(“select called before initialization”); - } - } - -where ``resources_`` is a container of resources, such as -``std::vector`` of ``sycl::queue``, and ``fixed_offset_`` stores a -fixed integer offset. Both ``resources_`` and ``fixed_offset`` -are set during construction or deferred initialization of the policy -and then remain constant. - -Constructors ------------- - -``fixed_resource_policy`` provides three constructors. - -.. list-table:: ``fixed_resource_policy`` constructors - :widths: 50 50 - :header-rows: 1 - - * - Signature - - Description - * - ``fixed_resource_policy(deferred_initialization_t);`` - - Defers initialization. An ``initialize`` function must be called prior to use. - * - ``fixed_resource_policy(std::size_t offset = 0);`` - - Sets the index for the resource to be selected. Uses the default set of resources. - * - ``fixed_resource_policy(const std::vector& u, std::size_t offset = 0);`` - - Overrides the default set of resources and optionally sets the index for the resource to be selected. - -Deferred Initialization ------------------------ - -A ``fixed_resource_policy`` that was constructed with deferred initialization must be -initialized by calling one its ``initialize`` member functions before it can be used -to select or submit. - -.. 
list-table:: ``fixed_resource_policy`` constructors - :widths: 50 50 - :header-rows: 1 - - * - Signature - - Description - * - ``initialize(std::size_t offset = 0);`` - - Sets the index for the resource to be selected. Uses the default set of resources. - * - ``initialize(const std::vector& u, std::size_t offset = 0);`` - - Overrides the default set of resources and optionally sets the index for the resource to be selected. - -Queries -------- - -A ``fixed_resource_policy`` has ``get_resources`` and ``get_submission_group`` -member functions. - -.. list-table:: ``fixed_resource_policy`` constructors - :widths: 50 50 - :header-rows: 1 - - * - Signature - - Description - * - ``std::vector get_resources();`` - - Returns the set of resources the policy is selecting from. - * - ``auto get_submission_group();`` - - Returns an object that can be used to wait for all active submissions. - -Reporting Requirements ----------------------- - -If a resource returned by ``select`` is used directly without calling -``submit`` or ``submit_and_wait``, it may be necessary to call ``report`` -to provide feedback to the policy. However, the ``fixed_resource_policy`` -does not require any feedback about the system state or the behavior of -the workload. Therefore, no explicit reporting of execution information -is needed, as is summarized in the table below. - -.. list-table:: ``fixed_resource_policy`` reporting requirements - :widths: 50 50 - :header-rows: 1 - - * - ``execution_info`` - - is reporting required? - * - ``task_submission`` - - No - * - ``task_completion`` - - No - * - ``task_time`` - - No - -In generic code, it is possible to perform compile-time checks to avoid -reporting overheads when reporting is not needed, while still writing -code that will work with any policy, as demonstrated below: - -.. 
code:: cpp
-
-   auto s = select(my_policy);
-   if constexpr (report_info_v)
-   {
-     s.report(execution_info::task_submission);
-   }
+Fixed-Resource Policy
+#####################
+
+The dynamic selection API is an experimental feature in the |onedpl_long|
+(|onedpl_short|) that selects an *execution resource* based on a chosen
+*selection policy*. There are several policies provided as part
+of the API. Policies encapsulate the logic and any associated state needed
+to make a selection.
+
+The fixed-resource policy always returns the same resource selection.
+``fixed_resource_policy`` is designed for two primary scenarios:
+
+#. debugging the use of dynamic selection
+#. special casing a dynamic selection capable application for a specific resource when it is known to be best on that platform.
+
+.. code:: cpp
+
+   namespace oneapi::dpl::experimental {
+
+     template <typename Backend>
+     class fixed_resource_policy {
+     public:
+       // useful types
+       using resource_type = typename Backend::resource_type;
+       using wait_type = typename Backend::wait_type;
+
+       class selection_type {
+       public:
+         fixed_resource_policy get_policy() const;
+         resource_type unwrap() const;
+       };
+
+       // constructors
+       fixed_resource_policy(deferred_initialization_t);
+       fixed_resource_policy(std::size_t offset = 0);
+       fixed_resource_policy(const std::vector<resource_type>& u,
+                             std::size_t offset = 0);
+
+       // deferred initializers
+       void initialize(std::size_t offset = 0);
+       void initialize(const std::vector<resource_type>& u,
+                       std::size_t offset = 0);
+
+       // queries
+       auto get_resources() const;
+       auto get_submission_group();
+
+       // other implementation defined functions...
+     };
+
+   }
+
+This policy can be used with all the dynamic selection functions, such as ``select``, ``submit``,
+and ``submit_and_wait``. It can also be used with ``policy_traits``.
+
+
+Example
+-------
+
+In the following example, a ``fixed_resource_policy`` is used when the code is
+compiled so that it selects a specific device.
When ``USE_CPU`` is defined at
+compile-time, this example always uses the CPU queue. When ``USE_GPU`` is defined
+at compile-time, it always uses the GPU queue. Otherwise, it uses an
+``auto_tune_policy`` to dynamically select between these two queues. Such a scenario
+could be used for debugging or simply to maintain the dynamic selection code even if
+the best device to use is known for some subset of platforms.
+
+.. code:: cpp
+
+   #include <oneapi/dpl/dynamic_selection>
+   #include <sycl/sycl.hpp>
+   #include <iostream>
+
+   namespace ex = oneapi::dpl::experimental;
+
+   int main() {
+     std::vector<sycl::queue> r { sycl::queue{sycl::cpu_selector_v},
+                                  sycl::queue{sycl::gpu_selector_v} };
+
+     const std::size_t N = 10000;
+     std::vector<float> av(N, 0.0);
+     std::vector<float> bv(N, 0.0);
+     std::vector<float> cv(N, 0.0);
+     for (int i = 0; i < N; ++i) {
+       av[i] = bv[i] = i;
+     }
+
+   #if USE_CPU
+     ex::fixed_resource_policy p{r};    // (1) uses index 0 of r, the cpu
+   #elif USE_GPU
+     ex::fixed_resource_policy p{r, 1}; // (2) uses index 1 of r, the gpu
+   #else
+     ex::auto_tune_policy p{r};
+   #endif
+
+     {
+       sycl::buffer a_b(av);
+       sycl::buffer b_b(bv);
+       sycl::buffer c_b(cv);
+
+       for (int i = 0; i < 6; ++i) {
+         ex::submit_and_wait(p, [&](sycl::queue q) { // (3)
+           // (4)
+           std::cout << (q.get_device().is_cpu() ? "using cpu\n" : "using gpu\n");
+           return q.submit([&](sycl::handler &h) {   // (5)
+             sycl::accessor a_a(a_b, h, sycl::read_only);
+             sycl::accessor b_a(b_b, h, sycl::read_only);
+             sycl::accessor c_a(c_b, h, sycl::read_write);
+             h.parallel_for(N, [=](auto i) { c_a[i] = a_a[i] + b_a[i]; });
+           });
+         });
+       };
+     }
+
+     for (int i = 0; i < N; ++i) {
+       if (cv[i] != 2*i) {
+         std::cout << "ERROR!\n";
+       }
+     }
+     std::cout << "Done.\n";
+   }
+
+The key points in this example are:
+
+#. If ``USE_CPU`` is defined, a ``fixed_resource_policy`` is constructed that targets the CPU.
+#. If ``USE_GPU`` is defined, a ``fixed_resource_policy`` is constructed that targets the GPU.
+#. ``submit_and_wait`` is invoked with the policy as the first argument.
The selected queue will be passed to the user-provided function.
+#. For clarity when run, the type of device is displayed.
+#. The queue is used in a function to perform an asynchronous offload. The SYCL event returned from the call to ``submit`` is returned. Returning an event is required for functions passed to ``submit`` and ``submit_and_wait``.
+
+Selection Algorithm
+-------------------
+
+The selection algorithm for ``fixed_resource_policy`` always returns
+the same specific resource from its set of resources. The index of the
+resource is set during construction or deferred initialization.
+
+Simplified, expository implementation of the selection algorithm:
+
+.. code:: cpp
+
+   template <typename... Args>
+   selection_type fixed_resource_policy::select(Args&&...) {
+     if (initialized_) {
+       return selection_type{*this, resources_[fixed_offset_]};
+     } else {
+       throw std::logic_error("select called before initialization");
+     }
+   }
+
+where ``resources_`` is a container of resources, such as
+``std::vector`` of ``sycl::queue``, and ``fixed_offset_`` stores a
+fixed integer offset. Both ``resources_`` and ``fixed_offset_``
+are set during construction or deferred initialization of the policy
+and then remain constant.
+
+Constructors
+------------
+
+``fixed_resource_policy`` provides three constructors.
+
+.. list-table:: ``fixed_resource_policy`` constructors
+   :widths: 50 50
+   :header-rows: 1
+
+   * - Signature
+     - Description
+   * - ``fixed_resource_policy(deferred_initialization_t);``
+     - Defers initialization. An ``initialize`` function must be called prior to use.
+   * - ``fixed_resource_policy(std::size_t offset = 0);``
+     - Sets the index for the resource to be selected. Uses the default set of resources.
+   * - ``fixed_resource_policy(const std::vector<resource_type>& u, std::size_t offset = 0);``
+     - Overrides the default set of resources and optionally sets the index for the resource to be selected.
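+The fixed-offset selection logic described above can be modeled in a few lines of
+standard C++. The sketch below is illustrative only: ``ToyFixedResourcePolicy`` and
+its string resources are invented stand-ins for this documentation, not oneDPL types;
+a real policy selects among ``sycl::queue`` objects through a backend.

```cpp
#include <cstddef>
#include <stdexcept>
#include <string>
#include <utility>
#include <vector>

// Illustrative stand-in for a resource; a real policy would hold sycl::queue objects.
using Resource = std::string;

// ToyFixedResourcePolicy is an invented name used only to model the behavior
// described in this section; it is not part of oneDPL.
class ToyFixedResourcePolicy {
  std::vector<Resource> resources_;
  std::size_t fixed_offset_ = 0;
  bool initialized_ = false;

public:
  ToyFixedResourcePolicy() = default; // models deferred initialization

  ToyFixedResourcePolicy(std::vector<Resource> u, std::size_t offset = 0)
      : resources_(std::move(u)), fixed_offset_(offset), initialized_(true) {}

  void initialize(std::vector<Resource> u, std::size_t offset = 0) {
    resources_ = std::move(u);
    fixed_offset_ = offset;
    initialized_ = true;
  }

  // Every call returns the same resource, chosen by the stored offset.
  const Resource& select() const {
    if (!initialized_)
      throw std::logic_error("select called before initialization");
    return resources_.at(fixed_offset_);
  }
};
```

+Note how the offset is fixed at construction (or deferred initialization) and never
+changes afterwards, which is why no runtime feedback is needed by this policy.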
+
+Deferred Initialization
+-----------------------
+
+A ``fixed_resource_policy`` that was constructed with deferred initialization must be
+initialized by calling one of its ``initialize`` member functions before it can be used
+to select or submit.
+
+.. list-table:: ``fixed_resource_policy`` deferred initializers
+   :widths: 50 50
+   :header-rows: 1
+
+   * - Signature
+     - Description
+   * - ``initialize(std::size_t offset = 0);``
+     - Sets the index for the resource to be selected. Uses the default set of resources.
+   * - ``initialize(const std::vector<resource_type>& u, std::size_t offset = 0);``
+     - Overrides the default set of resources and optionally sets the index for the resource to be selected.
+
+Queries
+-------
+
+A ``fixed_resource_policy`` has ``get_resources`` and ``get_submission_group``
+member functions.
+
+.. list-table:: ``fixed_resource_policy`` queries
+   :widths: 50 50
+   :header-rows: 1
+
+   * - Signature
+     - Description
+   * - ``std::vector<resource_type> get_resources();``
+     - Returns the set of resources the policy is selecting from.
+   * - ``auto get_submission_group();``
+     - Returns an object that can be used to wait for all active submissions.
+
+Reporting Requirements
+----------------------
+
+If a resource returned by ``select`` is used directly without calling
+``submit`` or ``submit_and_wait``, it may be necessary to call ``report``
+to provide feedback to the policy. However, the ``fixed_resource_policy``
+does not require any feedback about the system state or the behavior of
+the workload. Therefore, no explicit reporting of execution information
+is needed, as summarized in the table below.
+
+.. list-table:: ``fixed_resource_policy`` reporting requirements
+   :widths: 50 50
+   :header-rows: 1
+
+   * - ``execution_info``
+     - is reporting required?
+ * - ``task_submission`` + - No + * - ``task_completion`` + - No + * - ``task_time`` + - No + +In generic code, it is possible to perform compile-time checks to avoid +reporting overheads when reporting is not needed, while still writing +code that will work with any policy, as demonstrated below: + +.. code:: cpp + + auto s = select(my_policy); + if constexpr (report_info_v) + { + s.report(execution_info::task_submission); + } diff --git a/_sources/dynamic_selection_api/functions.rst b/_sources/dynamic_selection_api/functions.rst index 6dd574b502..63083b8f54 100644 --- a/_sources/dynamic_selection_api/functions.rst +++ b/_sources/dynamic_selection_api/functions.rst @@ -42,9 +42,7 @@ An example that calls ``select`` using a ``round_robin_policy``: } } -The output of this example: - -.. code:: +The output of this example is:: selected queue is cpu selected queue is gpu @@ -134,9 +132,7 @@ submitted to the selected queue. } } -The output from this example: - -.. code:: +The output from this example is:: (j == 0): submit to cpu (i == 0): async work on main thread @@ -204,9 +200,7 @@ command groups can be submitted to the selected queue. } } -The output from this example: - -.. code:: +The output from this example is:: (j == 0): submit to cpu (i == 0): async work on main thread @@ -269,9 +263,7 @@ the object returned by ``get_submission_group()`` to ``wait``: std::cout << "done waiting for all submissions\n"; } -The output from this example: - -.. code:: +The output from this example is:: (j == 0): submit to cpu (i == 0): async work on main thread @@ -345,9 +337,7 @@ submitted to the selected queue. } } -The output from this example: - -.. code:: +The output from this example is:: (j == 0): submit to cpu (i == 0): submission done @@ -410,9 +400,7 @@ submitted to the selected queue. } -The output from this example: - -.. code:: +The output from this example is:: (j == 0): submit to cpu (i == 0): submission done @@ -462,9 +450,7 @@ selects from. 
The following example demonstrates the use of the function std::cout << "queue is " << ((q.get_device().is_gpu()) ? "gpu\n" : "not-gpu\n"); } -The output from this example on a test machine is shown below. - -.. code:: +The output from this example on a test machine is:: Resources in explicitly set policy queue is cpu diff --git a/_sources/dynamic_selection_api/policies.rst b/_sources/dynamic_selection_api/policies.rst index f74a2f0dca..afb156b7a8 100644 --- a/_sources/dynamic_selection_api/policies.rst +++ b/_sources/dynamic_selection_api/policies.rst @@ -100,9 +100,7 @@ An example, demonstrating this difference, is shown below: print_type("p2 selection 4: ", p2s4); } -The output of this example: - -.. code:: +The output of this example is:: p1 selection 1: cpu p2 selection 1: cpu @@ -125,7 +123,6 @@ More detailed information about the API is provided in the following sections: .. toctree:: :maxdepth: 2 :titlesonly: - :glob: fixed_resource_policy round_robin_policy diff --git a/_sources/dynamic_selection_api/round_robin_policy.rst b/_sources/dynamic_selection_api/round_robin_policy.rst index 0d766dc566..ead7101d94 100644 --- a/_sources/dynamic_selection_api/round_robin_policy.rst +++ b/_sources/dynamic_selection_api/round_robin_policy.rst @@ -1,222 +1,222 @@ -Round-Robin Policy -################## - -The dynamic selection API is an experimental feature in the |onedpl_long| -(|onedpl_short|) that selects an *execution resource* based on a chosen -*selection policy*. There are several policies provided as part -of the API. Policies encapsulate the logic and any associated state needed -to make a selection. - -The round-robin policy cycles through the set of resources at each selection. ``round_robin_policy`` -is useful for offloading kernels of similar cost to devices of similar -capabilities. In those cases, a round-robin assignment of kernels to devices -will achieve a good load balancing. - -.. 
code:: cpp - - namespace oneapi::dpl::experimental { - - template - class round_robin_policy { - public: - // useful types - using resource_type = typename Backend::resource_type; - using wait_type = typename Backend::wait_type; - - class selection_type { - public: - round_robin_policy get_policy() const; - resource_type unwrap() const; - }; - - // constructors - round_robin_policy(deferred_initialization_t); - round_robin_policy(); - round_robin_policy(const std::vector& u); - - // deferred initializer - void initialize(); - void initialize(const std::vector& u); - - // queries - auto get_resources() const; - auto get_submission_group(); - - // other implementation defined functions... - }; - - } - -This policy can be used with all the dynamic selection functions, such as ``select``, ``submit``, -and ``submit_and_wait``. It can also be used with ``policy_traits``. - -Example -------- - -The following example demonstrates a simple approach to send work to each -queue in a set of queues, and then wait for all devices to complete the work -before repeating the process. A ``round_robin_policy`` is used rotate through -the available devices. - -.. code:: cpp - - #include - #include - #include - - const std::size_t N = 10000; - namespace ex = oneapi::dpl::experimental; - - void f(sycl::handler& h, float* v); - - - int round_robin_example(std::vector& similar_devices, - std::vector& usm_data) { - - ex::round_robin_policy p{similar_devices}; // (1) - - auto num_devices = p.get_resources().size(); - auto num_arrays = usm_data.size(); - - // (2) - auto submission_group_size = (num_arrays < num_devices) ? 
num_arrays : num_devices; - - std::cout << "Running with " << num_devices << " queues\n" - << " " << num_arrays << " usm arrays\n" - << "Will perform " << submission_group_size << " concurrent offloads\n"; - - for (int i = 0; i < 100; i += submission_group_size) { // (3) - for (int j = 0; j < submission_group_size; ++j) { // (4) - ex::submit(p, [&](sycl::queue q) { // (5) - float* data = usm_data[j]; - return q.submit([=](sycl::handler &h) { // (6) - f(h, data); - }); - }); - } - ex::wait(p.get_submission_group()); // (7) - } - return 0; - } - -The key points in this example are: - -#. A ``round_robin_policy`` is constructed that rotates between the CPU and GPU queues. -#. The total number of concurrent offloads, ``submission_group_size``, will be limited to the number of USM arrays or the number of queues, whichever is smaller. -#. The outer ``i``-loop iterates from 0 to 99, stepping by the ``submission_group_size``. This number of submissions will be offload concurrently. -#. The inner ``j``-loop iterates over ``submission_group_size`` submissions. -#. ``submit`` is used to select a queue and pass it to the user's function, but does not block until the event returned by that function completes. This provides the opportunity for concurrency across the submissions. -#. The queue is used in a function to perform an asynchronous offload. The SYCL event returned from the call to ``submit`` is returned. Returning an event is required for functions passed to ``submit`` and ``submit_and_wait``. -#. ``wait`` is called to block for all the concurrent ``submission_group_size`` submissions to complete. - -Selection Algorithm -------------------- - -The selection algorithm for ``round_robin_policy`` rotates through -the elements of the set of available resources. A simplified, expository -implementation of the selection algorithm follows: - -.. code:: - - template - selection_type round_robin_policy::select(Args&&...) 
{ - if (initialized_) { - auto& r = resources_[next_context_++ % num_resources_]; - return selection_type{*this, r}; - } else { - throw std::logic_error(“selected called before initialization”); - } - } - -where ``resources_`` is a container of resources, such as -``std::vector`` of ``sycl::queue``, ``next_context_`` is -a counter that increments at each selection, and ``num_resources_`` -is the size of the ``resources_`` vector. - -Constructors ------------- - -``round_robin_policy`` provides three constructors. - -.. list-table:: ``round_robin_policy`` constructors - :widths: 50 50 - :header-rows: 1 - - * - Signature - - Description - * - ``round_round_policy(deferred_initialization_t);`` - - Defers initialization. An ``initialize`` function must be called prior to use. - * - ``round_robin_policy();`` - - Initialized to use the default set of resources. - * - ``round_robin_policy(const std::vector& u);`` - - Overrides the default set of resources. - -Deferred Initialization ------------------------ - -A ``round_robin_policy`` that was constructed with deferred initialization must be -initialized by calling one its ``initialize`` member functions before it can be used -to select or submit. - -.. list-table:: ``round_robin_policy`` constructors - :widths: 50 50 - :header-rows: 1 - - * - Signature - - Description - * - ``initialize();`` - - Initialize to use the default set of resources. - * - ``initialize(const std::vector& u);`` - - Overrides the default set of resources. - -Queries -------- - -A ``round_robin_policy`` has ``get_resources`` and ``get_submission_group`` -member functions. - -.. list-table:: ``round_robin_policy`` constructors - :widths: 50 50 - :header-rows: 1 - - * - Signature - - Description - * - ``std::vector get_resources();`` - - Returns the set of resources the policy is selecting from. - * - ``auto get_submission_group();`` - - Returns an object that can be used to wait for all active submissions. 
- -Reporting Requirements ----------------------- - -If a resource returned by ``select`` is used directly without calling -``submit`` or ``submit_and_wait``, it may be necessary to call ``report`` -to provide feedback to the policy. However, the ``round_robin_policy`` -does not require any feedback about the system state or the behavior of -the workload. Therefore, no explicit reporting of execution information -is needed, as is summarized in the table below. - -.. list-table:: ``round_robin_policy`` reporting requirements - :widths: 50 50 - :header-rows: 1 - - * - ``execution_info`` - - is reporting required? - * - ``task_submission`` - - No - * - ``task_completion`` - - No - * - ``task_time`` - - No - -In generic code, it is possible to perform compile-time checks to avoid -reporting overheads when reporting is not needed, while still writing -code that will work with any policy, as demonstrated below: - -.. code:: cpp - - auto s = select(my_policy); - if constexpr (report_info_v) - { - s.report(execution_info::task_submission); - } +Round-Robin Policy +################## + +The dynamic selection API is an experimental feature in the |onedpl_long| +(|onedpl_short|) that selects an *execution resource* based on a chosen +*selection policy*. There are several policies provided as part +of the API. Policies encapsulate the logic and any associated state needed +to make a selection. + +The round-robin policy cycles through the set of resources at each selection. ``round_robin_policy`` +is useful for offloading kernels of similar cost to devices of similar +capabilities. In those cases, a round-robin assignment of kernels to devices +will achieve a good load balancing. + +.. 
code:: cpp
+
+  namespace oneapi::dpl::experimental {
+
+    template <typename Backend>
+    class round_robin_policy {
+    public:
+      // useful types
+      using resource_type = typename Backend::resource_type;
+      using wait_type = typename Backend::wait_type;
+
+      class selection_type {
+      public:
+        round_robin_policy get_policy() const;
+        resource_type unwrap() const;
+      };
+
+      // constructors
+      round_robin_policy(deferred_initialization_t);
+      round_robin_policy();
+      round_robin_policy(const std::vector<resource_type>& u);
+
+      // deferred initializer
+      void initialize();
+      void initialize(const std::vector<resource_type>& u);
+
+      // queries
+      auto get_resources() const;
+      auto get_submission_group();
+
+      // other implementation defined functions...
+    };
+
+  }
+
+This policy can be used with all the dynamic selection functions, such as ``select``, ``submit``,
+and ``submit_and_wait``. It can also be used with ``policy_traits``.
+
+Example
+-------
+
+The following example demonstrates a simple approach to send work to each
+queue in a set of queues, and then wait for all devices to complete the work
+before repeating the process. A ``round_robin_policy`` is used to rotate through
+the available devices.
+
+.. code:: cpp
+
+  #include <oneapi/dpl/dynamic_selection>
+  #include <sycl/sycl.hpp>
+  #include <iostream>
+
+  const std::size_t N = 10000;
+  namespace ex = oneapi::dpl::experimental;
+
+  void f(sycl::handler& h, float* v);
+
+
+  int round_robin_example(std::vector<sycl::queue>& similar_devices,
+                          std::vector<float*>& usm_data) {
+
+    ex::round_robin_policy p{similar_devices}; // (1)
+
+    auto num_devices = p.get_resources().size();
+    auto num_arrays = usm_data.size();
+
+    // (2)
+    auto submission_group_size = (num_arrays < num_devices) ? 
num_arrays : num_devices;
+
+    std::cout << "Running with " << num_devices << " queues\n"
+              << "             " << num_arrays << " usm arrays\n"
+              << "Will perform " << submission_group_size << " concurrent offloads\n";
+
+    for (int i = 0; i < 100; i += submission_group_size) { // (3)
+      for (int j = 0; j < submission_group_size; ++j) { // (4)
+        ex::submit(p, [&](sycl::queue q) { // (5)
+          float* data = usm_data[j];
+          return q.submit([=](sycl::handler &h) { // (6)
+            f(h, data);
+          });
+        });
+      }
+      ex::wait(p.get_submission_group()); // (7)
+    }
+    return 0;
+  }
+
+The key points in this example are:
+
+#. A ``round_robin_policy`` is constructed that rotates through the queues in ``similar_devices``.
+#. The total number of concurrent offloads, ``submission_group_size``, will be limited to the number of USM arrays or the number of queues, whichever is smaller.
+#. The outer ``i``-loop iterates from 0 to 99, stepping by the ``submission_group_size``. This number of submissions will be offloaded concurrently.
+#. The inner ``j``-loop iterates over ``submission_group_size`` submissions.
+#. ``submit`` is used to select a queue and pass it to the user's function, but does not block until the event returned by that function completes. This provides the opportunity for concurrency across the submissions.
+#. The queue is used in a function to perform an asynchronous offload. The SYCL event returned from the call to ``submit`` is returned. Returning an event is required for functions passed to ``submit`` and ``submit_and_wait``.
+#. ``wait`` is called to block for all the concurrent ``submission_group_size`` submissions to complete.
+
+Selection Algorithm
+-------------------
+
+The selection algorithm for ``round_robin_policy`` rotates through
+the elements of the set of available resources. A simplified, expository
+implementation of the selection algorithm follows:
+
+.. code:: cpp
+
+  template <typename... Args>
+  selection_type round_robin_policy<Backend>::select(Args&&...) 
{
+    if (initialized_) {
+      auto& r = resources_[next_context_++ % num_resources_];
+      return selection_type{*this, r};
+    } else {
+      throw std::logic_error("select called before initialization");
+    }
+  }
+
+where ``resources_`` is a container of resources, such as a
+``std::vector`` of ``sycl::queue``, ``next_context_`` is
+a counter that increments at each selection, and ``num_resources_``
+is the size of the ``resources_`` vector.
+
+Constructors
+------------
+
+``round_robin_policy`` provides three constructors.
+
+.. list-table:: ``round_robin_policy`` constructors
+   :widths: 50 50
+   :header-rows: 1
+
+   * - Signature
+     - Description
+   * - ``round_robin_policy(deferred_initialization_t);``
+     - Defers initialization. An ``initialize`` function must be called prior to use.
+   * - ``round_robin_policy();``
+     - Initializes to use the default set of resources.
+   * - ``round_robin_policy(const std::vector<resource_type>& u);``
+     - Overrides the default set of resources.
+
+Deferred Initialization
+-----------------------
+
+A ``round_robin_policy`` that was constructed with deferred initialization must be
+initialized by calling one of its ``initialize`` member functions before it can be used
+to select or submit.
+
+.. list-table:: ``round_robin_policy`` deferred initializers
+   :widths: 50 50
+   :header-rows: 1
+
+   * - Signature
+     - Description
+   * - ``initialize();``
+     - Initializes to use the default set of resources.
+   * - ``initialize(const std::vector<resource_type>& u);``
+     - Overrides the default set of resources.
+
+Queries
+-------
+
+A ``round_robin_policy`` has ``get_resources`` and ``get_submission_group``
+member functions.
+
+.. list-table:: ``round_robin_policy`` queries
+   :widths: 50 50
+   :header-rows: 1
+
+   * - Signature
+     - Description
+   * - ``std::vector<resource_type> get_resources();``
+     - Returns the set of resources the policy is selecting from.
+   * - ``auto get_submission_group();``
+     - Returns an object that can be used to wait for all active submissions. 
+ +Reporting Requirements +---------------------- + +If a resource returned by ``select`` is used directly without calling +``submit`` or ``submit_and_wait``, it may be necessary to call ``report`` +to provide feedback to the policy. However, the ``round_robin_policy`` +does not require any feedback about the system state or the behavior of +the workload. Therefore, no explicit reporting of execution information +is needed, as is summarized in the table below. + +.. list-table:: ``round_robin_policy`` reporting requirements + :widths: 50 50 + :header-rows: 1 + + * - ``execution_info`` + - is reporting required? + * - ``task_submission`` + - No + * - ``task_completion`` + - No + * - ``task_time`` + - No + +In generic code, it is possible to perform compile-time checks to avoid +reporting overheads when reporting is not needed, while still writing +code that will work with any policy, as demonstrated below: + +.. code:: cpp + + auto s = select(my_policy); + if constexpr (report_info_v) + { + s.report(execution_info::task_submission); + } diff --git a/_sources/dynamic_selection_api_main.rst b/_sources/dynamic_selection_api_main.rst index 2b3f18d97a..62c62f49e1 100644 --- a/_sources/dynamic_selection_api_main.rst +++ b/_sources/dynamic_selection_api_main.rst @@ -68,9 +68,7 @@ In the preceding example, the key points in the code include: #. The submit function returns an object that can be waited on. Calling ``wait`` on the ``done`` object blocks the main thread until the work submitted to the queue by your function is complete. #. The whole group of submissions made during the loop can be waited on. In this example, the call is redundant, since each submission was already waited for inside of the loop body. -The output from this example is: - -.. code:: +The output from this example is:: submit task to cpu submit task to gpu @@ -86,7 +84,6 @@ More detailed information about the API is provided in the following sections: .. 
toctree:: :maxdepth: 2 :titlesonly: - :glob: dynamic_selection_api/functions dynamic_selection_api/policies diff --git a/_sources/index.rst b/_sources/index.rst index eb0588e092..f460357ad1 100644 --- a/_sources/index.rst +++ b/_sources/index.rst @@ -10,6 +10,7 @@ For general information, refer to the `oneDPL GitHub* repository .. toctree:: :maxdepth: 2 + :titlesonly: :caption: Get Started introduction/release_notes.rst @@ -17,17 +18,27 @@ For general information, refer to the `oneDPL GitHub* repository .. toctree:: :maxdepth: 2 - :caption: Library Guide + :titlesonly: + :includehidden: + :caption: Core Functionality introduction parallel_api_main api_for_sycl_kernels_main - dynamic_selection_api_main - kernel_templates_main macros cmake_support oneDPL_2022.0_changes +.. toctree:: + :maxdepth: 1 + :titlesonly: + :includehidden: + :caption: Technology Preview + + parallel_api/async_api + dynamic_selection_api_main + kernel_templates_main + .. toctree:: :hidden: :caption: Notices and Disclaimers diff --git a/_sources/introduction.rst b/_sources/introduction.rst index 531a0f4637..77e592d33d 100644 --- a/_sources/introduction.rst +++ b/_sources/introduction.rst @@ -1,15 +1,11 @@ |onedpl_long| Introduction ####################################### -Parallel API can be used with the `C++ Standard Execution -Policies `_ -to enable parallelism on the host. - The |onedpl_long| (|onedpl_short|) is implemented in accordance with the `oneDPL -Specification `_. +Specification `_. -To support heterogeneity, |onedpl_short| works with the DPC++ API. More information can be found in the -`oneAPI Specification `_. +To support heterogeneity, |onedpl_short| uses `SYCL `_. +More information about SYCL can be found in the `SYCL Specification`_. 
Before You Begin ================ @@ -24,18 +20,11 @@ page for: * Fixed Issues * Deprecation Notice * Known Issues and Limitations -* Previous Release Notes +* Previous Release Notes -Install the `Intel® oneAPI Base Toolkit (Base Kit) `_ +Install the `Intel® oneAPI Base Toolkit (Base Kit) `_ to use |onedpl_short|. -All |onedpl_short| header files are in the ``oneapi/dpl`` directory. To use the |onedpl_short| API, -include the corresponding header in your source code with the ``#include `` directive. -|onedpl_short| introduces the namespace ``oneapi::dpl`` for most its classes and functions. - -To use tested C++ standard APIs, you need to include the corresponding C++ standard header files -and use the ``std`` namespace. - System Requirements =================== @@ -46,19 +35,56 @@ C++17 is the minimal supported version of the C++ standard. That means, any use of |onedpl_short| may require a C++17 compiler. While some APIs of the library may accidentally work with earlier versions of the C++ standard, it is no more guaranteed. -To call Parallel API with the C++ standard policies, you need to install the following software: +To call Parallel API with the C++ standard aligned policies, you need to install the following software: * A C++ compiler with support for OpenMP* 4.0 (or higher) SIMD constructs -* Depending on what parallel backend you want to use install either: +* Depending on what parallel backend you want to use, install either: - * |onetbb_long| or |tbb_long| 2019 and later - * A C++ compiler with support for OpenMP 4.5 (or higher) + * |onetbb_long| or |tbb_long| 2019 and later, + * A C++ compiler with support for OpenMP 4.5 (or higher). -For more information about parallel backends, see :doc:`Execution Policies ` +For more information about parallel backends, see :doc:`Execution Policies `. 
To use Parallel API with the device execution policies, you need to install the following software: -* A C++ compiler with support for SYCL 2020 +* A C++ compiler with support for SYCL 2020. + +Develop and Build Your Code with |onedpl_short| +=============================================== + +All |onedpl_short| header files are in the ``oneapi/dpl`` directory. To use the |onedpl_short| API, +include the corresponding header in your source code with the ``#include `` directive. +For better coexistence with the C++ standard library, include |onedpl_short| header files before the standard C++ ones. + +|onedpl_short| introduces the ``namespace oneapi::dpl`` for its classes and functions. For brevity, +``namespace dpl`` is defined as an alias to ``oneapi::dpl`` and can be used interchangeably. + +To use :doc:`tested C++ standard APIs ` in SYCL device code, +include the corresponding C++ standard header files and use the ``std`` namespace. + +Follow the steps below to build your code with |onedpl_short|: + +#. To build with the |dpcpp_cpp|, see the |dpcpp_gsg|_ for details. +#. Set the environment variables for |onedpl_short| and |onetbb_short|. + +Here is an example of a command line used to compile code that contains |onedpl_short| parallel algorithms +on Linux* (depending on the code, parameters within [] could be unnecessary):: + + icpx [-fsycl] [-fiopenmp] program.cpp [-ltbb] -o program + +You may also use the |pstl_offload_option|_ of |dpcpp_cpp| powered by |onedpl_short| +to build the standard C++ code for execution on a SYCL device:: + + icpx -fsycl -fsycl-pstl-offload=gpu program.cpp -o program + +This option redirects C++ parallel algorithms invoked with the ``std::execution::par_unseq`` policy +to |onedpl_short| algorithms. It does not change the behavior of the |onedpl_short| algorithms and +execution policies that are directly used in the code. + +Useful Information +================== + +.. 
_library-restrictions: Difference with Standard C++ Parallel Algorithms ************************************************ @@ -66,25 +92,24 @@ Difference with Standard C++ Parallel Algorithms * oneDPL execution policies only result in parallel execution if random access iterators are provided, the execution will remain serial for other iterator types. * Function objects passed in to algorithms executed with device policies must provide ``const``-qualified ``operator()``. - `The SYCL specification `_ states that writing to such an object during a SYCL - kernel is undefined behavior. -* For the following algorithms, par_unseq and unseq policies do not result in vectorized execution: + The `SYCL specification`_ states that writing to such an object during a SYCL kernel is undefined behavior. +* For the following algorithms, ``par_unseq`` and ``unseq`` policies do not result in SIMD execution: ``includes``, ``inplace_merge``, ``merge``, ``set_difference``, ``set_intersection``, ``set_symmetric_difference``, ``set_union``, ``stable_partition``, ``unique``. * The following algorithms require additional O(n) memory space for parallel execution: ``copy_if``, ``inplace_merge``, ``partial_sort``, ``partial_sort_copy``, ``partition_copy``, ``remove``, ``remove_if``, ``rotate``, ``sort``, ``stable_sort``, ``unique``, ``unique_copy``. - Restrictions ************ -When called with |dpcpp_short| execution policies, |onedpl_short| algorithms apply the same restrictions as -|dpcpp_short| does (see the |dpcpp_short| specification and the SYCL specification for details), such as: +When called with device execution policies, |onedpl_short| algorithms apply the same restrictions as +|dpcpp_short| does (see the |dpcpp_cpp| documentation and the SYCL specification for details), such as: * Adding buffers to a lambda capture list is not allowed for lambdas passed to an algorithm. 
* Passing data types, which are not trivially copyable, is only allowed via USM, but not via buffers or host-allocated containers. +* Objects of pointer-to-member types cannot be passed to an algorithm. * The definition of lambda functions used with parallel algorithms should not depend on preprocessor macros that makes it different for the host and the device. Otherwise, the behavior is undefined. * When used within SYCL kernels or transferred to/from a device, a container class can only hold objects @@ -94,12 +119,11 @@ When called with |dpcpp_short| execution policies, |onedpl_short| algorithms app Known Limitations ***************** -* When compiled with ``-fsycl-pstl-offload`` option of Intel oneAPI DPC++/C++ compiler and with - ``libstdc++`` version 8 or ``libc++``, ``oneapi::dpl::execution::par_unseq`` offloads - standard parallel algorithms to the SYCL device similarly to ``std::execution::par_unseq`` - in accordance with the ``-fsycl-pstl-offload`` option value. +* The ``oneapi::dpl::execution::par_unseq`` policy is affected by ``-fsycl-pstl-offload`` option of |dpcpp_cpp| + when |onedpl_short| substitutes this policy for the ``std::execution::par_unseq`` policy + missing in a standard C++ library, particularly in libstdc++ version 8 and in libc++. * For ``transform_exclusive_scan`` and ``exclusive_scan`` to run in-place (that is, with the same data - used for both input and destination) and with an execution policy of ``unseq`` or ``par_unseq``, + used for both input and destination) and with an execution policy of ``unseq`` or ``par_unseq``, it is required that the provided input and destination iterators are equality comparable. Furthermore, the equality comparison of the input and destination iterator must evaluate to true. If these conditions are not met, the result of these algorithm calls is undefined. 
@@ -107,34 +131,27 @@ Known Limitations convertible to the type of the initial value if one is provided, otherwise it is convertible to the type of values in the processed data sequence: ``std::iterator_traits::value_type``. * ``exclusive_scan`` and ``transform_exclusive_scan`` algorithms may provide wrong results with - vector execution policies when building a program with GCC 10 and using ``-O0`` option. -* Compiling ``reduce`` and ``transform_reduce`` algorithms with the Intel DPC++ Compiler, versions 2021 and older, - may result in a runtime error. To fix this issue, use an Intel DPC++ Compiler version 2022 or newer. + unsequenced execution policies when building a program with GCC 10 and using ``-O0`` option. +* Compiling ``reduce`` and ``transform_reduce`` algorithms with |dpcpp_cpp| versions 2021 and older + may result in a runtime error. To fix this issue, use |dpcpp_cpp| version 2022 or newer. * When compiling on Windows, add the option ``/EHsc`` to the compilation command to avoid errors with oneDPL's experimental ranges API that uses exceptions. -* The use of |onedpl_short| together with the GNU C++ standard library (libstdc++) version 9 or 10 may lead to - compilation errors (caused by oneTBB API changes). - Using libstdc++ version 9 requires TBB version 2020 for the header file. This may result in compilation errors when - using C++17 or C++20 and TBB is not found in the environment, even if its use in |onedpl_short| is switched off. - To overcome these issues, include |onedpl_short| header files before the standard C++ header files, - or disable parallel algorithms support in the standard library. - For more information, please see `Intel® oneAPI Threading Building Blocks (oneTBB) Release Notes`_. * The ``using namespace oneapi;`` directive in a |onedpl_short| program code may result in compilation errors with some compilers including GCC 7 and earlier. 
Instead of this directive, explicitly use - ``oneapi::dpl`` namespace, or create a namespace alias. + the ``oneapi::dpl`` namespace, the shorter ``dpl`` namespace alias, or create your own alias. * ``std::array::at`` member function cannot be used in kernels because it may throw an exception; use ``std::array::operator[]`` instead. * Due to specifics of Microsoft* Visual C++, some standard floating-point math functions (including ``std::ldexp``, ``std::frexp``, ``std::sqrt(std::complex)``) require device support - for double precision. + for double precision. * ``exclusive_scan``, ``inclusive_scan``, ``exclusive_scan_by_segment``, ``inclusive_scan_by_segment``, ``transform_exclusive_scan``, ``transform_inclusive_scan``, - when used with C++ standard policies, impose limitations on the initial value type if an - initial value is provided, and on the value type of the input iterator if an initial value is + when used with C++ standard aligned policies, impose limitations on the initial value type if an + initial value is provided, and on the value type of the input iterator if an initial value is not provided. Firstly, it must satisfy the ``DefaultConstructible`` requirements. Secondly, a default-constructed instance of that type should act as the identity element for the binary scan function. -* ``reduce_by_segment``, when used with C++ standard policies, imposes limitations on the value type. +* ``reduce_by_segment``, when used with C++ standard aligned policies, imposes limitations on the value type. Firstly, it must satisfy the ``DefaultConstructible`` requirements. Secondly, a default-constructed instance of that type should act as the identity element for the binary reduction function. * The initial value type for ``exclusive_scan``, ``inclusive_scan``, ``exclusive_scan_by_segment``, @@ -144,28 +161,5 @@ Known Limitations the dereferenced value type of the provided iterators should satisfy the ``DefaultConstructible`` requirements. 
* For ``remove``, ``remove_if``, ``unique`` the dereferenced value type of the provided iterators should be ``MoveConstructible``. -* The algorithms that process uninitialized storage: ``uninitialized_copy``, ``uninitialized_copy_n``, ``uninitialized_fill``, ``uninitialized_fill_n``, ``uninitialized_fill_n``, ``uninitialized_move``, - ``uninitialized_move_n``, ``uninitialized_default_construct``, ``uninitialized_default_construct_n``, ``uninitialized_value_construct``, ``uninitialized_value_construct_n`` - should be called with a device policy when using device data and should be called with a host policy when using host data. Otherwise, the result is undefined. -* The algorithms that destroy data: ``destroy`` and ``destroy_n`` should be called with a host policy when using host data that was initialized on the host, and should be called with a device policy when using device data that was initialized on the device. Otherwise, the result is undefined. - - -Build Your Code with |onedpl_short| -=================================== - -Follow the steps below to build your code with |onedpl_short|: - -#. To build with the |dpcpp_cpp|, see the `Get Started with the Intel® oneAPI DPC++/C++ Compiler - `_ - for details. -#. Set the environment variables for |onedpl_short| and |onetbb_short|. -#. To avoid naming device policy objects explicitly, add the ``-fsycl-unnamed-lambda`` option. - -Below is an example of a command line used to compile code that contains -|onedpl_short| parallel algorithms on Linux* (depending on the code, parameters within [] could be unnecessary): - -.. code:: cpp - - dpcpp [-fsycl-unnamed-lambda] test.cpp [-ltbb|-fopenmp] -o test -.. _`Intel® oneAPI Threading Building Blocks (oneTBB) Release Notes`: https://www.intel.com/content/www/us/en/developer/articles/release-notes/intel-oneapi-threading-building-blocks-release-notes.html +.. 
_`SYCL Specification`: https://registry.khronos.org/SYCL/specs/sycl-2020/html/sycl-2020.html \ No newline at end of file diff --git a/_sources/introduction/onedpl_gsg.rst b/_sources/introduction/onedpl_gsg.rst index 5b598c23c3..761b7d677b 100644 --- a/_sources/introduction/onedpl_gsg.rst +++ b/_sources/introduction/onedpl_gsg.rst @@ -1,217 +1,223 @@ -Get Started with the |onedpl_long| -################################## - -|onedpl_long| (|onedpl_short|) works with the -`Intel® oneAPI DPC++/C++ Compiler `_ -to provide high-productivity APIs to developers, which can minimize SYCL* -programming efforts across devices for high performance parallel applications. - -|onedpl_short| consists of the following components: - -* Parallel API -* API for SYCL Kernels -* Macros - - -For general information about |onedpl_short|, visit the `oneDPL GitHub* repository `_, -or visit the `Intel® oneAPI DPC++ Library Guide `_ -and the `Intel® oneAPI DPC++ Library main page `_. - -Quick Start -=========== - -Installation ------------- - -Visit the |onedpl_short| `Release Notes -`_ -page for: - -* Where to Find the Release -* Overview -* New Features -* Fixed Issues -* Known Issues and Limitations - -Install the `Intel® oneAPI Base Toolkit (Base Kit) `_ -to use |onedpl_short|. - -To use Parallel API, include the corresponding header files in your source code. - -All |onedpl_short| header files are in the ``oneapi/dpl`` directory. Use ``#include `` to include them. -|onedpl_short| uses the namespace ``oneapi::dpl`` for most its classes and functions. - -To use tested C++ standard APIs, you need to include the corresponding C++ standard header files -and use the ``std`` namespace. - -CMake Support -------------- -`CMake `_ generates build scripts which can then be used to build and link your application. |onedpl_short| can be added to your project via CMake. - -A simple example for Linux is provided below. 
For more detailed usage and options including details specific to Windows, please look to the `CMake Support Page `_. - -Simple Example CMake File -************************* -To use |onedpl_short| with CMake, create a CMakeLists.txt file for your project's base directory and use `find_package `_ and `target_link_libraries `_ to add oneDPL. -For example: - -.. code:: cpp - - project(Foo) - add_executable(foo foo.cpp) - - # Search to find oneDPL - find_package(oneDPL REQUIRED) - - # Connect oneDPL to foo - target_link_libraries(foo oneDPL) - -Simple Example CMake Invocation -******************************* -The following is an example CMake invocation which generates build scripts for the project in the parent directory: - -.. code:: cpp - - mkdir build && cd build - cmake -DCMAKE_CXX_COMPILER=icpx -DCMAKE_BUILD_TYPE=release .. - -Example Build Command -********************* -Once build scripts have been generated for your desired configuration following the instruction above, a `build command `_ can be issued to build your project: - -.. code:: cpp - - cmake --build . - -pkg-config Support ------------------- - -The pkg-config program is used to retrieve information about your installed libraries, and -to compile and link against one or more libraries. - -Use pkg-config with |onedpl_short| -********************************** - -Use pkg-config with the ``--cflags`` flag to get the include path to the oneDPL directory: - -.. code:: cpp - - icpx -fsycl foo.cpp $(pkg-config --cflags dpl) - -The ``--msvc-syntax`` flag is required when you use a Microsoft Visual C++* compiler. -This flag converts your compiling and linking flags to the appropriate form: - -.. code:: cpp - - icpx -fsycl foo.cpp $(pkg-config --msvc-syntax --cflags dpl) - -.. note:: - Use the pkg-config tool to get rid of large hard-coded paths and make compilation more portable. - - -Usage Examples --------------- - -|onedpl_short| sample code is available from the -`oneAPI GitHub samples repository `_. 
-Each sample includes a readme with build instructions. - -\ Header Usage Example -****************************************** - -This example illustrates |onedpl_short| random number generator usage. -The sample below shows you how to create an random number generator engine object (the source of pseudo-randomness), -a distribution object (specifying the desired probability distribution), and how to generate -the random numbers themselves. Random number generation is performed in a vectorized manner -to improve the speed of your computations. - -This example performs its computations on your default SYCL device. You can set the -``SYCL_DEVICE_TYPE`` environment variable to CPU or GPU. - -.. code:: cpp - - template - void random_fill(float* usmptr, std::size_t n) { - auto zero = oneapi::dpl::counting_iterator(0); - - std::for_each(oneapi::dpl::execution::dpcpp_default, - zero, zero + n/VecSize, - [usmptr](std::size_t i) { - auto offset = i * VecSize; - - oneapi::dpl::minstd_rand_vec engine(seed, offset); - oneapi::dpl::uniform_real_distribution> distr; - - auto res = distr(engine); - res.store(i, sycl::global_ptr(usmptr)); - }); - } - -Pi Benchmark Usage Example -************************** - -This example uses a Monte Carlo method to estimate the value of π. -The basic idea is to generate random points within a square, and to check what -fraction of these random points lie in a quarter-circle inscribed within that square. -The expected value is the ratio of the areas of the quarter-circle and the square (π/4). -You can take the observed fraction of points in the quarter-circle as an estimate of π/4. - -This example shows you how to create an random number generator engine object (the source of pseudo-randomness), -a distribution object (specifying the desired probability distribution), generate the -random numbers themselves, and then perform a reduction to count quantity of points that -fit into the square *S*. 
Random number generation is performed in scalar manner to simplify your code. - - -.. figure:: images/pi_benchmark.png - :alt: An image of pi chart. - -.. code:: cpp - - float estimated_pi; - { - sycl::queue q(sycl::gpu_selector_v); - auto policy = oneapi::dpl::execution::make_device_policy(q); - - float sum = std::transform_reduce( policy, - oneapi::dpl::counting_iterator(0), - oneapi::dpl::counting_iterator(N), - 0.0f, - std::plus{}, - [=](int n){ - float local_sum = 0.0f; - oneapi::dpl::minstd_rand engine(SEED, n * ITER * 2); - oneapi::dpl::uniform_real_distribution distr; - for(int i = 0; i < ITER; ++i) { - float x = distr(engine); - float y = distr(engine); - if (x * x + y * y <= 1.0) - local_sum += 1.0; - } - return local_sum / (float)ITER; - } - ); - estimated_pi = 4.0f * (float)sum / N; - } - - -Find More -========= - -.. list-table:: - :widths: 50 50 - :header-rows: 1 - - * - Resource Link - - Description - * - `Intel® oneAPI DPC++ Library Guide `_ - - Refer to the |onedpl_short| guide for more in depth information. - * - `System Requirements `_ - - Check system requirements before you install |onedpl_short|. - * - `Intel® oneAPI DPC++ Library Release Notes `_ - - Check the release notes to learn about updates in the latest release. - * - `oneDPL Samples `_ - - Learn how to use |onedpl_short| with samples. - * - `Layers for Yocto* Project `_ - - Add oneAPI components to a Yocto project build using the meta-intel layers. - * - `oneAPI Samples Catalog `_ - - Explore the complete list of oneAPI code samples in the oneAPI Samples Catalog (GitHub*). These samples were designed to help you develop, offload, and optimize multiarchitecture applications targeting CPUs, GPUs, and FPGAs. 
\ No newline at end of file
+Get Started with the |onedpl_long|
+##################################
+
+|onedpl_long| (|onedpl_short|) works with the |dpcpp_cpp_with_gsg_link|_
+to provide high-productivity APIs to developers, which can minimize SYCL*
+programming efforts across devices for high performance parallel applications.
+
+|onedpl_short| consists of the following components:
+
+* Parallel API
+* API for SYCL Kernels
+* Macros
+
+
+For general information about |onedpl_short|, visit the `oneDPL GitHub* repository `_,
+or visit the |onedpl_library_guide|_ and the `Intel® oneAPI DPC++ Library main page
+`_.
+
+Quick Start
+===========
+
+Installation
+------------
+
+Visit the |onedpl_short| `Release Notes
+`_
+page for:
+
+* Where to Find the Release
+* Overview
+* New Features
+* Fixed Issues
+* Known Issues and Limitations
+
+Install the `Intel® oneAPI Base Toolkit (Base Kit) `_
+to use |onedpl_short|.
+
+To use Parallel API, include the corresponding header files in your source code.
+
+All |onedpl_short| header files are in the ``oneapi/dpl`` directory. Use ``#include `` to include them.
+|onedpl_short| uses the namespace ``oneapi::dpl`` for most of its classes and functions.
+
+To use tested C++ standard APIs, you need to include the corresponding C++ standard header files
+and use the ``std`` namespace.
+
+CMake Support
+-------------
+`CMake `_ generates build scripts which can then be used
+to build and link your application. |onedpl_short| can be added to your project via CMake.
+
+A simple example for Linux is provided below. For more detailed usage and options, including details specific to Windows,
+refer to the |dpcpp_cmake_support|_.
+
+Simple Example CMake File
+*************************
+To use |onedpl_short| with CMake, create a CMakeLists.txt file for your project's base directory and use
+`find_package `_
+and `target_link_libraries `_ to add oneDPL.
+For example:
+
+.. 
code:: cpp + + project(Foo) + add_executable(foo foo.cpp) + + # Search to find oneDPL + find_package(oneDPL REQUIRED) + + # Connect oneDPL to foo + target_link_libraries(foo oneDPL) + +Simple Example CMake Invocation +******************************* +The following is an example CMake invocation which generates build scripts for the project in the parent directory: + +.. code:: cpp + + mkdir build && cd build + cmake -DCMAKE_CXX_COMPILER=icpx -DCMAKE_BUILD_TYPE=release .. + +Example Build Command +********************* +Once build scripts have been generated for your desired configuration following the instruction above, a `build command +`_ can be issued to build your project: + +.. code:: cpp + + cmake --build . + +pkg-config Support +------------------ + +The pkg-config program is used to retrieve information about your installed libraries, and +to compile and link against one or more libraries. + +Use pkg-config with |onedpl_short| +********************************** + +Use pkg-config with the ``--cflags`` flag to get the include path to the oneDPL directory: + +.. code:: cpp + + icpx -fsycl foo.cpp $(pkg-config --cflags dpl) + +The ``--msvc-syntax`` flag is required when you use a Microsoft Visual C++* compiler. +This flag converts your compiling and linking flags to the appropriate form: + +.. code:: cpp + + icpx -fsycl foo.cpp $(pkg-config --msvc-syntax --cflags dpl) + +.. note:: + Use the pkg-config tool to get rid of large hard-coded paths and make compilation more portable. + + +Usage Examples +-------------- + +|onedpl_short| sample code is available from the +`oneAPI GitHub samples repository `_. +Each sample includes a readme with build instructions. + +\ Header Usage Example +****************************************** + +This example illustrates |onedpl_short| random number generator usage. 
+The sample below shows you how to create a random number generator engine object (the source of pseudo-randomness),
+a distribution object (specifying the desired probability distribution), and how to generate
+the random numbers themselves. Random number generation is performed in a vectorized manner
+to improve the speed of your computations.
+
+This example performs its computations on your default SYCL device. You can set the
+``SYCL_DEVICE_TYPE`` environment variable to CPU or GPU.
+
+.. code:: cpp
+
+    template <int VecSize>
+    void random_fill(float* usmptr, std::size_t n) {
+        auto zero = oneapi::dpl::counting_iterator<std::size_t>(0);
+
+        std::for_each(oneapi::dpl::execution::dpcpp_default,
+            zero, zero + n/VecSize,
+            [usmptr](std::size_t i) {
+                auto offset = i * VecSize;
+
+                oneapi::dpl::minstd_rand_vec<VecSize> engine(seed, offset);
+                oneapi::dpl::uniform_real_distribution<sycl::vec<float, VecSize>> distr;
+
+                auto res = distr(engine);
+                res.store(i, sycl::global_ptr<float>(usmptr));
+            });
+    }
+
+Pi Benchmark Usage Example
+**************************
+
+This example uses a Monte Carlo method to estimate the value of π.
+The basic idea is to generate random points within a square, and to check what
+fraction of these random points lie in a quarter-circle inscribed within that square.
+The expected value is the ratio of the areas of the quarter-circle and the square (π/4).
+You can take the observed fraction of points in the quarter-circle as an estimate of π/4.
+
+This example shows you how to create a random number generator engine object (the source of pseudo-randomness),
+a distribution object (specifying the desired probability distribution), generate the
+random numbers themselves, and then perform a reduction to count the number of points that
+fit into the square *S*. Random number generation is performed in a scalar manner to simplify your code.
+
+
+.. figure:: images/pi_benchmark.png
+   :alt: An image of a pi chart.
+
+.. 
code:: cpp
+
+    float estimated_pi;
+    {
+        sycl::queue q(sycl::gpu_selector_v);
+        auto policy = oneapi::dpl::execution::make_device_policy(q);
+
+        float sum = std::transform_reduce( policy,
+                                           oneapi::dpl::counting_iterator<int>(0),
+                                           oneapi::dpl::counting_iterator<int>(N),
+                                           0.0f,
+                                           std::plus<float>{},
+                                           [=](int n){
+                                               float local_sum = 0.0f;
+                                               oneapi::dpl::minstd_rand engine(SEED, n * ITER * 2);
+                                               oneapi::dpl::uniform_real_distribution<float> distr;
+                                               for(int i = 0; i < ITER; ++i) {
+                                                   float x = distr(engine);
+                                                   float y = distr(engine);
+                                                   if (x * x + y * y <= 1.0)
+                                                       local_sum += 1.0;
+                                               }
+                                               return local_sum / (float)ITER;
+                                           }
+        );
+        estimated_pi = 4.0f * (float)sum / N;
+    }
+
+
+Find More
+=========
+
+.. list-table::
+   :widths: 50 50
+   :header-rows: 1
+
+   * - Resource Link
+     - Description
+   * - |onedpl_library_guide|_
+     - Refer to the |onedpl_short| guide for more in-depth information.
+   * - `System Requirements `_
+     - Check system requirements before you install |onedpl_short|.
+   * - `Intel® oneAPI DPC++ Library Release Notes
+       `_
+     - Check the release notes to learn about updates in the latest release.
+   * - `oneDPL Samples `_
+     - Learn how to use |onedpl_short| with samples.
+   * - |yocto_layers|_
+     - Add oneAPI components to a Yocto project build using the meta-intel layers.
+   * - `oneAPI Samples Catalog `_
+     - Explore the complete list of oneAPI code samples in the oneAPI Samples Catalog (GitHub*).
+       These samples were designed to help you develop, offload, and optimize multiarchitecture applications targeting CPUs, GPUs, and FPGAs.
\ No newline at end of file
diff --git a/_sources/introduction/release_notes.rst b/_sources/introduction/release_notes.rst
index 8f5ce72db7..f69dffa710 100644
--- a/_sources/introduction/release_notes.rst
+++ b/_sources/introduction/release_notes.rst
@@ -1,8 +1,8 @@
-.. |release_notes| replace:: |onedpl_long| Release Notes
-.. 
_release_notes: https://www.intel.com/content/www/us/en/developer/articles/release-notes/intel-oneapi-dpcpp-library-release-notes.html
-
-=============
-Release Notes
-=============
-
+.. |release_notes| replace:: |onedpl_long| Release Notes
+.. _release_notes: https://www.intel.com/content/www/us/en/developer/articles/release-notes/intel-oneapi-dpcpp-library-release-notes.html
+
+=============
+Release Notes
+=============
+
 Refer to |release_notes|_.
\ No newline at end of file
diff --git a/_sources/kernel_templates/esimd/radix_sort.rst b/_sources/kernel_templates/esimd/radix_sort.rst
index c74ece79a2..f6ba4ad36d 100644
--- a/_sources/kernel_templates/esimd/radix_sort.rst
+++ b/_sources/kernel_templates/esimd/radix_sort.rst
@@ -1,16 +1,17 @@
 Radix Sort
 ##########
 
----------------------------------------------------
-radix_sort and radix_sort_by_key Function Templates
----------------------------------------------------
+-----------------------------
+radix_sort Function Templates
+-----------------------------
 
-The ``radix_sort`` and ``radix_sort_by_key`` functions sort data using the radix sort algorithm.
-The sorting is stable, ensuring the preservation of the relative order of elements with equal keys.
-The functions implement a Onesweep* [#fnote1]_ algorithm variant. Both in-place and out-of-place
-overloads are provided. For out-of-place overloads, the input data order is preserved.
+The ``radix_sort`` function sorts data using the radix sort algorithm.
+The sorting is stable, preserving the relative order of elements with equal keys.
+Both in-place and out-of-place overloads are provided. Out-of-place overloads do not alter the input sequence.
 
-A synopsis of the ``radix_sort`` and ``radix_sort_by_key`` functions is provided below:
+The function implements a Onesweep* [#fnote1]_ algorithm variant.
+
+A synopsis of the ``radix_sort`` function is provided below:
 
 .. 
code:: cpp @@ -18,7 +19,7 @@ A synopsis of the ``radix_sort`` and ``radix_sort_by_key`` functions is provided namespace oneapi::dpl::experimental::kt::gpu::esimd { - // Sort a single sequence + // Sort in-place template sycl::event @@ -31,55 +32,24 @@ A synopsis of the ``radix_sort`` and ``radix_sort_by_key`` functions is provided radix_sort (sycl::queue q, Range&& r, KernelParam param); // (2) - // Sort a single sequence out-of-place + // Sort out-of-place template sycl::event radix_sort (sycl::queue q, Iterator1 first, Iterator1 last, - Iterator2 first_out, KernelParam param) // (3) + Iterator2 first_out, KernelParam param); // (3) template sycl::event radix_sort (sycl::queue q, Range1&& r, Range2&& r_out, - KernelParam param) // (4) - - - // Sort a sequence of keys and apply the same order to a sequence of values - template - sycl::event - radix_sort_by_key (sycl::queue q, Iterator1 keys_first, Iterator1 keys_last, - Iterator2 values_first, KernelParam param); // (5) - - template - sycl::event - radix_sort_by_key (sycl::queue q, KeysRng&& keys, - ValuesRng&& values, KernelParam param); // (6) - - - // Sort a sequence of keys and values out-of-place - template - sycl::event - radix_sort_by_key (sycl::queue q, KeysIterator1 keys_first, - KeysIterator1 keys_last, ValsIterator1 vals_first, - KeysIterator2 keys_out_first, ValsIterator2 vals_out_first, - KernelParam param) // (7) - - template - sycl::event - radix_sort_by_key (sycl::queue q, KeysRng1&& keys, ValsRng1&& values, - KeysRng2&& keys_out, ValsRng2&& vals_out, - KernelParam param) // (8) + KernelParam param); // (4) } +.. note:: + The ``radix_sort`` is currently available only for Intel® Data Center GPU Max Series, + and requires Intel® oneAPI DPC++/C++ Compiler 2023.2 or newer. 
Template Parameters -------------------- @@ -99,22 +69,22 @@ Parameters +-----------------------------------------------+---------------------------------------------------------------------+ | Name | Description | +===============================================+=====================================================================+ -| ``q`` | The SYCL* queue where kernels are submitted. | +| ``q`` | The SYCL* queue where kernels are submitted. | +-----------------------------------------------+---------------------------------------------------------------------+ | | | | | The sequences to apply the algorithm to. | | - ``first``, ``last`` (1), | Supported sequence types: | | - ``r`` (2), | | -| - ``first``, ``last``, ``first_out`` (3), | - :ref:`USM pointers ` (1,3,5,7), | -| - ``r``, ``r_out`` (4), | - :ref:`oneapi::dpl::begin and oneapi::dpl::end | -| - ``keys_first``, ``keys_last``, | ` (1,3,5,7). | -| ``values_first`` (5), | - ``sycl::buffer`` (2,4,6,8), | -| - ``keys``, ``values`` (6), | - :ref:`oneapi::dpl::experimental::ranges::views::all | -| - ``keys_first``, ``keys_last``, | ` (2,4,6,8), | -| ``vals_first``, ``keys_out_first``, | - :ref:`oneapi::dpl::experimental::ranges::views::subrange | -| ``values_out_first`` (7) | ` (2,4,6,8), | -| - ``keys``, ``values``, | | -| ``keys_out``, ``values_out`` (8), | | +| - ``first``, ``last``, ``first_out`` (3), | - :ref:`USM pointers ` (1,3), | +| - ``r``, ``r_out`` (4). | - :ref:`oneapi::dpl::begin and oneapi::dpl::end | +| | ` (1,3). | +| | - ``sycl::buffer`` (2,4), | +| | - :ref:`oneapi::dpl::experimental::ranges::views::all | +| | ` (2,4), | +| | - :ref:`oneapi::dpl::experimental::ranges::views::subrange | +| | ` (2,4). | +| | | +| | | | | | +-----------------------------------------------+---------------------------------------------------------------------+ | ``param`` | A :doc:`kernel_param <../kernel_configuration>` object. 
| @@ -147,8 +117,8 @@ Usage Examples -------------- -radix_sort In-Place Example ---------------------------- +In-Place Example +---------------- .. code:: cpp @@ -185,74 +155,14 @@ radix_sort In-Place Example return 0; } -**Output:** - -.. code:: none +**Output**:: 5 3 3 3 2 1 -radix_sort_by_key In-Place Example ----------------------------------- - -.. code:: cpp - - // possible build and run commands: - // icpx -fsycl radix_sort_by_key.cpp -o radix_sort_by_key -I /path/to/oneDPL/include && ./radix_sort_by_key - - #include - #include - #include - - #include - - namespace kt = oneapi::dpl::experimental::kt; - - int main() - { - std::size_t n = 6; - sycl::queue q{sycl::gpu_selector_v}; - sycl::buffer keys{sycl::range<1>(n)}; - sycl::buffer values{sycl::range<1>(n)}; - - // initialize - { - sycl::host_accessor k_acc{keys, sycl::write_only}; - k_acc[0] = 3, k_acc[1] = 2, k_acc[2] = 1, k_acc[3] = 5, k_acc[4] = 3, k_acc[5] = 3; - - sycl::host_accessor v_acc{values, sycl::write_only}; - v_acc[0] = 'r', v_acc[1] = 'o', v_acc[2] = 's', v_acc[3] = 'd', v_acc[4] = 't', v_acc[5] = 'e'; - } - - // sort - auto e = kt::gpu::esimd::radix_sort_by_key(q, keys, values, kt::kernel_param<96, 64>{}); // (6) - e.wait(); - - // print - { - sycl::host_accessor k_acc{keys, sycl::read_only}; - for(std::size_t i = 0; i < n; ++i) - std::cout << k_acc[i] << ' '; - std::cout << '\n'; - - sycl::host_accessor v_acc{values, sycl::read_only}; - for(std::size_t i = 0; i < n; ++i) - std::cout << v_acc[i] << ' '; - std::cout << '\n'; - } - - return 0; - } - -**Output:** - -.. code:: none - - 1 2 3 3 3 5 - s o r t e d -radix_sort Out-of-Place Example -------------------------------- +Out-of-Place Example +-------------------- .. code:: cpp @@ -294,101 +204,24 @@ radix_sort Out-of-Place Example return 0; } -**Output:** - -.. code:: none +**Output**:: 3 2 1 5 3 3 5 3 3 3 2 1 -radix_sort_by_key Out-of-Place Example --------------------------------------- - -.. 
code:: cpp - - // possible build and run commands: - // icpx -fsycl radix_sort_by_key.cpp -o radix_sort_by_key -I /path/to/oneDPL/include && ./radix_sort_by_key - #include - #include - #include - - #include - - namespace kt = oneapi::dpl::experimental::kt; - - int main() - { - std::size_t n = 6; - sycl::queue q{sycl::gpu_selector_v}; - sycl::buffer keys{sycl::range<1>(n)}; - sycl::buffer keys_out{sycl::range<1>(n)}; - sycl::buffer values{sycl::range<1>(n)}; - sycl::buffer values_out{sycl::range<1>(n)}; - - - // initialize - { - sycl::host_accessor k_acc{keys, sycl::write_only}; - k_acc[0] = 3, k_acc[1] = 2, k_acc[2] = 1, k_acc[3] = 5, k_acc[4] = 3, k_acc[5] = 3; - - sycl::host_accessor v_acc{values, sycl::write_only}; - v_acc[0] = 'r', v_acc[1] = 'o', v_acc[2] = 's', v_acc[3] = 'd', v_acc[4] = 't', v_acc[5] = 'e'; - } - - // sort - auto e = kt::gpu::esimd::radix_sort_by_key(q, keys, values, keys_out, values_out, - kt::kernel_param<96, 64>{}); // (8) - e.wait(); - - // print - { - sycl::host_accessor k_acc{keys, sycl::read_only}; - for(std::size_t i = 0; i < n; ++i) - std::cout << k_acc[i] << ' '; - std::cout << '\n'; - - sycl::host_accessor v_acc{values, sycl::read_only}; - for(std::size_t i = 0; i < n; ++i) - std::cout << v_acc[i] << ' '; - std::cout << "\n\n"; - - sycl::host_accessor k_out_acc{keys_out, sycl::read_only}; - for(std::size_t i = 0; i < n; ++i) - std::cout << k_out_acc[i] << ' '; - std::cout << '\n'; - - sycl::host_accessor v_out_acc{values_out, sycl::read_only}; - for(std::size_t i = 0; i < n; ++i) - std::cout << v_out_acc[i] << ' '; - std::cout << '\n'; - } - - return 0; - } - -**Output:** - -.. code:: none - - 3 2 1 5 3 3 - r o s d t e - - 1 2 3 3 3 5 - s o r t e d - - -.. _memory-requirements: +.. 
_radix-sort-memory-requirements: ------------------- Memory Requirements ------------------- -The algorithms use global and local device memory (see `SYCL 2020 Specification +The algorithm uses global and local device memory (see `SYCL 2020 Specification `_) -for intermediate data storage. For the algorithms to operate correctly, there must be enough memory -on the device; otherwise, the behavior is undefined. The amount of memory that is required -depends on input data and configuration parameters, as described below. +for intermediate data storage. For the algorithm to operate correctly, there must be enough memory on the device. +If there is not enough global device memory, a ``std::bad_alloc`` exception is thrown. +The behavior is undefined if there is not enough local memory. +The amount of memory that is required depends on input data and configuration parameters, as described below. Global Memory Requirements -------------------------- @@ -396,12 +229,9 @@ Global Memory Requirements Global memory is used for copying the input sequence(s) and storing internal data such as radix value counters. The used amount depends on many parameters; below is an upper bound approximation: -:``radix_sort``: N\ :sub:`keys` + C * N\ :sub:`keys` - -:``radix_sort_by_key``: N\ :sub:`keys` + N\ :sub:`values` + C * N\ :sub:`keys` + N\ :sub:`keys` + C * N\ :sub:`keys` -where the sequence with keys takes N\ :sub:`keys` space, the sequence with values takes N\ :sub:`values` space, -and the additional space is C * N\ :sub:`keys`. +where the sequence with keys takes N\ :sub:`keys` space, and the additional space is C * N\ :sub:`keys`. The value of `C` depends on ``param.data_per_workitem``, ``param.workgroup_size``, and ``RadixBits``. 
For ``param.data_per_workitem`` set to `32`, ``param.workgroup_size`` to `64`, and ``RadixBits`` to `8`, @@ -413,35 +243,26 @@ Incrementing ``RadixBits`` increases `C` up to twice, while doubling either If the number of elements to sort does not exceed ``param.data_per_workitem * param.workgroup_size``, ``radix_sort`` is executed by a single work-group and does not use any global memory. - For ``radix_sort_by_key`` there is no single work-group implementation yet. .. The estimation above is not very precise and it seems it is not necessary for the global memory. The C coefficient base is actually 0.53 instead of 1. An increment of RadixBits multiplies C by the factor of ~1.5 on average. - Additionally, C exceeds 1 for radix_sort_by_key, - when N is small and the global histogram takes more space than the sequences. - This space is small, single WG implementation will be added, therefore this is neglected. - -.. _local-memory: Local Memory Requirements ------------------------- -Local memory is used for reordering keys or key-value pairs within a work-group, +Local memory is used for reordering keys within a work-group, and for storing internal data such as radix value counters. The used amount depends on many parameters; below is an upper bound approximation: -:``radix_sort``: N\ :sub:`keys_per_workgroup` + C - -:``radix_sort_by_key``: N\ :sub:`keys_per_workgroup` + N\ :sub:`values_per_workgroup` + C + N\ :sub:`keys_per_workgroup` + C -where N\ :sub:`keys_per_workgroup` and N\ :sub:`values_per_workgroup` are the amounts of memory -to store keys and values, respectively. `C` is some additional space for storing internal data. +where N\ :sub:`keys_per_workgroup` is the amount of memory to store keys. +`C` is some additional space for storing internal data. 
N\ :sub:`keys_per_workgroup` equals to ``sizeof(key_type) * param.data_per_workitem * param.workgroup_size``, -N\ :sub:`values_per_workgroup` equals to ``sizeof(value_type) * param.data_per_workitem * param.workgroup_size``, `C` does not exceed `4KB`. .. @@ -484,7 +305,7 @@ The initial configuration may be selected according to these high-level guidelin .. warning:: Avoid setting too large ``param.data_per_workitem`` and ``param.workgroup_size`` values. - Make sure that :ref:`Memory requirements ` are satisfied. + Make sure that :ref:`Memory requirements ` are satisfied. .. note:: @@ -492,7 +313,7 @@ The initial configuration may be selected according to these high-level guidelin since ``param.workgroup_size`` currently supports only one value (`64`). -.. [#fnote1] Andy Adinets and Duane Merrill (2022). Onesweep: A Faster Least Significant Digit Radix Sort for GPUs. Retrieved from https://arxiv.org/abs/2206.01784. +.. [#fnote1] Andy Adinets and Duane Merrill (2022). Onesweep: A Faster Least Significant Digit Radix Sort for GPUs. https://arxiv.org/abs/2206.01784. .. [#fnote2] The X\ :sup:`e`-core term is described in the `oneAPI GPU Optimization Guide `_. Check the number of cores in the device specification, such as `Intel® Data Center GPU Max specification diff --git a/_sources/kernel_templates/esimd/radix_sort_by_key.rst b/_sources/kernel_templates/esimd/radix_sort_by_key.rst new file mode 100644 index 0000000000..9ee99fadb6 --- /dev/null +++ b/_sources/kernel_templates/esimd/radix_sort_by_key.rst @@ -0,0 +1,361 @@ +Radix Sort By Key +################# + +------------------------------------ +radix_sort_by_key Function Templates +------------------------------------ + +The ``radix_sort_by_key`` function sorts keys using the radix sort algorithm, applying the same order to the corresponding values. +The sorting is stable, preserving the relative order of elements with equal keys. +Both in-place and out-of-place overloads are provided. 
Out-of-place overloads do not alter the input sequences.
+
+The function implements a Onesweep* [#fnote1]_ algorithm variant.
+
+A synopsis of the ``radix_sort_by_key`` function is provided below:
+
+.. code:: cpp
+
+   // defined in <oneapi/dpl/experimental/kernel_templates>
+
+   namespace oneapi::dpl::experimental::kt::gpu::esimd {
+
+   // Sort in-place
+   template <bool IsAscending = true, std::uint8_t RadixBits = 8,
+             typename Iterator1, typename Iterator2, typename KernelParam>
+   sycl::event
+   radix_sort_by_key (sycl::queue q, Iterator1 keys_first, Iterator1 keys_last,
+                      Iterator2 values_first, KernelParam param); // (1)
+
+   template <bool IsAscending = true, std::uint8_t RadixBits = 8,
+             typename KeysRng, typename ValuesRng, typename KernelParam>
+   sycl::event
+   radix_sort_by_key (sycl::queue q, KeysRng&& keys,
+                      ValuesRng&& values, KernelParam param); // (2)
+
+
+   // Sort out-of-place
+   template <bool IsAscending = true, std::uint8_t RadixBits = 8,
+             typename KeysIterator1, typename ValuesIterator1,
+             typename KeysIterator2, typename ValuesIterator2, typename KernelParam>
+   sycl::event
+   radix_sort_by_key (sycl::queue q, KeysIterator1 keys_first,
+                      KeysIterator1 keys_last, ValuesIterator1 values_first,
+                      KeysIterator2 keys_out_first, ValuesIterator2 values_out_first,
+                      KernelParam param); // (3)
+
+   template <bool IsAscending = true, std::uint8_t RadixBits = 8,
+             typename KeysRng1, typename ValuesRng1,
+             typename KeysRng2, typename ValuesRng2, typename KernelParam>
+   sycl::event
+   radix_sort_by_key (sycl::queue q, KeysRng1&& keys, ValuesRng1&& values,
+                      KeysRng2&& keys_out, ValuesRng2&& values_out,
+                      KernelParam param); // (4)
+   }
+
+.. note::
+   ``radix_sort_by_key`` is currently available only for Intel® Data Center GPU Max Series,
+   and requires Intel® oneAPI DPC++/C++ Compiler 2023.2 or newer.
+
+Template Parameters
+-------------------
+
++----------------------------+----------------------------------------------------------------+
+| Name                       | Description                                                    |
++============================+================================================================+
+| ``bool IsAscending``       | The sort order. Ascending: ``true``; Descending: ``false``.    |
++----------------------------+----------------------------------------------------------------+
+| ``std::uint8_t RadixBits`` | The number of bits to sort for each radix sort algorithm pass. |
++----------------------------+----------------------------------------------------------------+
+
+
+Parameters
+----------
+
++-----------------------------------------------+---------------------------------------------------------------------+
+| Name                                          | Description                                                         |
++===============================================+=====================================================================+
+| ``q``                                         | The SYCL* queue where kernels are submitted.                        |
++-----------------------------------------------+---------------------------------------------------------------------+
+|                                               |                                                                     |
+|                                               | The sequences to apply the algorithm to.                            |
+| - ``keys_first``, ``keys_last``,              | Supported sequence types:                                           |
+|   ``values_first`` (1),                       |                                                                     |
+| - ``keys``, ``values`` (2),                   | - :ref:`USM pointers ` (1,3),                                       |
+| - ``keys_first``, ``keys_last``,              | - :ref:`oneapi::dpl::begin and oneapi::dpl::end                     |
+|   ``values_first``, ``keys_out_first``,       |   ` (1,3),                                                          |
+|   ``values_out_first`` (3),                   | - ``sycl::buffer`` (2,4),                                           |
+| - ``keys``, ``values``,                       | - :ref:`oneapi::dpl::experimental::ranges::views::all               |
+|   ``keys_out``, ``values_out`` (4).           |   ` (2,4),                                                          |
+|                                               | - :ref:`oneapi::dpl::experimental::ranges::views::subrange          |
+|                                               |   ` (2,4).                                                          |
+|                                               |                                                                     |
++-----------------------------------------------+---------------------------------------------------------------------+
+| ``param``                                     | A :doc:`kernel_param <../kernel_configuration>` object.             |
+|                                               | Its ``data_per_workitem`` must be a positive multiple of 32.        |
+|                                               |                                                                     |
++-----------------------------------------------+---------------------------------------------------------------------+
+
+
+**Type Requirements**:
+
+- The element type of sequence(s) to sort must be a C++ integral or floating-point type
+  other than ``bool`` with a width of up to 64 bits.
+
+.. note::
+
+   Current limitations:
+
+   - Number of elements to sort must not exceed `2^30`.
+   - ``RadixBits`` can only be `8`.
+   - ``param.workgroup_size`` can only be `64`.
+
+Return Value
+------------
+
+A ``sycl::event`` object representing the status of the algorithm execution.
+
+--------------
+Usage Examples
+--------------
+
+
+In-Place Example
+----------------
+
+.. code:: cpp
+
+   // possible build and run commands:
+   //    icpx -fsycl radix_sort_by_key.cpp -o radix_sort_by_key -I /path/to/oneDPL/include && ./radix_sort_by_key
+
+   #include <cstdint>
+   #include <iostream>
+   #include <sycl/sycl.hpp>
+
+   #include <oneapi/dpl/experimental/kernel_templates>
+
+   namespace kt = oneapi::dpl::experimental::kt;
+
+   int main()
+   {
+      std::size_t n = 6;
+      sycl::queue q{sycl::gpu_selector_v};
+      sycl::buffer<std::uint32_t> keys{sycl::range<1>(n)};
+      sycl::buffer<char> values{sycl::range<1>(n)};
+
+      // initialize
+      {
+         sycl::host_accessor k_acc{keys, sycl::write_only};
+         k_acc[0] = 3, k_acc[1] = 2, k_acc[2] = 1, k_acc[3] = 5, k_acc[4] = 3, k_acc[5] = 3;
+
+         sycl::host_accessor v_acc{values, sycl::write_only};
+         v_acc[0] = 'r', v_acc[1] = 'o', v_acc[2] = 's', v_acc[3] = 'd', v_acc[4] = 't', v_acc[5] = 'e';
+      }
+
+      // sort
+      auto e = kt::gpu::esimd::radix_sort_by_key(q, keys, values, kt::kernel_param<96, 64>{}); // (2)
+      e.wait();
+
+      // print
+      {
+         sycl::host_accessor k_acc{keys, sycl::read_only};
+         for (std::size_t i = 0; i < n; ++i)
+            std::cout << k_acc[i] << ' ';
+         std::cout << '\n';
+
+         sycl::host_accessor v_acc{values, sycl::read_only};
+         for (std::size_t i = 0; i < n; ++i)
+            std::cout << v_acc[i] << ' ';
+         std::cout << '\n';
+      }
+
+      return 0;
+   }
+
+**Output**::
+
+   1 2 3 3 3 5
+   s o r t e d
+
+Out-of-Place Example
+--------------------
+
+.. code:: cpp
+
+   // possible build and run commands:
+   //    icpx -fsycl radix_sort_by_key.cpp -o radix_sort_by_key -I /path/to/oneDPL/include && ./radix_sort_by_key
+
+   #include <cstdint>
+   #include <iostream>
+   #include <sycl/sycl.hpp>
+
+   #include <oneapi/dpl/experimental/kernel_templates>
+
+   namespace kt = oneapi::dpl::experimental::kt;
+
+   int main()
+   {
+      std::size_t n = 6;
+      sycl::queue q{sycl::gpu_selector_v};
+      sycl::buffer<std::uint32_t> keys{sycl::range<1>(n)};
+      sycl::buffer<std::uint32_t> keys_out{sycl::range<1>(n)};
+      sycl::buffer<char> values{sycl::range<1>(n)};
+      sycl::buffer<char> values_out{sycl::range<1>(n)};
+
+      // initialize
+      {
+         sycl::host_accessor k_acc{keys, sycl::write_only};
+         k_acc[0] = 3, k_acc[1] = 2, k_acc[2] = 1, k_acc[3] = 5, k_acc[4] = 3, k_acc[5] = 3;
+
+         sycl::host_accessor v_acc{values, sycl::write_only};
+         v_acc[0] = 'r', v_acc[1] = 'o', v_acc[2] = 's', v_acc[3] = 'd', v_acc[4] = 't', v_acc[5] = 'e';
+      }
+
+      // sort
+      auto e = kt::gpu::esimd::radix_sort_by_key(q, keys, values, keys_out, values_out,
+                                                 kt::kernel_param<96, 64>{}); // (4)
+      e.wait();
+
+      // print
+      {
+         sycl::host_accessor k_acc{keys, sycl::read_only};
+         for (std::size_t i = 0; i < n; ++i)
+            std::cout << k_acc[i] << ' ';
+         std::cout << '\n';
+
+         sycl::host_accessor v_acc{values, sycl::read_only};
+         for (std::size_t i = 0; i < n; ++i)
+            std::cout << v_acc[i] << ' ';
+         std::cout << "\n\n";
+
+         sycl::host_accessor k_out_acc{keys_out, sycl::read_only};
+         for (std::size_t i = 0; i < n; ++i)
+            std::cout << k_out_acc[i] << ' ';
+         std::cout << '\n';
+
+         sycl::host_accessor v_out_acc{values_out, sycl::read_only};
+         for (std::size_t i = 0; i < n; ++i)
+            std::cout << v_out_acc[i] << ' ';
+         std::cout << '\n';
+      }
+
+      return 0;
+   }
+
+**Output**::
+
+   3 2 1 5 3 3
+   r o s d t e
+
+   1 2 3 3 3 5
+   s o r t e d
+
+
+.. _radix-sort-by-key-memory-requirements:
+
+-------------------
+Memory Requirements
+-------------------
+
+The algorithm uses global and local device memory (see `SYCL 2020 Specification
+<https://registry.khronos.org/SYCL/specs/sycl-2020/html/sycl-2020.html#_sycl_device_memory_model>`_)
+for intermediate data storage.
For the algorithm to operate correctly, there must be enough memory on the device.
+If there is not enough global device memory, a ``std::bad_alloc`` exception is thrown.
+The behavior is undefined if there is not enough local memory.
+The amount of memory that is required depends on input data and configuration parameters, as described below.
+
+Global Memory Requirements
+--------------------------
+
+Global memory is used for copying the input sequence(s) and storing internal data such as radix value counters.
+The used amount depends on many parameters; below is an upper bound approximation:
+
+   N\ :sub:`keys` + N\ :sub:`values` + C * N\ :sub:`keys`
+
+where the sequence with keys takes N\ :sub:`keys` space, the sequence with values takes N\ :sub:`values` space,
+and the additional space is C * N\ :sub:`keys`.
+
+The value of `C` depends on ``param.data_per_workitem``, ``param.workgroup_size``, and ``RadixBits``.
+For ``param.data_per_workitem`` set to `32`, ``param.workgroup_size`` to `64`, and ``RadixBits`` to `8`,
+`C` is approximately `1`.
+Incrementing ``RadixBits`` increases `C` by up to a factor of two, while doubling either
+``param.data_per_workitem`` or ``param.workgroup_size`` halves `C`.
+
+..
+   The estimation above is not very precise and it seems it is not necessary for the global memory.
+   The C coefficient base is actually 0.53 instead of 1.
+   An increment of RadixBits multiplies C by the factor of ~1.5 on average.
+
+   Additionally, C exceeds 1 for radix_sort_by_key,
+   when N is small and the global histogram takes more space than the sequences.
+   This space is small and a single-WG implementation will be added, therefore this is neglected.
+
+Local Memory Requirements
+-------------------------
+
+Local memory is used for reordering key-value pairs within a work-group,
+and for storing internal data such as radix value counters.
+The used amount depends on many parameters; below is an upper bound approximation:
+
+   N\ :sub:`keys_per_workgroup` + N\ :sub:`values_per_workgroup` + C
+
+where N\ :sub:`keys_per_workgroup` and N\ :sub:`values_per_workgroup` are the amounts of memory
+to store keys and values, respectively. `C` is some additional space for storing internal data.
+
+N\ :sub:`keys_per_workgroup` equals ``sizeof(key_type) * param.data_per_workitem * param.workgroup_size``,
+N\ :sub:`values_per_workgroup` equals ``sizeof(value_type) * param.data_per_workitem * param.workgroup_size``,
+and `C` does not exceed `4KB`.
+
+..
+   C as 4KB stands on these points:
+   1) Extra space is needed to store a histogram to distribute keys. Its size is 4 * (2^RadixBits).
+      The estimation is correct for RadixBits 9 (2KB) and smaller. Support of larger RadixBits is not expected.
+   2) N_keys + N_values is rounded up to a 2KB boundary (temporarily, as a workaround for a GPU driver bug).
+
+..
+   The estimation assumes that reordering keys/pairs takes more space than ranking keys.
+   The ranking takes approximately "2 * workgroup_size * (2^RadixBits)" bytes.
+   It surpasses Intel Data Center GPU Max SLM capacity in only marginal cases,
+   e.g., when RadixBits is 10 and workgroup_size is 64, or when RadixBits is 9 and workgroup_size is 128.
+   It is ignored as an unrealistic case.
+
+-----------------------------------------
+Recommended Settings for Best Performance
+-----------------------------------------
+
+The general advice is to choose kernel parameters based on performance measurements and profiling information.
+The initial configuration may be selected according to these high-level guidelines:
+
+..
+   TODO: add this part when param.workgroup_size supports more than one value:
+   Increasing ``param.data_per_workitem`` should usually be preferred to increasing ``param.workgroup_size``,
+   to avoid extra synchronization overhead within a work-group.
+
+- When the number of elements to sort ``N`` is less than 1M, utilizing all available
+  compute cores is key for better performance. Allow creating enough work chunks to feed all
+  X\ :sup:`e`-cores [#fnote2]_ on a GPU: ``param.data_per_workitem * param.workgroup_size ≈ N / xe_core_count``.
+
+- When the number of elements to sort is large (more than ~1M), maximizing the number of elements
+  processed by a work-group, which equals ``param.data_per_workitem * param.workgroup_size``,
+  reduces synchronization overheads between work-groups and usually benefits the overall performance.
+
+.. warning::
+
+   Avoid ``param.data_per_workitem`` and ``param.workgroup_size`` values that are too large.
+   Make sure that the :ref:`Memory requirements <radix-sort-by-key-memory-requirements>` are satisfied.
+
+.. note::
+
+   ``param.data_per_workitem`` is the only available parameter to tune the performance,
+   since ``param.workgroup_size`` currently supports only one value (`64`).
+
+
+.. [#fnote1] Andy Adinets and Duane Merrill (2022). Onesweep: A Faster Least Significant Digit Radix Sort for GPUs. https://arxiv.org/abs/2206.01784.
+.. [#fnote2] The X\ :sup:`e`-core term is described in the `oneAPI GPU Optimization Guide
+   `_.
+   Check the number of cores in the device specification, such as `Intel® Data Center GPU Max specification
+   `_.
diff --git a/_sources/kernel_templates/esimd_main.rst b/_sources/kernel_templates/esimd_main.rst
index c717e46d1e..3b1c4b555c 100644
--- a/_sources/kernel_templates/esimd_main.rst
+++ b/_sources/kernel_templates/esimd_main.rst
@@ -1,31 +1,19 @@
 ESIMD-Based Kernel Templates
 ############################
 
-The ESIMD kernel templates are based on `Explicit SIMD SYCL extension
-`_
-of Intel® oneAPI DPC++/C++ Compiler.
+The ESIMD kernel templates are based on |esimd_sycl_extension|_ of |dpcpp_cpp|.
 This technology only supports Intel GPU devices.
 
 These templates are available in the ``oneapi::dpl::experimental::kt::gpu::esimd`` namespace.
The following are implemented: -* :doc:`radix_sort and radix_sort_by_key ` +* :doc:`radix_sort ` +* :doc:`radix_sort_by_key ` .. toctree:: :maxdepth: 2 :titlesonly: - :glob: :hidden: esimd/radix_sort + esimd/radix_sort_by_key -------------------- -System Requirements -------------------- - -- Hardware: Intel® Data Center GPU Max Series. -- Compiler: Intel® oneAPI DPC++/C++ Compiler 2023.2 and newer. -- Operating Systems: - - - Red Hat Enterprise Linux* 9.2, - - SUSE Linux Enterprise Server* 15 SP5, - - Ubuntu* 22.04. diff --git a/_sources/kernel_templates/kernel_configuration.rst b/_sources/kernel_templates/kernel_configuration.rst index 8b2b9ac796..185d4fc735 100644 --- a/_sources/kernel_templates/kernel_configuration.rst +++ b/_sources/kernel_templates/kernel_configuration.rst @@ -58,21 +58,19 @@ Member Types | ``kernel_name`` | ``KernelName`` | An optional parameter that is used to set a kernel name. | | | | | | | | .. note:: | -| | | | -| | | The ``KernelName`` parameter might be required in case an implementation of | -| | | SYCL is not fully compliant with the SYCL 2020 Specification and | -| | | does not support optional kernel names. | +| | | The ``KernelName`` parameter might be required in case an implementation | +| | | of SYCL is not fully compliant with the `SYCL 2020 Specification`_ | +| | | and does not support optional kernel names. | | | | | | | | If omitted, SYCL kernel name(s) will be automatically generated. | | | | | | | | If provided, it must be a unique C++ typename that satisfies the requirements | -| | | for SYCL kernel names (see `SYCL 2020 Specification | -| | | `_). | +| | | for SYCL kernel names in the `SYCL 2020 Specification`_. | | | | | | | | .. note:: | -| | | | | | | The provided name can be augmented by oneDPL when used with | | | | a template that creates multiple SYCL kernels. | | | | | +-----------------+----------------+----------------------------------------------------------------------------------+ + +.. 
_`SYCL 2020 Specification`: https://registry.khronos.org/SYCL/specs/sycl-2020/html/sycl-2020.html#sec:naming.kernels
\ No newline at end of file
diff --git a/_sources/kernel_templates/single_pass_scan.rst b/_sources/kernel_templates/single_pass_scan.rst
index de2472e97b..06dd40bdf5 100644
--- a/_sources/kernel_templates/single_pass_scan.rst
+++ b/_sources/kernel_templates/single_pass_scan.rst
@@ -78,10 +78,12 @@ Parameters
 
    Current limitations:
 
-   - The function will internally block until the issued kernels have completed execution.
+   - The function is currently synchronous: although it is intended to become an asynchronous call in the future, it will not return until the algorithm fully completes.
    - The SYCL device associated with the provided queue must support 64-bit atomic operations if the element type is 64-bits.
-   - There must be a known identity value for the provided combination of the element type and the binary operation. That is, ``sycl::has_known_identity_v`` must evaluate to true. Such operators are listed in the `SYCL 2020 specification `_.
+   - There must be a known identity value for the provided combination of the element type and the binary operation. That is,
+     ``sycl::has_known_identity_v`` must evaluate to true. Such operators are listed in
+     the `SYCL 2020 specification <https://registry.khronos.org/SYCL/specs/sycl-2020/html/sycl-2020.html#sec:identities>`_.
 
 Return Value
 ------------
@@ -133,9 +135,7 @@ inclusive_scan Example
     return 0;
   }
 
-**Output:**
-
-.. code:: none
+**Output**::
 
   1 3 4 7 8 10
 
@@ -147,9 +147,10 @@ Memory Requirements
 
 The algorithm uses global and local device memory (see `SYCL 2020 Specification
 <https://registry.khronos.org/SYCL/specs/sycl-2020/html/sycl-2020.html#_sycl_device_memory_model>`__)
-for intermediate data storage. For the algorithm to operate correctly, there must be enough memory
-on the device. It throws a ``std::bad_alloc`` exception if there is not enough global device memory. The behavior is undefined if there is not enough local memory.
The amount of memory that is required
-depends on input data and configuration parameters, as described below.
+for intermediate data storage. For the algorithm to operate correctly, there must be enough memory on the device.
+If there is not enough global device memory, a ``std::bad_alloc`` exception is thrown.
+The behavior is undefined if there is not enough local memory.
+The amount of memory that is required depends on input data and configuration parameters, as described below.
 
 Global Memory Requirements
 --------------------------
diff --git a/_sources/kernel_templates_main.rst b/_sources/kernel_templates_main.rst
index 77affdc416..108e54221f 100644
--- a/_sources/kernel_templates_main.rst
+++ b/_sources/kernel_templates_main.rst
@@ -10,7 +10,7 @@ It is recommended to use kernel templates when there is an opportunity to custom
 for a particular workload (for example, the number of elements and their type),
 or for a specific device (for example, based on the available local memory).
 
-To use the API, include the ``oneapi/dpl/experimental/kernel_templates`` header file.
+To use the API, include the ``<oneapi/dpl/experimental/kernel_templates>`` header file.
 The primary API namespace is ``oneapi::dpl::experimental::kt``, and nested namespaces are used to further categorize the templates.
 
 * :doc:`Kernel Configuration <kernel_templates/kernel_configuration>`. Generic structure for configuring a kernel template.
@@ -20,7 +20,6 @@ The primary API namespace is ``oneapi::dpl::experimental::kt``, and nested names
 .. toctree::
    :maxdepth: 2
    :titlesonly:
-   :glob:
    :hidden:
 
    kernel_templates/kernel_configuration
diff --git a/_sources/macros.rst b/_sources/macros.rst
index 09718e798c..2a1b5e4f8b 100644
--- a/_sources/macros.rst
+++ b/_sources/macros.rst
@@ -27,6 +27,24 @@ Macro Description
 ``_PSTL_VERSION_PATCH`` ``_PSTL_VERSION % 10``: The patch number.
 ================================= ==============================
 
+.. _feature-macros:
+
+Feature Macros
+==============
+Use these macros to test the presence of specific |onedpl_short| functionality.
+ +================================== =============================================== +Macro Macro values and the functionality +================================== =============================================== +``ONEDPL_HAS_RANDOM_NUMBERS`` Pseudo-random number generators and distributions. + + * ``202409L`` - added support of comparison and I/O stream operators and an experimental Philox engine +---------------------------------- ----------------------------------------------- +``ONEDPL_HAS_RANGE_ALGORITHMS`` Parallel range algorithms. + + * ``202409L`` - see :ref:`available algorithms `. +================================== =============================================== + Additional Macros ================== Use these macros to control aspects of |onedpl_short| usage. You can set them in your program code @@ -38,9 +56,7 @@ Macro Description ``PSTL_USE_NONTEMPORAL_STORES`` This macro enables the use of ``#pragma vector nontemporal`` for write-only data when algorithms such as ``std::copy``, ``std::fill``, etc., are executed with unsequenced policies. - For further details about the pragma, - see the `vector page in the Intel® oneAPI DPC++/C++ Compiler Developer Guide and Reference - `_. + For further details about the pragma, see the |vector_pragma|_. If the macro evaluates to a non-zero value, the use of ``#pragma vector nontemporal`` is enabled. By default, the macro is not defined. @@ -94,11 +110,17 @@ Macro Description such as ``dpcpp_default`` and ``dpcpp_fpga``. When the macro is not defined (by default) or evaluates to non-zero, predefined policies objects can be used. When the macro is set to 0, predefined policies objects and make functions - without arguments, when ``make_device_policy()``, - ``make_fpga_policy()``, are not available. + without arguments (``make_device_policy()`` and ``make_fpga_policy()``) are not available. 
---------------------------------- ------------------------------ ``ONEDPL_ALLOW_DEFERRED_WAITING`` This macro allows waiting for completion of certain algorithms executed with device policies to be deferred. (Disabled by default.) + + When the macro evaluates to non-zero, a call to a oneDPL algorithm with + a device policy might return before the computation completes on the device. + + .. Warning:: Before accessing data produced or modified by the call, waiting + for completion of all tasks in the corresponding SYCL queue is required; + otherwise, the program behavior is undefined. ---------------------------------- ------------------------------ ``ONEDPL_FPGA_DEVICE`` Use this macro to build your code containing |onedpl_short| parallel algorithms for FPGA devices. (Disabled by default.) diff --git a/_sources/onedpl_gsg.rst b/_sources/onedpl_gsg.rst index 5b598c23c3..761b7d677b 100644 --- a/_sources/onedpl_gsg.rst +++ b/_sources/onedpl_gsg.rst @@ -1,217 +1,223 @@ -Get Started with the |onedpl_long| -################################## - -|onedpl_long| (|onedpl_short|) works with the -`Intel® oneAPI DPC++/C++ Compiler `_ -to provide high-productivity APIs to developers, which can minimize SYCL* -programming efforts across devices for high performance parallel applications. - -|onedpl_short| consists of the following components: - -* Parallel API -* API for SYCL Kernels -* Macros - - -For general information about |onedpl_short|, visit the `oneDPL GitHub* repository `_, -or visit the `Intel® oneAPI DPC++ Library Guide `_ -and the `Intel® oneAPI DPC++ Library main page `_. - -Quick Start -=========== - -Installation ------------- - -Visit the |onedpl_short| `Release Notes -`_ -page for: - -* Where to Find the Release -* Overview -* New Features -* Fixed Issues -* Known Issues and Limitations - -Install the `Intel® oneAPI Base Toolkit (Base Kit) `_ -to use |onedpl_short|. - -To use Parallel API, include the corresponding header files in your source code. 
- -All |onedpl_short| header files are in the ``oneapi/dpl`` directory. Use ``#include `` to include them. -|onedpl_short| uses the namespace ``oneapi::dpl`` for most its classes and functions. - -To use tested C++ standard APIs, you need to include the corresponding C++ standard header files -and use the ``std`` namespace. - -CMake Support -------------- -`CMake `_ generates build scripts which can then be used to build and link your application. |onedpl_short| can be added to your project via CMake. - -A simple example for Linux is provided below. For more detailed usage and options including details specific to Windows, please look to the `CMake Support Page `_. - -Simple Example CMake File -************************* -To use |onedpl_short| with CMake, create a CMakeLists.txt file for your project's base directory and use `find_package `_ and `target_link_libraries `_ to add oneDPL. -For example: - -.. code:: cpp - - project(Foo) - add_executable(foo foo.cpp) - - # Search to find oneDPL - find_package(oneDPL REQUIRED) - - # Connect oneDPL to foo - target_link_libraries(foo oneDPL) - -Simple Example CMake Invocation -******************************* -The following is an example CMake invocation which generates build scripts for the project in the parent directory: - -.. code:: cpp - - mkdir build && cd build - cmake -DCMAKE_CXX_COMPILER=icpx -DCMAKE_BUILD_TYPE=release .. - -Example Build Command -********************* -Once build scripts have been generated for your desired configuration following the instruction above, a `build command `_ can be issued to build your project: - -.. code:: cpp - - cmake --build . - -pkg-config Support ------------------- - -The pkg-config program is used to retrieve information about your installed libraries, and -to compile and link against one or more libraries. 
- -Use pkg-config with |onedpl_short| -********************************** - -Use pkg-config with the ``--cflags`` flag to get the include path to the oneDPL directory: - -.. code:: cpp - - icpx -fsycl foo.cpp $(pkg-config --cflags dpl) - -The ``--msvc-syntax`` flag is required when you use a Microsoft Visual C++* compiler. -This flag converts your compiling and linking flags to the appropriate form: - -.. code:: cpp - - icpx -fsycl foo.cpp $(pkg-config --msvc-syntax --cflags dpl) - -.. note:: - Use the pkg-config tool to get rid of large hard-coded paths and make compilation more portable. - - -Usage Examples --------------- - -|onedpl_short| sample code is available from the -`oneAPI GitHub samples repository `_. -Each sample includes a readme with build instructions. - -\ Header Usage Example -****************************************** - -This example illustrates |onedpl_short| random number generator usage. -The sample below shows you how to create an random number generator engine object (the source of pseudo-randomness), -a distribution object (specifying the desired probability distribution), and how to generate -the random numbers themselves. Random number generation is performed in a vectorized manner -to improve the speed of your computations. - -This example performs its computations on your default SYCL device. You can set the -``SYCL_DEVICE_TYPE`` environment variable to CPU or GPU. - -.. 
code:: cpp - - template - void random_fill(float* usmptr, std::size_t n) { - auto zero = oneapi::dpl::counting_iterator(0); - - std::for_each(oneapi::dpl::execution::dpcpp_default, - zero, zero + n/VecSize, - [usmptr](std::size_t i) { - auto offset = i * VecSize; - - oneapi::dpl::minstd_rand_vec engine(seed, offset); - oneapi::dpl::uniform_real_distribution> distr; - - auto res = distr(engine); - res.store(i, sycl::global_ptr(usmptr)); - }); - } - -Pi Benchmark Usage Example -************************** - -This example uses a Monte Carlo method to estimate the value of π. -The basic idea is to generate random points within a square, and to check what -fraction of these random points lie in a quarter-circle inscribed within that square. -The expected value is the ratio of the areas of the quarter-circle and the square (π/4). -You can take the observed fraction of points in the quarter-circle as an estimate of π/4. - -This example shows you how to create an random number generator engine object (the source of pseudo-randomness), -a distribution object (specifying the desired probability distribution), generate the -random numbers themselves, and then perform a reduction to count quantity of points that -fit into the square *S*. Random number generation is performed in scalar manner to simplify your code. - - -.. figure:: images/pi_benchmark.png - :alt: An image of pi chart. - -.. 
code:: cpp - - float estimated_pi; - { - sycl::queue q(sycl::gpu_selector_v); - auto policy = oneapi::dpl::execution::make_device_policy(q); - - float sum = std::transform_reduce( policy, - oneapi::dpl::counting_iterator(0), - oneapi::dpl::counting_iterator(N), - 0.0f, - std::plus{}, - [=](int n){ - float local_sum = 0.0f; - oneapi::dpl::minstd_rand engine(SEED, n * ITER * 2); - oneapi::dpl::uniform_real_distribution distr; - for(int i = 0; i < ITER; ++i) { - float x = distr(engine); - float y = distr(engine); - if (x * x + y * y <= 1.0) - local_sum += 1.0; - } - return local_sum / (float)ITER; - } - ); - estimated_pi = 4.0f * (float)sum / N; - } - - -Find More -========= - -.. list-table:: - :widths: 50 50 - :header-rows: 1 - - * - Resource Link - - Description - * - `Intel® oneAPI DPC++ Library Guide `_ - - Refer to the |onedpl_short| guide for more in depth information. - * - `System Requirements `_ - - Check system requirements before you install |onedpl_short|. - * - `Intel® oneAPI DPC++ Library Release Notes `_ - - Check the release notes to learn about updates in the latest release. - * - `oneDPL Samples `_ - - Learn how to use |onedpl_short| with samples. - * - `Layers for Yocto* Project `_ - - Add oneAPI components to a Yocto project build using the meta-intel layers. - * - `oneAPI Samples Catalog `_ - - Explore the complete list of oneAPI code samples in the oneAPI Samples Catalog (GitHub*). These samples were designed to help you develop, offload, and optimize multiarchitecture applications targeting CPUs, GPUs, and FPGAs. \ No newline at end of file +Get Started with the |onedpl_long| +################################## + +|onedpl_long| (|onedpl_short|) works with the |dpcpp_cpp_with_gsg_link|_ +to provide high-productivity APIs to developers, which can minimize SYCL* +programming efforts across devices for high performance parallel applications. 
+
+|onedpl_short| consists of the following components:
+
+* Parallel API
+* API for SYCL Kernels
+* Macros
+
+
+For general information about |onedpl_short|, visit the `oneDPL GitHub* repository `_,
+or visit the |onedpl_library_guide|_ and the `Intel® oneAPI DPC++ Library main page
+`_.
+
+Quick Start
+===========
+
+Installation
+------------
+
+Visit the |onedpl_short| `Release Notes
+`_
+page for:
+
+* Where to Find the Release
+* Overview
+* New Features
+* Fixed Issues
+* Known Issues and Limitations
+
+Install the `Intel® oneAPI Base Toolkit (Base Kit) `_
+to use |onedpl_short|.
+
+To use Parallel API, include the corresponding header files in your source code.
+
+All |onedpl_short| header files are in the ``oneapi/dpl`` directory. Use ``#include <oneapi/dpl/...>`` to include them.
+|onedpl_short| uses the namespace ``oneapi::dpl`` for most of its classes and functions.
+
+To use tested C++ standard APIs, you need to include the corresponding C++ standard header files
+and use the ``std`` namespace.
+
+CMake Support
+-------------
+`CMake `_ generates build scripts which can then be used
+to build and link your application. |onedpl_short| can be added to your project via CMake.
+
+A simple example for Linux is provided below. For more detailed usage and options including details specific to Windows,
+please refer to the |dpcpp_cmake_support|_.
+
+Simple Example CMake File
+*************************
+To use |onedpl_short| with CMake, create a CMakeLists.txt file for your project's base directory and use
+`find_package `_
+and `target_link_libraries `_ to add oneDPL.
+For example:
+
+.. code:: cmake
+
+   project(Foo)
+   add_executable(foo foo.cpp)
+
+   # Search to find oneDPL
+   find_package(oneDPL REQUIRED)
+
+   # Connect oneDPL to foo
+   target_link_libraries(foo oneDPL)
+
+Simple Example CMake Invocation
+*******************************
+The following is an example CMake invocation which generates build scripts for the project in the parent directory:
+
+..
 code:: bash
+
+   mkdir build && cd build
+   cmake -DCMAKE_CXX_COMPILER=icpx -DCMAKE_BUILD_TYPE=release ..
+
+Example Build Command
+*********************
+Once build scripts have been generated for your desired configuration following the instruction above, a `build command
+`_ can be issued to build your project:
+
+.. code:: bash
+
+   cmake --build .
+
+pkg-config Support
+------------------
+
+The pkg-config program is used to retrieve information about your installed libraries, and
+to compile and link against one or more libraries.
+
+Use pkg-config with |onedpl_short|
+**********************************
+
+Use pkg-config with the ``--cflags`` flag to get the include path to the oneDPL directory:
+
+.. code:: bash
+
+   icpx -fsycl foo.cpp $(pkg-config --cflags dpl)
+
+The ``--msvc-syntax`` flag is required when you use a Microsoft Visual C++* compiler.
+This flag converts your compiling and linking flags to the appropriate form:
+
+.. code:: bash
+
+   icpx -fsycl foo.cpp $(pkg-config --msvc-syntax --cflags dpl)
+
+.. note::
+   Use the pkg-config tool to get rid of large hard-coded paths and make compilation more portable.
+
+
+Usage Examples
+--------------
+
+|onedpl_short| sample code is available from the
+`oneAPI GitHub samples repository `_.
+Each sample includes a readme with build instructions.
+
+``<oneapi/dpl/random>`` Header Usage Example
+********************************************
+
+This example illustrates |onedpl_short| random number generator usage.
+The sample below shows you how to create a random number generator engine object (the source of pseudo-randomness),
+a distribution object (specifying the desired probability distribution), and how to generate
+the random numbers themselves. Random number generation is performed in a vectorized manner
+to improve the speed of your computations.
+
+This example performs its computations on your default SYCL device. You can set the
+``SYCL_DEVICE_TYPE`` environment variable to CPU or GPU.
+
+..
 code:: cpp
+
+   template <int VecSize>
+   void random_fill(float* usmptr, std::size_t n) {
+       auto zero = oneapi::dpl::counting_iterator<std::size_t>(0);
+
+       std::for_each(oneapi::dpl::execution::dpcpp_default,
+                     zero, zero + n/VecSize,
+                     [usmptr](std::size_t i) {
+                         auto offset = i * VecSize;
+
+                         oneapi::dpl::minstd_rand_vec<VecSize> engine(seed, offset);
+                         oneapi::dpl::uniform_real_distribution<sycl::vec<float, VecSize>> distr;
+
+                         auto res = distr(engine);
+                         res.store(i, sycl::global_ptr<float>(usmptr));
+                     });
+   }
+
+Pi Benchmark Usage Example
+**************************
+
+This example uses a Monte Carlo method to estimate the value of π.
+The basic idea is to generate random points within a square, and to check what
+fraction of these random points lie in a quarter-circle inscribed within that square.
+The expected value is the ratio of the areas of the quarter-circle and the square (π/4).
+You can take the observed fraction of points in the quarter-circle as an estimate of π/4.
+
+This example shows you how to create a random number generator engine object (the source of pseudo-randomness),
+a distribution object (specifying the desired probability distribution), generate the
+random numbers themselves, and then perform a reduction to count the number of points that
+fit into the square *S*. Random number generation is performed in a scalar manner to simplify your code.
+
+
+.. figure:: images/pi_benchmark.png
+   :alt: An image of a pi chart.
+
+..
 code:: cpp
+
+   float estimated_pi;
+   {
+       sycl::queue q(sycl::gpu_selector_v);
+       auto policy = oneapi::dpl::execution::make_device_policy(q);
+
+       float sum = std::transform_reduce( policy,
+                                          oneapi::dpl::counting_iterator<int>(0),
+                                          oneapi::dpl::counting_iterator<int>(N),
+                                          0.0f,
+                                          std::plus<float>{},
+                                          [=](int n){
+                                              float local_sum = 0.0f;
+                                              oneapi::dpl::minstd_rand engine(SEED, n * ITER * 2);
+                                              oneapi::dpl::uniform_real_distribution<float> distr;
+                                              for(int i = 0; i < ITER; ++i) {
+                                                  float x = distr(engine);
+                                                  float y = distr(engine);
+                                                  if (x * x + y * y <= 1.0)
+                                                      local_sum += 1.0;
+                                              }
+                                              return local_sum / (float)ITER;
+                                          }
+       );
+       estimated_pi = 4.0f * (float)sum / N;
+   }
+
+
+Find More
+=========
+
+.. list-table::
+   :widths: 50 50
+   :header-rows: 1
+
+   * - Resource Link
+     - Description
+   * - |onedpl_library_guide|_
+     - Refer to the |onedpl_short| guide for more in-depth information.
+   * - `System Requirements `_
+     - Check system requirements before you install |onedpl_short|.
+   * - `Intel® oneAPI DPC++ Library Release Notes
+       `_
+     - Check the release notes to learn about updates in the latest release.
+   * - `oneDPL Samples `_
+     - Learn how to use |onedpl_short| with samples.
+   * - |yocto_layers|_
+     - Add oneAPI components to a Yocto project build using the meta-intel layers.
+   * - `oneAPI Samples Catalog `_
+     - Explore the complete list of oneAPI code samples in the oneAPI Samples Catalog (GitHub*).
+       These samples were designed to help you develop, offload, and optimize multiarchitecture applications targeting CPUs, GPUs, and FPGAs.
\ No newline at end of file
diff --git a/_sources/parallel_api/additional_algorithms.rst b/_sources/parallel_api/additional_algorithms.rst
index 6827f7d606..5223ba8d91 100644
--- a/_sources/parallel_api/additional_algorithms.rst
+++ b/_sources/parallel_api/additional_algorithms.rst
@@ -1,147 +1,157 @@
-Additional Algorithms
-######################
-
-The definitions of the algorithms listed below are available through the ``oneapi/dpl/algorithm``
-header.
All algorithms are implemented in the ``oneapi::dpl`` namespace. - -* ``reduce_by_segment``: performs partial reductions on a sequence's values and keys. Each - reduction is computed with a given reduction operation for a contiguous subsequence of values, which are - determined by keys being equal according to a predicate. A return value is a pair of iterators holding - the end of the output sequences for keys and values. - - For correct computation, the reduction operation should be associative. If no operation is specified, - the default operation for the reduction is ``std::plus``, and the default predicate is ``std::equal_to``. - The algorithm requires that the type of the elements used for values be default constructible. For example:: - - keys: [0,0,0,1,1,1] - values: [1,2,3,4,5,6] - output_keys: [0,1] - output_values: [1+2+3=6,4+5+6=15] - -* ``inclusive_scan_by_segment``: performs partial prefix scans on a sequence's values. Each - scan applies to a contiguous subsequence of values, which are determined by the keys associated with the - values being equal. The return value is an iterator targeting the end of the result sequence. - - For correct computation, the prefix scan operation should be associative. If no operation is specified, - the default operation is ``std::plus``, and the default predicate is ``std::equal_to``. The algorithm - requires that the type of the elements used for values be default constructible. For example:: - - keys: [0,0,0,1,1,1] - values: [1,2,3,4,5,6] - result: [1,1+2=3,1+2+3=6,4,4+5=9,4+5+6=15] - -* ``exclusive_scan_by_segment``: performs partial prefix scans on a sequence's values. Each - scan applies to a contiguous subsequence of values that are determined by the keys associated with the values - being equal, and sets the first element to the initial value provided. The return value is an iterator - targeting the end of the result sequence. - - For correct computation, the prefix scan operation should be associative. 
If no operation is specified, - the default operation is ``std::plus``, and the default predicate is ``std::equal_to``. For example:: - - keys: [0,0,0,1,1,1] - values: [1,2,3,4,5,6] - initial value: [0] - result: [0,0+1=1,0+1+2=3,0,0+4=4,0+4+5=9] - -* ``binary_search``: performs a binary search of the input sequence for each of the values in - the search sequence provided. For each element of the search sequence the algorithm writes a boolean value - to the result sequence that indicates whether the search value was found in the input sequence. An iterator - to one past the last value in the result sequence is returned. The algorithm assumes the input sequence has - been sorted by the comparator provided. If no comparator is provided, then a function object that uses - ``operator<`` to compare the elements is used. For example:: - - input sequence: [0, 2, 2, 2, 3, 3, 3, 3, 6, 6] - search sequence: [0, 2, 4, 7, 6] - result sequence: [true, true, false, false, true] - -* ``lower_bound``: performs a binary search of the input sequence for each of the values in - the search sequence provided to identify the lowest index in the input sequence where the search value could - be inserted without violating the sorted ordering of the input sequence. The lowest index for each search - value is written to the result sequence, and the algorithm returns an iterator to one past the last value - written to the result sequence. If no comparator is provided, then a function object that uses ``operator<`` - to compare the elements is used. For example:: - - input sequence: [0, 2, 2, 2, 3, 3, 3, 3, 6, 6] - search sequence: [0, 2, 4, 7, 6] - result sequence: [0, 1, 8, 10, 8] - -* ``upper_bound``: performs a binary search of the input sequence for each of the values in - the search sequence provided to identify the highest index in the input sequence where the search value could - be inserted without violating the sorted ordering of the input sequence. 
The highest index for each search - value is written to the result sequence, and the algorithm returns an iterator to one past the last value - written to the result sequence. If no comparator is provided, then a function object that uses ``operator<`` - to compare the elements is used. For example:: - - input sequence: [0, 2, 2, 2, 3, 3, 3, 3, 6, 6] - search sequence: [0, 2, 4, 7, 6] - result sequence: [1, 4, 8, 10, 10] - -* ``sort_by_key``: performs a stable key-value sort. The algorithm sorts the sequence's keys according to - a comparioson operator. If no comparator is provided, then the elements are compared with ``operator<``. - The sequence's values are permutated according to the sorted sequence's keys. The prerequisite for correct - behavior is that the size for both keys sequence and values sequence shall be the same. - For example:: - - keys: [3, 5, 0, 4, 3, 0] - values: ['a', 'b', 'c', 'd', 'e', 'f'] - output_keys: [0, 0, 3, 3, 4, 5] - output_values: ['c', 'f', 'a', 'e', 'd', 'b'] - -* ``transform_if``: performs a transform on the input sequence(s) elements and stores the result into the - corresponding position in the output sequence at each position for which the predicate applied to the - element(s) evaluates to ``true``. If the predicate evaluates to ``false``, the transform is not applied for - the elements(s), and the output sequence's corresponding position is left unmodified. There are two overloads - of this function, one for a single input sequence with a unary transform and a unary predicate, and another - for two input sequences and a binary transform and a binary predicate. 
- - Unary example:: - - unary predicate: [](auto i){return i % 2 == 0;} // is even - unary transform: [](auto i){return i * 2;} // double element - input sequence: [0, 1, 2, 3, 3, 3, 4, 4, 7, 6] - original output sequence: [9, 8, 7, 6, 5, 4, 3, 2, 1, 0] - final output sequence: [0, 8, 4, 6, 5, 4, 8, 8, 1, 12] - - - Binary example:: - - binary predicate: [](auto a, auto b){return a == b;} // are equal - unary transform: [](auto a, auto b){return a + b;} // sum values - input sequence1: [0, 1, 2, 3, 3, 3, 4, 4, 7, 6] - input sequence2: [5, 1, 3, 4, 3, 3, 4, 4, 7, 9] - original output sequence: [9, 9, 9, 9, 9, 9, 9, 9, 9, 9] - final output sequence: [9, 2, 9, 9, 6, 6, 8, 8, 14, 9] - -* ``histogram``: performs a histogram on a sequence of of input elements. Histogram counts the number of - elements which map to each of a defined set of bins. The algorithm has two overloads. - - The first overload takes as input the number of bins, range minimum, and range maximum, then evenly - divides bins within that range. An input element ``a`` maps to a bin ``i`` such that - ``i = floor((a - minimum) / ((maximum - minimum) / num_bins)))``. - - The other overload defines ``m`` bins from a sorted sequence of ``m + 1`` user-provided boundaries - where an input element ``a`` maps to a bin ``i`` if and only if - ``__boundary_first[i] <= a < __boundary_first[i + 1]``. - - Input values which do not map to a defined bin are skipped silently. The algorithm counts the number of - input elements which map to each bin and outputs the result to a user-provided sequence of ``m`` output - bin counts. The user must provide sufficient output data to store each bin, and the type of the output - sequence must be sufficient to store the counts of the histogram without overflow. All input and output - sequences must be ``RandomAccessIterators``. Histogram currently only supports execution with device - policies. 
- - Evenly divided bins example:: - - inputs: [9, 9, 3, 8, 4, 4, 4, 5, 1, 99] - num_bins: 5 - min: 0 - max: 10 - output: [1, 1, 4, 0 3] - - Custom range bins example:: - - inputs: [9, 9, 3, 8, 4, 4, 4, 5, 1, 99] - boundaries: [-1, 0, 8, 12] - output: [0, 6, 3] - - +Additional Algorithms +###################### + +The definitions of the algorithms listed below are available through the ```` +header. All algorithms are implemented in the ``oneapi::dpl`` namespace. + +* ``reduce_by_segment``: performs partial reductions on a sequence's values and keys. Each + reduction is computed with a given reduction operation for a contiguous subsequence of values, which are + determined by keys being equal according to a predicate. A return value is a pair of iterators holding + the end of the output sequences for keys and values. + + For correct computation, the reduction operation should be associative. If no operation is specified, + the default operation for the reduction is ``std::plus``, and the default predicate is ``std::equal_to``. + The algorithm requires that the type of the elements used for values be default constructible. For example:: + + keys: [0,0,0,1,1,1] + values: [1,2,3,4,5,6] + output_keys: [0,1] + output_values: [1+2+3=6,4+5+6=15] + +* ``inclusive_scan_by_segment``: performs partial prefix scans on a sequence's values. Each + scan applies to a contiguous subsequence of values, which are determined by the keys associated with the + values being equal. The return value is an iterator targeting the end of the result sequence. + + For correct computation, the prefix scan operation should be associative. If no operation is specified, + the default operation is ``std::plus``, and the default predicate is ``std::equal_to``. The algorithm + requires that the type of the elements used for values be default constructible. 
For example:: + + keys: [0,0,0,1,1,1] + values: [1,2,3,4,5,6] + result: [1,1+2=3,1+2+3=6,4,4+5=9,4+5+6=15] + +* ``exclusive_scan_by_segment``: performs partial prefix scans on a sequence's values. Each + scan applies to a contiguous subsequence of values that are determined by the keys associated with the values + being equal, and sets the first element to the initial value provided. The return value is an iterator + targeting the end of the result sequence. + + For correct computation, the prefix scan operation should be associative. If no operation is specified, + the default operation is ``std::plus``, and the default predicate is ``std::equal_to``. For example:: + + keys: [0,0,0,1,1,1] + values: [1,2,3,4,5,6] + initial value: [0] + result: [0,0+1=1,0+1+2=3,0,0+4=4,0+4+5=9] + +* ``binary_search``: performs a binary search of the input sequence for each of the values in + the search sequence provided. For each element of the search sequence the algorithm writes a boolean value + to the result sequence that indicates whether the search value was found in the input sequence. An iterator + to one past the last value in the result sequence is returned. The algorithm assumes the input sequence has + been sorted by the comparator provided. If no comparator is provided, then a function object that uses + ``operator<`` to compare the elements is used. For example:: + + input sequence: [0, 2, 2, 2, 3, 3, 3, 3, 6, 6] + search sequence: [0, 2, 4, 7, 6] + result sequence: [true, true, false, false, true] + +* ``lower_bound``: performs a binary search of the input sequence for each of the values in + the search sequence provided to identify the lowest index in the input sequence where the search value could + be inserted without violating the sorted ordering of the input sequence. The lowest index for each search + value is written to the result sequence, and the algorithm returns an iterator to one past the last value + written to the result sequence. 
If no comparator is provided, then a function object that uses ``operator<`` + to compare the elements is used. For example:: + + input sequence: [0, 2, 2, 2, 3, 3, 3, 3, 6, 6] + search sequence: [0, 2, 4, 7, 6] + result sequence: [0, 1, 8, 10, 8] + +* ``upper_bound``: performs a binary search of the input sequence for each of the values in + the search sequence provided to identify the highest index in the input sequence where the search value could + be inserted without violating the sorted ordering of the input sequence. The highest index for each search + value is written to the result sequence, and the algorithm returns an iterator to one past the last value + written to the result sequence. If no comparator is provided, then a function object that uses ``operator<`` + to compare the elements is used. For example:: + + input sequence: [0, 2, 2, 2, 3, 3, 3, 3, 6, 6] + search sequence: [0, 2, 4, 7, 6] + result sequence: [1, 4, 8, 10, 10] + +* ``sort_by_key``: performs a key-value sort. + The algorithm sorts a sequence of keys using a given comparison function object. + If it is not provided, the elements are compared with ``operator<``. + A sequence of values is simultaneously permuted according to the sorted order of keys. + There must be at least as many values as the keys, otherwise the behavior is undefined. + + For example:: + + keys: [3, 5, 0, 4, 3, 0] + values: ['a', 'b', 'c', 'd', 'e', 'f'] + output_keys: [0, 0, 3, 3, 4, 5] + output_values: ['c', 'f', 'a', 'e', 'd', 'b'] + +.. note:: + ``sort_by_key`` currently implements a stable sort for device execution policies, + but may implement an unstable sort in the future. + Use ``stable_sort_by_key`` if stability is essential. + +* ``stable_sort_by_key``: performs a key-value sort similar to ``sort_by_key``, + but with the added guarantee of stability. 
+
+* ``transform_if``: performs a transform on the input sequence(s) elements and stores the result into the
+  corresponding position in the output sequence at each position for which the predicate applied to the
+  element(s) evaluates to ``true``. If the predicate evaluates to ``false``, the transform is not applied for
+  the element(s), and the output sequence's corresponding position is left unmodified. There are two overloads
+  of this function, one for a single input sequence with a unary transform and a unary predicate, and another
+  for two input sequences and a binary transform and a binary predicate.
+
+  Unary example::
+
+    unary predicate: [](auto i){return i % 2 == 0;} // is even
+    unary transform: [](auto i){return i * 2;} // double element
+    input sequence:           [0, 1, 2, 3, 3, 3, 4, 4, 7, 6]
+    original output sequence: [9, 8, 7, 6, 5, 4, 3, 2, 1, 0]
+    final output sequence:    [0, 8, 4, 6, 5, 4, 8, 8, 1, 12]
+
+
+  Binary example::
+
+    binary predicate: [](auto a, auto b){return a == b;} // are equal
+    binary transform: [](auto a, auto b){return a + b;} // sum values
+    input sequence1:          [0, 1, 2, 3, 3, 3, 4, 4, 7, 6]
+    input sequence2:          [5, 1, 3, 4, 3, 3, 4, 4, 7, 9]
+    original output sequence: [9, 9, 9, 9, 9, 9, 9, 9, 9, 9]
+    final output sequence:    [9, 2, 9, 9, 6, 6, 8, 8, 14, 9]
+
+* ``histogram``: performs a histogram on a sequence of input elements. Histogram counts the number of
+  elements which map to each of a defined set of bins. The algorithm has two overloads.
+
+  The first overload takes as input the number of bins, range minimum, and range maximum, then evenly
+  divides bins within that range. An input element ``a`` maps to a bin ``i`` such that
+  ``i = floor((a - minimum) / ((maximum - minimum) / num_bins))``.
+
+  The other overload defines ``m`` bins from a sorted sequence of ``m + 1`` user-provided boundaries
+  where an input element ``a`` maps to a bin ``i`` if and only if
+  ``__boundary_first[i] <= a < __boundary_first[i + 1]``.
+
+  Input values which do not map to a defined bin are skipped silently. The algorithm counts the number of
+  input elements which map to each bin and outputs the result to a user-provided sequence of ``m`` output
+  bin counts. The user must provide sufficient output data to store each bin, and the type of the output
+  sequence must be sufficient to store the counts of the histogram without overflow. All input and output
+  sequences must be ``RandomAccessIterators``. Histogram currently only supports execution with device
+  policies.
+
+  Evenly divided bins example::
+
+    inputs:   [9, 9, 3, 8, 4, 4, 4, 5, 1, 99]
+    num_bins: 5
+    min:      0
+    max:      10
+    output:   [1, 1, 4, 0, 3]
+
+  Custom range bins example::
+
+    inputs:     [9, 9, 3, 8, 4, 4, 4, 5, 1, 99]
+    boundaries: [-1, 0, 8, 12]
+    output:     [0, 6, 3]
+
+
diff --git a/_sources/parallel_api/async_api.rst b/_sources/parallel_api/async_api.rst
index d6e6f77fe1..242b30c92a 100644
--- a/_sources/parallel_api/async_api.rst
+++ b/_sources/parallel_api/async_api.rst
@@ -1,5 +1,5 @@
-Asynchronous API Algorithms
-###########################
+Asynchronous Algorithms
+#######################
 
 The functions defined in the STL ```` or ```` headers are traditionally blocking. |onedpl_long|
 (|onedpl_short|) extends the functionality of the C++17 parallel algorithms by providing asynchronous
 algorithms with non-blocking behavior.
@@ -55,19 +55,16 @@ Example of Async API Usage #include int main() { - using namespace oneapi; - { - /* Build and compute a simple dependency chain: Fill buffer -> Transform -> Reduce */ - sycl::buffer a{10}; - - auto fut1 = dpl::experimental::fill_async(dpl::execution::dpcpp_default, - dpl::begin(a),dpl::end(a),7); - - auto fut2 = dpl::experimental::transform_async(dpl::execution::dpcpp_default, - dpl::begin(a),dpl::end(a),dpl::begin(a), - [&](const int& x){return x + 1; },fut1); - auto ret_val = dpl::experimental::reduce_async(dpl::execution::dpcpp_default, - dpl::begin(a),dpl::end(a),fut1,fut2).get(); - } + /* Build and compute a simple dependency chain: Fill buffer -> Transform -> Reduce */ + sycl::buffer a{10}; + + auto fut1 = dpl::experimental::fill_async(dpl::execution::dpcpp_default, + dpl::begin(a),dpl::end(a),7); + + auto fut2 = dpl::experimental::transform_async(dpl::execution::dpcpp_default, + dpl::begin(a),dpl::end(a),dpl::begin(a), + [&](const int& x){return x + 1; },fut1); + auto ret_val = dpl::experimental::reduce_async(dpl::execution::dpcpp_default, + dpl::begin(a),dpl::end(a),fut1,fut2).get(); return 0; } diff --git a/_sources/parallel_api/execution_policies.rst b/_sources/parallel_api/execution_policies.rst index ad922c04f2..a5188446d4 100644 --- a/_sources/parallel_api/execution_policies.rst +++ b/_sources/parallel_api/execution_policies.rst @@ -1,68 +1,70 @@ Execution Policies ################## -The implementation supports the device execution policies used to run the massive parallel -computational model for heterogeneous systems. The policies are specified in -the |onedpl_long| (|onedpl_short|) section of the `oneAPI Specification -`_. - -For any of the implemented algorithms, pass one of the execution policy objects as the first -argument in a call to specify the desired execution behavior. 
The policies have -the following meaning: - -================================= ============================== -Execution Policy Value Description -================================= ============================== -``seq`` Sequential execution. ---------------------------------- ------------------------------ -``unseq`` Unsequenced SIMD execution. This policy requires that - all functions provided are SIMD-safe. ---------------------------------- ------------------------------ -``par`` Parallel execution by multiple threads. ---------------------------------- ------------------------------ -``par_unseq`` Combined effect of ``unseq`` and ``par``. ---------------------------------- ------------------------------ -``dpcpp_default`` Massive parallel execution on devices using |dpcpp_short|. ---------------------------------- ------------------------------ -``dpcpp_fpga`` Massive parallel execution on FPGA devices. -================================= ============================== +According to `the oneAPI specification +`_, +|onedpl_long| (|onedpl_short|) provides execution policies semantically aligned with the C++ standard, +referred to as *standard-aligned* or *host execution policies*, as well as *device execution policies* +to run data parallel computations on heterogeneous systems. + +The execution policies are defined in the ``oneapi::dpl::execution`` namespace and provided +in the ```` header. The policies have the following meaning: + +====================== ===================================================== +Policy Name / Type Description +====================== ===================================================== +``seq`` The standard-aligned policy for sequential execution. +---------------------- ----------------------------------------------------- +``unseq`` The standard-aligned policy for possible unsequenced SIMD execution. + This policy requires user-provided functions to be SIMD-safe. 
+---------------------- ----------------------------------------------------- +``par`` The standard-aligned policy for possible parallel execution by multiple threads. +---------------------- ----------------------------------------------------- +``par_unseq`` The standard-aligned policy with the combined effect of ``unseq`` and ``par``. +---------------------- ----------------------------------------------------- +``device_policy`` The class template to create device policies for data parallel execution. +---------------------- ----------------------------------------------------- +``dpcpp_default`` The device policy for data parallel execution on the default SYCL device. +---------------------- ----------------------------------------------------- +``fpga_policy`` The class template to create policies for execution on FPGA devices. +---------------------- ----------------------------------------------------- +``dpcpp_fpga`` The device policy for data parallel execution on a SYCL FPGA device. +====================== ===================================================== The implementation is based on Parallel STL from the `LLVM Project `_. |onedpl_short| supports two parallel backends for execution with ``par`` and ``par_unseq`` policies: -#. TBB backend (enabled by default) uses |onetbb_long| or |tbb_long| for parallel execution. +#. The TBB backend (enabled by default) uses |onetbb_long| or |tbb_long| for parallel execution. -#. OpenMP backend uses OpenMP* pragmas for parallel execution. Visit +#. The OpenMP backend uses OpenMP* pragmas for parallel execution. Visit :doc:`Macros <../macros>` for the information how to enable the OpenMP backend. +OpenMP pragmas are also used for SIMD execution with ``unseq`` and ``par_unseq`` policies. + Follow these steps to add Parallel API to your application: #. Add ``#include `` to your code. Then include one or more of the following header files, depending on the algorithms you intend to use: - #. ``#include `` - #. 
``#include `` - #. ``#include `` - - For better coexistence with the C++ standard library, - include |onedpl_short| header files before the standard C++ ones. + - ``#include `` + - ``#include `` + - ``#include `` -#. Pass a |onedpl_short| execution policy object, defined in the ``oneapi::dpl::execution`` - namespace, to a parallel algorithm. -#. Use the C++ standard execution policies: +#. Pass a |onedpl_short| execution policy object as the first argument to a parallel algorithm + to indicate the desired execution behavior. - #. Compile the code with options that enable OpenMP parallelism and/or vectorization pragmas. - #. Link with the |onetbb_long| or |tbb_long| dynamic library for TBB-based parallelism. +#. If you use the standard-aligned execution policies: -#. Use the device execution policies: + - Compile the code with options that enable OpenMP parallelism and/or SIMD vectorization pragmas. + - Compile and link with the |onetbb_short| or |tbb_short| library for TBB-based parallelism. - #. Compile the code with options that enable support for SYCL 2020. + If you use the device execution policies, compile the code with options that enable support for SYCL 2020. -Use the C++ Standard Execution Policies -======================================= +Use the C++ Standard Aligned Execution Policies +=============================================== Example: @@ -80,12 +82,10 @@ Example: } Use the Device Execution Policies -======================================== +================================= -The device execution policy specifies where a parallel algorithm runs. -It encapsulates a SYCL device or queue and allows you to -set an optional kernel name. Device execution policies can be used with all -standard C++ algorithms that support execution policies. +The device execution policy specifies where a |onedpl_short| parallel algorithm runs. +It encapsulates a SYCL device or queue and allows you to set an optional kernel name. 
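As an illustrative sketch of creating such policies (assuming the ``oneapi::dpl::execution::make_device_policy`` helper; the queue, selector, and kernel name here are illustrative, and the snippet requires a SYCL toolchain to compile):

```cpp
#include <oneapi/dpl/execution>
#include <sycl/sycl.hpp>

// A device policy wrapping an existing SYCL queue;
// class my_kernel is an illustrative kernel name.
sycl::queue q{sycl::default_selector_v};
auto policy_from_queue =
    oneapi::dpl::execution::make_device_policy<class my_kernel>(q);

// A device policy wrapping a SYCL device directly.
auto policy_from_device =
    oneapi::dpl::execution::make_device_policy(sycl::device{sycl::default_selector_v});
```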
To create a policy object, you may use one of the following constructor arguments: @@ -100,8 +100,8 @@ names for SYCL kernel functions. The |dpcpp_cpp| supports it by default; for other compilers it may need to be enabled with compilation options such as ``-fsycl-unnamed-lambda``. Refer to your compiler documentation for more information. -The ``oneapi::dpl::execution::dpcpp_default`` object is a predefined object of -the ``device_policy`` class. It is created with a default kernel name and a default queue. +The ``oneapi::dpl::execution::dpcpp_default`` object is a predefined immutable object of +the ``device_policy`` class. It is created with a default kernel name and uses a default queue. Use it to construct customized policy objects or pass directly when invoking an algorithm. If ``dpcpp_default`` is passed directly to more than one algorithm, you must ensure that the @@ -117,8 +117,8 @@ and ``using namespace sycl;`` directives when referring to policy classes and fu .. code:: cpp - auto policy_a = device_policy {}; - std::for_each(policy_a, ...); + auto policy_a = device_policy {}; + std::for_each(policy_a, ...); .. code:: cpp @@ -167,18 +167,16 @@ The default constructor of ``fpga_policy`` wraps a SYCL queue created for ``fpga_selector``, or for ``fpga_emulator_selector`` if the ``ONEDPL_FPGA_EMULATOR`` is defined. -``oneapi::dpl::execution::dpcpp_fpga`` is a predefined object of +``oneapi::dpl::execution::dpcpp_fpga`` is a predefined immutable object of the ``fpga_policy`` class created with a default unroll factor and a default kernel name. Use it to create customized policy objects or pass directly when invoking an algorithm. .. Note:: Specifying the unroll factor for a policy enables loop unrolling in the implementation of - your algorithms. The default value is 1. - To find out how to choose a more precise value, refer to the `unroll Pragma `_ - and `Loop Analysis `_ content in - the `Intel® oneAPI FPGA Handbook - `_. + |onedpl_short| algorithms. 
The default value is 1. + To find out how to choose a more precise value, refer to the |unroll_pragma|_ + and |loop_analysis|_ content in the |fpga_handbook|_. The ``make_fpga_policy`` function templates simplify ``fpga_policy`` creation. @@ -197,10 +195,10 @@ The code below assumes you have added ``using namespace oneapi::dpl::execution;` Error Handling with Device Execution Policies -==================================================== +============================================= -The SYCL error handling model supports two types of errors: Synchronous errors cause the SYCL host -runtime libraries throw exceptions. Asynchronous errors may only be processed in a user-supplied error handler +The SYCL error handling model supports two types of errors. Synchronous errors cause the SYCL API functions +to throw exceptions. Asynchronous errors may only be processed in a user-supplied error handler associated with a SYCL queue. For algorithms executed with device policies, handling all errors, synchronous or asynchronous, is a @@ -213,4 +211,4 @@ responsibility of the caller. Specifically: To process SYCL asynchronous errors, the queue associated with a device policy must be created with an error handler object. The predefined policy objects (``dpcpp_default``, etc.) have -no error handlers; do not use them if you need to process asynchronous errors. \ No newline at end of file +no error handlers; do not use them if you need to process asynchronous errors. diff --git a/_sources/parallel_api/iterators.rst b/_sources/parallel_api/iterators.rst index 13884eafa2..c67c9da2b4 100644 --- a/_sources/parallel_api/iterators.rst +++ b/_sources/parallel_api/iterators.rst @@ -1,19 +1,20 @@ Iterators ######### -The definitions of the iterators are available through the ``oneapi/dpl/iterator`` +The definitions of the iterators are available through the ```` header. All iterators are implemented in the ``oneapi::dpl`` namespace. 
* ``counting_iterator``: a random-access iterator-like type whose dereferenced value is an integer counter.
   Instances of a ``counting_iterator`` provide read-only dereference operations. The counter of a
-  ``counting_iterator`` instance changes according to the arithmetic of the random-access iterator type::
+  ``counting_iterator`` instance changes according to the arithmetic of the random-access iterator type:
+
+  .. code:: cpp
 
-     using namespace oneapi;
      dpl::counting_iterator<int> count_a(0);
      dpl::counting_iterator<int> count_b = count_a + 10;
      int init = count_a[0]; // OK: init == 0
      *count_b = 7; // ERROR: counting_iterator does not provide write operations
-     auto sum = std::reduce(dpl::execution::dpcpp_default,
+     auto sum = dpl::reduce(dpl::execution::dpcpp_default,
                             count_a, count_b, init); // sum is (0 + 0 + 1 + ... + 9) = 45
 
 * ``zip_iterator``: an iterator constructed with one or more iterators as input. The result of
@@ -26,20 +27,22 @@ header. All iterators are implemented in the ``oneapi::dpl`` namespace.
 
   The ``zip_iterator`` is useful in defining by key algorithms where input iterators representing keys
   and values are processed as key-value pairs. The example below demonstrates a stable sort
-  by key, where only the keys are compared but both keys and values are swapped::
+  by key, where only the keys are compared but both keys and values are swapped:
+
+  .. code:: cpp
 
-     using namespace oneapi;
      auto zipped_begin = dpl::make_zip_iterator(keys_begin, vals_begin);
-     std::stable_sort(dpl::execution::dpcpp_default, zipped_begin, zipped_begin + n,
+     dpl::stable_sort(dpl::execution::dpcpp_default, zipped_begin, zipped_begin + n,
                       [](auto lhs, auto rhs) { return get<0>(lhs) < get<0>(rhs); });
 
   The dereferenced object of ``zip_iterator`` supports the *structured binding* feature
   (`C++17 and above `_) for easier access to
-  wrapped iterators values::
+  wrapped iterator values:
+
+  ..
code:: cpp - using namespace oneapi; auto zipped_begin = dpl::make_zip_iterator(sequence1.begin(), sequence2.begin(), sequence3.begin()); - auto found = std::find(dpl::execution::dpcpp_default, zipped_begin, zipped_begin + n, + auto found = dpl::find(dpl::execution::dpcpp_default, zipped_begin, zipped_begin + n, [](auto tuple_like_obj) { auto [e1, e2, e3] = tuple_like_obj; return e1 == e2 && e1 == e3; @@ -57,11 +60,12 @@ header. All iterators are implemented in the ``oneapi::dpl`` namespace. The ``discard_iterator`` is useful in the implementation of stencil algorithms where the stencil is not part of the desired output. An example of this would be a ``copy_if`` algorithm that receives an input iterator range, a stencil iterator range, and copies the elements of the input whose corresponding stencil value is 1. Use - ``discard_iterator`` so you do not declare a temporary allocation to store the copy of the stencil:: + ``discard_iterator`` so you do not declare a temporary allocation to store the copy of the stencil: + + .. code:: cpp - using namespace oneapi; auto zipped_first = dpl::make_zip_iterator(first, stencil); - std::copy_if(dpl::execution::dpcpp_default, + dpl::copy_if(dpl::execution::dpcpp_default, zipped_first, zipped_first + (last - first), dpl::make_zip_iterator(result, dpl::discard_iterator()), [](auto t){return get<1>(t) == 1;} @@ -87,14 +91,15 @@ header. All iterators are implemented in the ``oneapi::dpl`` namespace. To simplify the construction of the iterator, ``oneapi::dpl::make_transform_iterator`` is provided. The function receives the base iterator and transform operation instance as arguments, and constructs the - ``transform_iterator`` instance:: + ``transform_iterator`` instance: + + .. 
code:: cpp - using namespace oneapi; dpl::counting_iterator first(0); dpl::counting_iterator last(10); auto transform_first = dpl::make_transform_iterator(first, std::negate()); auto transform_last = transform_first + (last - first); - auto sum = std::reduce(dpl::execution::dpcpp_default, + auto sum = dpl::reduce(dpl::execution::dpcpp_default, transform_first, transform_last); // sum is (0 + -1 + ... + -9) = -45 * ``permutation_iterator``: an iterator whose dereferenced value set is defined by the source iterator @@ -106,7 +111,9 @@ header. All iterators are implemented in the ``oneapi::dpl`` namespace. in cases where algorithms are executed with device policies. The ``make_permutation_iterator`` is provided to simplify construction of iterator instances. The function - receives the source iterator and the iterator or function object representing the index map:: + receives the source iterator and the iterator or function object representing the index map: + + .. code:: cpp struct multiply_index_by_two { template @@ -118,7 +125,6 @@ header. All iterators are implemented in the ``oneapi::dpl`` namespace. 
// compute the number of elements in the range between the first and last that are accessed
      // by the permutation iterator
      size_t num_elements = std::distance(first, last) / 2 + std::distance(first, last) % 2;
-     using namespace oneapi;
      auto permutation_first = dpl::make_permutation_iterator(first, multiply_index_by_two());
      auto permutation_last = permutation_first + num_elements;
-     std::copy(dpl::execution::dpcpp_default, permutation_first, permutation_last, result);
+     dpl::copy(dpl::execution::dpcpp_default, permutation_first, permutation_last, result);
diff --git a/_sources/parallel_api/parallel_range_algorithms.rst b/_sources/parallel_api/parallel_range_algorithms.rst
new file mode 100644
index 0000000000..f0356f71e2
--- /dev/null
+++ b/_sources/parallel_api/parallel_range_algorithms.rst
@@ -0,0 +1,111 @@
+Parallel Range Algorithms
+#########################
+
+C++20 introduces the `Ranges library `_ and
+`range algorithms `_ as a modern paradigm for expressing
+generic operations on data sequences.
+
+|onedpl_long| (|onedpl_short|) extends them with *parallel range algorithms*, which can be used with the standard range
+classes to leverage the |onedpl_short| capabilities for parallel execution on both the host computer and data parallel devices.
+
+|onedpl_short| supports only random access ranges, because they allow simultaneous constant-time access to elements
+at any position in the range. This enables efficient workload distribution among multiple threads or processing units,
+which is essential for achieving high performance in parallel execution.
+
+.. Note::
+
+   The use of parallel range algorithms requires C++20 and the C++ standard libraries shipped with GCC 10 (or higher),
+   Clang 16 (or higher), and Microsoft* Visual Studio* 2019 16.10 (or higher).
+
+Supported Range Views
+---------------------
+
+`Views `_ are lightweight ranges typically used to describe
+data transformation pipelines.
The C++20 standard defines two categories of standard range views, called +*factories* and *adaptors*: + +* A range factory generates its data elements on access via an index or an iterator to the range. +* A range adaptor transforms its underlying data range(s) or view(s) into a new view with modified behavior. + +The following C++ standard random access adaptors and factories can be used with the |onedpl_short| +parallel range algorithms: + +* ``std::ranges::views::all``: A range adaptor that returns a view that includes all elements of a range + (only with standard-aligned execution policies). +* ``std::ranges::subrange``: A utility that produces a view from an iterator and a sentinel or from a range. +* ``std::span``: A view to a contiguous data sequence. +* ``std::ranges::iota_view``: A range factory that generates a sequence of elements by repeatedly incrementing + an initial value. +* ``std::ranges::single_view``: A view that contains exactly one element of a specified value. +* ``std::ranges::transform_view``: A range adaptor that produces a view that applies a transformation to each element + of another view. +* ``std::ranges::reverse_view``: A range adaptor that produces a reversed sequence of elements provided by another view. +* ``std::ranges::take_view``: A range adaptor that produces a view of the first N elements from another view. +* ``std::ranges::drop_view``: A range adaptor that produces a view excluding the first N elements from another view. + +Visit :doc:`pass_data_algorithms` for more information, especially on the :ref:`use of range views ` +with device execution policies. + +Supported Algorithms +-------------------- + +The ```` header defines the parallel range algorithms in the ``namespace oneapi::dpl::ranges``. +All algorithms work with both standard-aligned (host) and device execution policies. + +The ``ONEDPL_HAS_RANGE_ALGORITHMS`` :ref:`feature macro ` may be used to test for the presence of +parallel range algorithms. + +.. 
_range-algorithms-202409L: + +If ``ONEDPL_HAS_RANGE_ALGORITHMS`` is defined to ``202409L`` or a greater value, the following algorithms are provided: + +* ``for_each`` +* ``transform`` +* ``find`` +* ``find_if`` +* ``find_if_not`` +* ``adjacent_find`` +* ``all_of`` +* ``any_of`` +* ``none_of`` +* ``search`` +* ``search_n`` +* ``count`` +* ``count_if`` +* ``equal`` +* ``sort`` +* ``stable_sort`` +* ``is_sorted`` +* ``min_element`` +* ``max_element`` +* ``copy`` +* ``copy_if`` +* ``merge`` + +Usage Example for Parallel Range Algorithms +------------------------------------------- + +.. code:: cpp + + { + std::vector<int> vec_in = {0, 1, 2, 3, 4, 5, 6, 7, 8, 9}; + std::vector<int> vec_out(vec_in.size()); + + auto view_in = std::ranges::views::all(vec_in) | std::ranges::views::reverse; + oneapi::dpl::ranges::copy(oneapi::dpl::execution::par, view_in, vec_out); + } + { + using usm_shared_allocator = sycl::usm_allocator<int, sycl::usm::alloc::shared>; + // Allocate for the queue used by the execution policy + usm_shared_allocator alloc{oneapi::dpl::execution::dpcpp_default.queue()}; + + std::vector<int, usm_shared_allocator> vec_in{{0, 1, 2, 3, 4, 5, 6, 7, 8, 9}, alloc}; + std::vector<int, usm_shared_allocator> vec_out(vec_in.size(), alloc); + + auto view_in = std::ranges::subrange(vec_in.begin(), vec_in.end()) | std::ranges::views::reverse; + oneapi::dpl::ranges::copy(oneapi::dpl::execution::dpcpp_default, view_in, std::span(vec_out)); + } + +.. rubric:: See also: + +:doc:`range_based_api` diff --git a/_sources/parallel_api/pass_data_algorithms.rst b/_sources/parallel_api/pass_data_algorithms.rst index 4c0ec8a4ca..5d3a0b32b5 100644 --- a/_sources/parallel_api/pass_data_algorithms.rst +++ b/_sources/parallel_api/pass_data_algorithms.rst @@ -1,20 +1,34 @@ Pass Data to Algorithms ####################### -When using the C++ standard execution policies, oneDPL supports data being passed to its algorithms as specified -in the ISO/IEC 14882:2017 standard (commonly called C++17).
According to the standard, the calling code -must prevent data races when using algorithms with parallel execution policies. - -Note: Implementations of ``std::vector<bool>`` are not required to avoid data races for concurrent modifications -of vector elements. Some implementations may optimize multiple ``bool`` elements into a bitfield, making it unsafe -for multithreading. For this reason, it is recommended to avoid ``std::vector<bool>`` for anything but a read-only -input with the C++ standard execution policies. - -When using a device execution policy, you can use one of the following ways to pass data to an algorithm: - -* ``oneapi:dpl::begin`` and ``oneapi::dpl::end`` functions -* Unified shared memory (USM) pointers -* ``std::vector`` with or without a USM allocator +For an algorithm to access data, it is important that the execution policy used matches the data storage type. +The following table shows which execution policies can be used with various data storage types. + +================================================ ========================== ============= +Data Storage Device Policies Host Policies +================================================ ========================== ============= +`SYCL buffer`_ Yes No +Device-allocated `unified shared memory`_ (USM) Yes No +Shared and host-allocated USM Yes Yes +``std::vector`` with ``sycl::usm_allocator`` Yes Yes +``std::vector`` with an ordinary allocator See :ref:`use-std-vector` Yes +Other data in host memory No Yes +================================================ ========================== ============= + +When using the standard-aligned (or *host*) execution policies, |onedpl_short| supports data being passed +to its algorithms as specified in the C++ standard (C++17 for algorithms working with iterators, +C++20 for parallel range algorithms), with :ref:`known restrictions and limitations `.
+ +According to the standard, the calling code must prevent data races when using algorithms +with parallel execution policies. + +.. note:: + Implementations of ``std::vector<bool>`` are not required to avoid data races for concurrent modifications + of vector elements. Some implementations may optimize multiple ``bool`` elements into a bitfield, making it unsafe + for multithreading. For this reason, it is recommended to avoid ``std::vector<bool>`` for anything but a read-only + input with the standard-aligned execution policies. + +The following subsections describe proper ways to pass data to an algorithm invoked with a device execution policy. .. _use-buffer-wrappers: Use oneapi::dpl::begin and oneapi::dpl::end Functions ``oneapi::dpl::begin`` and ``oneapi::dpl::end`` are special helper functions that allow you to pass SYCL buffers to parallel algorithms. These functions accept -a SYCL buffer and return an object of an unspecified type that provides the following API: +a `SYCL buffer`_ and return an object of an unspecified type that provides the following API: * It satisfies ``CopyConstructible`` and ``CopyAssignable`` C++ named requirements and is comparable with ``operator==`` and ``operator!=``. * It provides the ``get_buffer`` method, which returns the buffer passed to the ``begin`` and ``end`` functions. The ``begin`` and ``end`` functions can take SYCL 2020 deduction tags and ``sycl::no_init`` as arguments -to explicitly mention which access mode should be applied to the buffer accessor when submitting a -SYCL kernel to a device. For example: +to explicitly control which access mode should be applied to a particular buffer when submitting +a SYCL kernel to a device: ..
code:: cpp - auto first1 = begin(buf, sycl::read_only); - auto first2 = begin(buf, sycl::write_only, sycl::no_init); - auto first3 = begin(buf, sycl::no_init); - -The example above allows you to control the access mode for the particular buffer passing to a parallel algorithm. + sycl::buffer buf{/*...*/}; + auto first_ro = oneapi::dpl::begin(buf, sycl::read_only); + auto first_wo = oneapi::dpl::begin(buf, sycl::write_only, sycl::no_init); + auto first_ni = oneapi::dpl::begin(buf, sycl::no_init); To use the functions, add ``#include <oneapi/dpl/iterator>`` to your code. For example: .. code:: cpp #include #include #include + int main(){ std::vector<int> vec(1000); std::generate(vec.begin(), vec.end(), std::minstd_rand{}); - //create a buffer from host memory - sycl::buffer<int> buf { vec.data(), vec.size() }; + sycl::buffer<int> buf{ vec.data(), vec.size() }; auto buf_begin = oneapi::dpl::begin(buf); auto buf_end = oneapi::dpl::end(buf); - std::sort(oneapi::dpl::execution::dpcpp_default, buf_begin, buf_end); + oneapi::dpl::sort(oneapi::dpl::execution::dpcpp_default, buf_begin, buf_end); return 0; } @@ -71,9 +84,9 @@ To use the functions, add ``#include <oneapi/dpl/iterator>`` to your code. For e Use Unified Shared Memory ------------------------- -If you have USM-allocated memory, pass the pointers to the start and past the end -of the sequence to a parallel algorithm. Make sure that the execution policy and -the USM-allocated memory were created for the same queue. For example: +If you have USM-allocated data, pass the pointers to the start and past the end +of the data sequence to a parallel algorithm. Make sure that the execution policy and +the USM allocation use the same SYCL queue. For example:
For example: #include #include #include + int main(){ sycl::queue q; const int n = 1000; int* d_head = sycl::malloc_shared(n, q); std::generate(d_head, d_head + n, std::minstd_rand{}); - std::sort(oneapi::dpl::execution::make_device_policy(q), d_head, d_head + n); + oneapi::dpl::sort(oneapi::dpl::execution::make_device_policy(q), d_head, d_head + n); sycl::free(d_head, q); return 0; } +.. note:: + Use of non-USM pointers is not supported for algorithms with device execution policies. + When using device USM, such as allocated by ``malloc_device``, you are responsible for data transfers to and from the device to ensure that input data is device accessible during oneDPL algorithm execution and that the result is available to the subsequent operations. -Use std::vector ------------------------------ - -The following examples demonstrate two ways to use the parallel algorithms with ``std::vector``: +.. _use-std-vector: -* Host allocators -* USM allocators +Use std::vector +--------------- -You can use iterators to host allocated ``std::vector`` data -as shown in the following example: +You can use iterators to an ordinary ``std::vector`` with data in host memory, as shown in the following example: .. code:: cpp @@ -114,28 +127,42 @@ as shown in the following example: #include #include #include + int main(){ std::vector vec( 1000 ); std::generate(vec.begin(), vec.end(), std::minstd_rand{}); - std::sort(oneapi::dpl::execution::dpcpp_default, vec.begin(), vec.end()); + oneapi::dpl::sort(oneapi::dpl::execution::dpcpp_default, vec.begin(), vec.end()); return 0; } -When using iterators to host allocated data, a temporary SYCL buffer is created, and the data -is copied to this buffer. After processing on a device is complete, the modified data is copied -from the temporary buffer back to the host container. While convenient, using host allocated -data can lead to unintended copying between host and device. 
We recommend working with SYCL buffers -or USM memory to reduce data copying between the host and device. +In this case a temporary SYCL buffer is created, the data is copied to this buffer, and it is processed +according to the algorithm semantics. After processing on a device is complete, the modified data is copied +from the temporary buffer back to the host container. + +.. note:: + For parallel range algorithms with device execution policies the use of ordinary ``std::vector``\s is not supported. -You can also use ``std::vector`` with a USM allocator, as shown in the following example: +While convenient, direct use of an ordinary ``std::vector`` can lead to unintended copying between the host +and the device. We recommend working with SYCL buffers or with USM to reduce data copying. + +.. note:: + For specialized memory algorithms that begin or end the lifetime of data objects, that is, + ``uninitialized_*`` and ``destroy*`` families of functions, the data to initialize or destroy + should be accessible on the device without extra copying. Therefore these algorithms may not use + data storage on the host with device execution policies. + +You can also use ``std::vector`` with a ``sycl::usm_allocator``, as shown in the following example. +Make sure that the allocator and the execution policy use the same SYCL queue: .. 
code:: cpp #include #include #include + #include #include + int main(){ const int n = 1000; auto policy = oneapi::dpl::execution::dpcpp_default; @@ -144,18 +171,67 @@ You can also use ``std::vector`` with a USM allocator, as shown in the following std::generate(vec.begin(), vec.end(), std::minstd_rand{}); // Recommended to use USM pointers: - std::sort(policy, vec.data(), vec.data() + vec.size()); - - // Iterators for USM allocators might require extra copying - not recommended method - // std::sort(policy, vec.begin(), vec.end()); + oneapi::dpl::sort(policy, vec.data(), vec.data() + vec.size()); + /* + // Iterators for USM allocators might require extra copying - not a recommended method + oneapi::dpl::sort(policy, vec.begin(), vec.end()); + */ return 0; } -Make sure that the execution policy and the USM-allocated memory were created for the same queue. - For ``std::vector`` with a USM allocator, we recommend using ``std::vector::data()`` in combination with ``std::vector::size()`` as shown in the example above, rather than iterators to ``std::vector``. That is because for some implementations of the C++ Standard Library it might not be possible for |onedpl_short| to detect that iterators are pointing to USM-allocated data. In that -case the data will be treated as if it were host-allocated, with an extra copy made to a SYCL buffer. -Retrieving USM pointers from ``std::vector`` as shown guarantees no unintended copying. \ No newline at end of file +case the data will be treated as if it were in host memory, with an extra copy made to a SYCL buffer. +Retrieving USM pointers from ``std::vector`` as shown guarantees no unintended copying. + +.. _use-range-views: + +Use Range Views +--------------- + +For :doc:`parallel range algorithms ` with device execution policies, +place the data in USM or a USM-allocated ``std::vector``, and pass it to an algorithm +via a device-copyable range or view object such as ``std::ranges::subrange`` or ``std::span``. + ..
note:: + Use of ``std::ranges::views::all`` is not supported for algorithms with device execution policies. + +These data ranges, as well as the supported range adaptors and factories, may be combined into +data transformation pipelines that can also be used with parallel range algorithms. For example: + +.. code:: cpp + + #include + #include + #include + #include + #include + #include + #include + #include + + int main(){ + const int n = 1000; + auto policy = oneapi::dpl::execution::dpcpp_default; + sycl::queue q = policy.queue(); + + int* d_head = sycl::malloc_host<int>(n, q); + std::generate(d_head, d_head + n, std::minstd_rand{}); + + sycl::usm_allocator<int, sycl::usm::alloc::shared> alloc(q); + std::vector<int, decltype(alloc)> vec(n, alloc); + + oneapi::dpl::ranges::copy(policy, + std::ranges::subrange(d_head, d_head + n) | std::views::transform(std::negate{}), + std::span(vec)); + + oneapi::dpl::ranges::sort(policy, std::span(vec)); + + sycl::free(d_head, q); + return 0; + } + +.. _`SYCL buffer`: https://registry.khronos.org/SYCL/specs/sycl-2020/html/sycl-2020.html#subsec:buffers +.. _`unified shared memory`: https://registry.khronos.org/SYCL/specs/sycl-2020/html/sycl-2020.html#sec:usm diff --git a/_sources/parallel_api/range_based_api.rst b/_sources/parallel_api/range_based_api.rst index 7323814c59..5d55e11585 100644 --- a/_sources/parallel_api/range_based_api.rst +++ b/_sources/parallel_api/range_based_api.rst @@ -1,32 +1,75 @@ -Range-Based API Algorithms -########################## -.. Note:: +Experimental Range-Based API +############################ + +The ``<oneapi/dpl/ranges>`` header file contains experimental classes and functions that implement +functionality similar to that provided by the C++20 Ranges Library while requiring only C++17. +This allows you to combine |onedpl_short| data parallel execution capabilities with some aspects +of a modern range-based API. The functionality is only implemented for the device execution policies.
- The use of the range-based API requires C++17 and the C++ standard libraries coming with GCC 8.1 (or higher) - or Clang 7 (or higher). +.. Note:: + The use of the experimental range-based API requires the C++ standard libraries + coming with GCC 8.1 (or higher) or Clang 7 (or higher). -C++20 introduces the Ranges library. C++20 standard splits ranges into two categories: factories and adaptors. -A range factory does not have underlying data. An element is generated on success by an index or by dereferencing an iterator. -A range adaptor, from the |onedpl_long| (|onedpl_short|) perspective, is a utility that transforms the base range, -or another adapted range, into a view with custom behavior. +.. Warning:: + This experimental functionality will be gradually superseded by the + :doc:`parallel range algorithms ` and eventually discontinued. -|onedpl_short| supports an ``iota_view`` range factory. +Range Views -A ``sycl::buffer`` wrapped with ``all_view`` can be used as the range. +----------- -|onedpl_short| considers the supported factories and ``all_view`` as base ranges. -The range adaptors may be combined into a pipeline with a ``base`` range at the beginning. For example: +.. _viewable-ranges: + +The following viewable ranges are defined in the ``oneapi::dpl::experimental::ranges`` namespace: + +* ``views::iota``: A range factory that generates a sequence of elements by repeatedly incrementing an initial value. +* ``views::all``: A custom utility that represents a view of all or a part of ``sycl::buffer`` elements + for reading and writing on a device. +* ``views::all_read``: A custom utility that represents a view of all or a part of ``sycl::buffer`` elements + for reading on a device. +* ``views::all_write``: A custom utility that represents a view of all or a part of ``sycl::buffer`` elements + for writing on a device.
+* ``views::host_all``: A custom utility that represents a view of all or a part of ``sycl::buffer`` elements + for reading and writing on the host. +* ``views::subrange``: A utility that represents a view of a unified shared memory (USM) data range + defined by two USM pointers. +* ``views::zip``: A custom range adaptor that produces one ``zip_view`` from several other views. +* ``views::transform``: A range adaptor that represents a view of an underlying sequence after applying + a transformation to each element. +* ``views::reverse``: A range adaptor that produces a reversed sequence of elements provided by another view. +* ``views::take``: A range adaptor that produces a view of the first N elements from another view. +* ``views::drop``: A range adaptor that produces a view excluding the first N elements from another view. + +Only these ranges, ``sycl::buffer``, and their combinations can be passed to the experimental range-based algorithms. + +A ``sycl::buffer`` wrapped with ``views::all`` and similar utilities, ``views::subrange`` over USM, and ``views::iota`` +are considered *base ranges*. The range adaptors may be combined into a pipeline with a base range at the beginning. +For example: .. code:: cpp sycl::buffer buf(data, sycl::range<1>(10)); - auto range_1 = iota_view(0, 10) | views::reverse(); - auto range_2 = all_view(buf) | views::reverse(); + auto range_1 = views::iota(0, 10) | views::reverse; + auto range_2 = views::all(buf) | views::take(10); + +For ranges based on a SYCL buffer, data access is only permitted on a device, while ``size()`` and ``empty()`` +methods are allowed to be called on both host and device. + +Range-Based Algorithms +---------------------- + +The functions for experimental range-based algorithms resemble the standard C++ parallel algorithm overloads +where all data sequences are represented by ranges instead of iterators or iterator pairs, for example: + +..
code:: cpp + + template <typename ExecutionPolicy, typename Range1, typename Range2> + void copy(ExecutionPolicy&& exec, Range1&& source, Range2&& destination); -For the range, based on the ``all_view`` factory, data access is permitted on a device only. ``size()`` and ``empty()`` methods are allowed -to be called on both host and device. +Note that ``source`` is used instead of two iterators to represent the input, and ``destination`` represents the output. -The following algorithms are available to use with the ranges: +The following algorithms are available to use with the ranges. These algorithms are defined in the +``oneapi::dpl::experimental::ranges`` namespace and can only be invoked with device execution policies. +To use these algorithms, include both ``<oneapi/dpl/execution>`` and ``<oneapi/dpl/ranges>`` header files. * ``adjacent_find`` * ``all_of`` @@ -76,49 +119,19 @@ The following algorithms are available to use with the ranges: * ``unique`` * ``unique_copy`` -The signature example of the range-based algorithms looks like: - -.. code:: cpp - - template <typename ExecutionPolicy, typename Range1, typename Range2> - void copy(ExecutionPolicy&& exec, Range1&& source, Range2&& destination); -where ``source`` is used instead of two iterators to represent the input, and ``destination`` represents the output. -These algorithms are declared in the ``oneapi::dpl::experimental::ranges`` namespace and implemented only for device execution policies. -To make these algorithms available, the ``<oneapi/dpl/ranges>`` header should be included (after ``<oneapi/dpl/execution>``). -Use of the range-based API requires C++17 and the C++ standard libraries that come with GCC 8.1 (or higher) or Clang 7 (or higher). -The following viewable ranges are declared in the ``oneapi::dpl::experimental::ranges`` namespace. -Only the ranges shown below and ``sycl::buffer`` are available as ranges for range-based algorithms. -.. _viewable-ranges: -* ``views::iota``: A range factory that generates a sequence of N elements, which starts from an initial value and ends by final N-1.
-* ``views::all``: A custom utility that represents a view of all or a part of ``sycl::buffer`` underlying elements for reading and writing on a device. -* ``views::all_read``: A custom utility that represents a view of all or a part of ``sycl::buffer`` underlying elements for reading on a device. -* ``views::all_write``: A custom utility that represents a view of all or a part of ``sycl::buffer`` underlying elements for writing on a device. -* ``views::host_all``: A custom utility that represents a view of all or a part of ``sycl::buffer`` underlying elements for reading and writing on the host. -* ``views::subrange``: A utility that represents a view of unified shared memory (USM) data range defined by a two USM pointers. -* ``views::zip``: A custom range adapter that produces one ``zip_view`` from other several views. -* ``views::transform``: A range adapter that represents a view of a underlying sequence after applying a transformation to each element. -* ``views::reverse``: A range adapter that produces a reversed sequence of elements provided by another view. -* ``views::take``: A range adapter that produces a view of the first N elements from another view. -* ``views::drop``: A range adapter that produces a view excluding the first N elements from another view. - -Example of Range-Based API Usage --------------------------------- +Usage Example +------------- .. 
code:: cpp - using namespace oneapi::dpl::experimental::ranges; + namespace rangexp = oneapi::dpl::experimental::ranges; { sycl::buffer A(data, sycl::range<1>(max_n)); sycl::buffer B(data2, sycl::range<1>(max_n)); - auto view = all_view(A) | views::reverse(); - auto range_res = all_view(B); + auto view = rangexp::views::all(A) | rangexp::views::reverse; + auto range_res = rangexp::views::all_write(B); - copy(oneapi::dpl::execution::dpcpp_default, view, range_res); + rangexp::copy(oneapi::dpl::execution::dpcpp_default, view, range_res); } diff --git a/_sources/parallel_api_main.rst b/_sources/parallel_api_main.rst index 638aecc3ad..5c78c6f46f 100644 --- a/_sources/parallel_api_main.rst +++ b/_sources/parallel_api_main.rst @@ -1,38 +1,38 @@ Parallel API ############ -Parallel API is an implementation of the C++ standard libraries algorithms and execution -policies, as specified in the ISO/IEC 14882:2017 standard (commonly called C++17). The implementation -supports the unsequenced execution policy and the ``shift_left``/``shift_right`` algorithms, which are specified -in the final draft of the C++ 20 standard (N4860). For more details see the `C++ Standard Execution -Policies `_. |onedpl_long| (|onedpl_short|) -provides specific versions of the algorithms, including: +The Parallel API in |onedpl_long| (|onedpl_short|) is an implementation of the C++ standard algorithms +with `execution policies `_, +as specified in the ISO/IEC 14882:2017 standard (commonly called C++17), as well as those added in C++20. +It offers threaded and SIMD execution of these algorithms on Intel® processors implemented on top of OpenMP* +and |onetbb_short|, as well as data parallel execution on accelerators backed by SYCL* support in |dpcpp_cpp|. + +Extending the capabilities of `range algorithms `_ in C++20, +the Parallel API provides analogous *parallel range algorithms* that execute according to an execution policy. 
+ +In addition, |onedpl_short| provides specific variations of some algorithms, including: * Segmented reduce * Segmented scan * Vectorized search algorithms - -Parallel API offers support for the parallel and vectorized execution of algorithms on Intel® -processors and heterogeneity support with a DPC++ based implementation for device execution policies. -For sequential execution, |onedpl_short| relies on an available implementation of the C++ standard library. +* Sorting of key-value pairs +* Conditional transform The utility API includes iterators and function object classes. The iterators implement zip, transform, complete permutation operations on other iterators, and include a counting and discard iterator. The function object classes provide minimum, maximum, and identity operations that may be passed to algorithms such as reduce or transform. -|onedpl_short| also includes an experimental implementation of range-based algorithms with their -required ranges and Async API. +|onedpl_short| also includes an experimental implementation of asynchronous algorithms. .. 
toctree:: :maxdepth: 2 :titlesonly: - :glob: :hidden: parallel_api/execution_policies - parallel_api/iterators - parallel_api/async_api - parallel_api/range_based_api + parallel_api/parallel_range_algorithms parallel_api/additional_algorithms parallel_api/pass_data_algorithms + parallel_api/iterators + parallel_api/range_based_api diff --git a/_static/documentation_options.js b/_static/documentation_options.js index 8302a8473b..89523924e1 100644 --- a/_static/documentation_options.js +++ b/_static/documentation_options.js @@ -1,6 +1,6 @@ var DOCUMENTATION_OPTIONS = { URL_ROOT: document.getElementById("documentation_options").getAttribute('data-url_root'), - VERSION: '2022.6.0', + VERSION: '2022.7.0', LANGUAGE: 'None', COLLAPSE_INDEX: false, BUILDER: 'html', diff --git a/api_for_sycl_kernels/random.html b/api_for_sycl_kernels/random.html index 912411955a..3bdadbd936 100644 --- a/api_for_sycl_kernels/random.html +++ b/api_for_sycl_kernels/random.html @@ -8,7 +8,7 @@ - Random Number Generators — oneDPL Documentation 2022.6.0 documentation + Random Number Generators — oneDPL Documentation 2022.7.0 documentation @@ -45,8 +45,8 @@ - - + + @@ -151,24 +151,31 @@