-
Notifications
You must be signed in to change notification settings - Fork 26
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
External storage API with updates from 2023-02-09 discussion with GDS.
- Loading branch information
Showing
3 changed files
with
189 additions
and
9 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,131 @@ | ||
/* | ||
* Copyright (c) 2022, NVIDIA CORPORATION. | ||
* | ||
* Licensed under the Apache License, Version 2.0 (the "License"); | ||
* you may not use this file except in compliance with the License. | ||
* You may obtain a copy of the License at | ||
* | ||
* http://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, software | ||
* distributed under the License is distributed on an "AS IS" BASIS, | ||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
* See the License for the specific language governing permissions and | ||
* limitations under the License. | ||
*/ | ||
#pragma once | ||
|
||
#include <cstdint> | ||
#include <type_traits> | ||
#include "merlin/memory_pool.cuh" | ||
|
||
namespace nv { | ||
namespace merlin { | ||
|
||
template <class Key, class Value> | ||
class ExternalStorage { | ||
public: | ||
using size_type = size_t; | ||
using key_type = Key; | ||
using value_type = Value; | ||
|
||
using dev_mem_pool_type = MemoryPool<DeviceAllocator<char>>; | ||
using host_mem_pool_type = MemoryPool<HostAllocator<char>>; | ||
|
||
const size_type value_dim; | ||
|
||
ExternalStorage() = delete; | ||
|
||
/** | ||
* Constructs external storage object. | ||
* | ||
* @param value_dim The dimensionality of the values. In other words, each | ||
* value stored is exactly `value_dim * sizeof(value_type)` bytes large. | ||
*/ | ||
ExternalStorage(const size_type value_dim) : value_dim{value_dim} {} | ||
|
||
/** | ||
* @brief Inserts key/value pairs into the external storage that are about to | ||
* be evicted from the Merlin hashtable. If a key/value pair already exists, | ||
* overwrites the current value. | ||
* | ||
* @param dev_mem_pool Memory pool for temporarily allocating device memory. | ||
* @param host_mem_pool Memory pool for temporarily allocating host memory. | ||
* @param hkvs_is_pure_hbm True if the Merlin hashtable store is currently | ||
* operating in pure HBM mode, false otherwise. In pure HBM mode, all `values` | ||
* pointers are GUARANTEED to point to device memory. | ||
* @param n Number of key/value slots provided in other arguments. | ||
* @param d_masked_keys Device pointer to an (n)-sized array of keys. | ||
* Key-Value slots that should be ignored have the key set to `EMPTY_KEY`. | ||
* @param d_values Device pointer to an (n)-sized array containing pointers to | ||
* respectively a memory location where the current values for a key are | ||
* stored. Each pointer points to a vector of length `value_dim`. Pointers | ||
* *can* be set to `nullptr` for slots where the corresponding key equated to | ||
* the `EMPTY_KEY`. The memory locations can be device or host memory (see | ||
* also `hkvs_is_pure_hbm`). | ||
* @param stream Stream that MUST be used for queuing asynchronous CUDA | ||
* operations. If only the input arguments or resources obtained from | ||
* respectively `dev_mem_pool` and `host_mem_pool` are used for such | ||
* operations, it is not necessary to synchronize the stream prior to | ||
* returning from the function. | ||
*/ | ||
virtual void insert_or_assign(dev_mem_pool_type& dev_mem_pool, | ||
host_mem_pool_type& host_mem_pool, | ||
bool hkvs_is_pure_hbm, size_type n, | ||
const key_type* d_masked_keys, // (n) | ||
const value_type* const* d_values, // (n) | ||
cudaStream_t stream) = 0; | ||
|
||
/** | ||
* @brief Attempts to find the supplied `d_keys` if the corresponding | ||
* `d_founds`-flag is `false` and fills the stored into the supplied memory | ||
* locations (i.e. in `d_values`). | ||
* | ||
* @param dev_mem_pool Memory pool for temporarily allocating device memory. | ||
* @param host_mem_pool Memory pool for temporarily allocating host memory. | ||
* @param n Number of key/value slots provided in other arguments. | ||
* @param d_keys Device pointer to an (n)-sized array of keys. | ||
* @param d_values Device pointer to an (n * value_dim)-sized array to store | ||
* the retrieved `d_values`. For slots where the corresponding `d_founds`-flag | ||
* is not `false`, the value may already have been assigned and, thus, MUST | ||
* not be altered. | ||
* @param d_founds Device pointer to an (n)-sized array which indicates | ||
* whether the corresponding `d_values` slot is already filled or not. So, if | ||
* and only if `d_founds` is still false, the implementation shall attempt to | ||
* retrieve and fill in the value for the corresponding key. If a key/value | ||
* was retrieved successfully from external storage, the implementation MUST | ||
* also set `d_founds` to `true`. | ||
* @param stream Stream that MUST be used for queuing asynchronous CUDA | ||
* operations. If only the input arguments or resources obtained from | ||
* respectively `dev_mem_pool` and `host_mem_pool` are used for such | ||
* operations, it is not necessary to synchronize the stream prior to | ||
* returning from the function. | ||
*/ | ||
virtual void find(dev_mem_pool_type& dev_mem_pool, | ||
host_mem_pool_type& host_mem_pool, size_type n, | ||
const key_type* d_keys, // (n) | ||
value_type* d_values, // (n * value_dim) | ||
bool* d_founds, // (n) | ||
cudaStream_t stream) = 0; | ||
|
||
/** | ||
* @brief Attempts to erase the entries associated with the supplied `d_keys`. | ||
* For keys do not exist nothing happens. It is permissible for this function | ||
* to be implemented asynchronously (i.e., to return before the actual | ||
* deletion has happened). | ||
* | ||
* @param dev_mem_pool Memory pool for temporarily allocating device memory. | ||
* @param host_mem_pool Memory pool for temporarily allocating host memory. | ||
* @param n Number of keys provided in `d_keys` arguments. | ||
* @param d_keys Device pointer to an (n)-sized array of keys. This pointer is | ||
* only guarnteed to be valid for the duration of the call. If easure is | ||
* implemented asynchronously, you must make a copy and manage its lifetime | ||
* yourself. | ||
*/ | ||
virtual void erase_async(dev_mem_pool_type& dev_mem_pool, | ||
host_mem_pool_type& host_mem_pool, size_type n, | ||
const key_type* d_keys, cudaStream_t stream) = 0; | ||
}; | ||
|
||
} // namespace merlin | ||
} // namespace nv |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters