forked from NVIDIA/CUDALibrarySamples
-
Notifications
You must be signed in to change notification settings - Fork 1
/
benchmark_deflate_chunked.cu
84 lines (78 loc) · 2.59 KB
/
benchmark_deflate_chunked.cu
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
/*
* SPDX-FileCopyrightText: Copyright (c) 2020-2024 NVIDIA CORPORATION & AFFILIATES.
* All rights reserved. SPDX-License-Identifier: LicenseRef-NvidiaProprietary
*
* NVIDIA CORPORATION, its affiliates and licensors retain all intellectual
* property and proprietary rights in and to this material, related
* documentation and any modifications thereto. Any use, reproduction,
* disclosure or distribution of this material and related documentation
* without an express license agreement from NVIDIA CORPORATION or
* its affiliates is strictly prohibited.
*/
#include "benchmark_template_chunked.cuh"
#include "nvcomp/deflate.h"
// Deflate options passed to run_benchmark_template() by run_benchmark().
// Initialized from nvcompBatchedDeflateDefaultOpts; handleCommandLineArgument()
// overwrites the `algo` field when --algorithm / -a is given.
static nvcompBatchedDeflateOpts_t nvcompBatchedDeflateOpts = nvcompBatchedDeflateDefaultOpts;
/**
 * Handles the Deflate-specific command-line options of this benchmark.
 *
 * Recognizes "--algorithm" / "-a" followed by a decimal integer in [1, 5] and
 * stores that value in nvcompBatchedDeflateOpts.algo.
 *
 * @param arg                The option token being examined.
 * @param additionalArgs     Pointer to the tokens that follow `arg`; the first
 *                           one is read as the option's value.
 * @param additionalArgsUsed Set to 1 once a value token has been read for a
 *                           recognized option (even if that value is then
 *                           rejected); left untouched otherwise.
 * @return true if the option was recognized and its value accepted; false if
 *         the option is unknown, its value is missing, or its value is not a
 *         whole number in the accepted range.
 */
static bool handleCommandLineArgument(
    const std::string& arg,
    const char* const* additionalArgs,
    size_t& additionalArgsUsed)
{
  if (arg != "--algorithm" && arg != "-a") {
    return false;
  }

  // Defensive guard: the caller is not visible from here, so do not assume a
  // value token always follows the option (argv is terminated by a null
  // pointer, and dereferencing it for parsing would be undefined behavior).
  if (additionalArgs == nullptr || *additionalArgs == nullptr) {
    std::cerr << "ERROR: Missing value for " << arg << std::endl;
    return false;
  }

  const char* const value_text = *additionalArgs;
  additionalArgsUsed = 1;

  // strtol (unlike atoi) reports where parsing stopped, so inputs such as
  // "abc" or "3abc" can be rejected instead of being read as 0 or 3. On
  // overflow it returns LONG_MIN/LONG_MAX, which the range check below rejects.
  char* parse_end = nullptr;
  const long parsed = strtol(value_text, &parse_end, 10);
  const bool is_whole_number = parse_end != value_text && *parse_end == '\0';

  // Note:
  // Currently algorithm_type=0 is not working, and hence
  // we need to disable this option.
  // TODO: Fix algorithmic option 0, then re-enable.
  if (!is_whole_number || parsed < 1 || parsed > 5) {
    std::cerr << "ERROR: Deflate algorithm must be 1, 2, 3, 4, 5, but it is "
              << value_text << std::endl;
    return false;
  }

  nvcompBatchedDeflateOpts.algo = static_cast<int>(parsed);
  return true;
}
/**
 * Checks that every chunk in `data` is within the size limit enforced here
 * for Deflate (65536 bytes).
 *
 * Stops at the first oversized chunk, prints an error to stderr, and reports
 * failure. An empty `data` is considered valid.
 *
 * @param data The input chunks, one inner vector per chunk.
 * @return true if no chunk exceeds 65536 bytes, false otherwise.
 */
static bool isDeflateInputValid(const std::vector<std::vector<char>>& data)
{
  // Largest chunk size, in bytes, accepted by this check.
  const size_t max_chunk_bytes = 65536;

  for (auto it = data.begin(); it != data.end(); ++it) {
    if (it->size() <= max_chunk_bytes) {
      continue;
    }
    std::cerr << "ERROR: Deflate doesn't support chunk sizes larger than "
                 "65536 bytes."
              << std::endl;
    return false;
  }
  return true;
}
// Deflate entry point for the chunked benchmark.
//
// Forwards every parameter unchanged to run_benchmark_template(), together
// with the nvcomp batched Deflate functions, the isDeflateInputValid() check,
// and the file-level nvcompBatchedDeflateOpts object.
//
// NOTE(review): the meaning of each parameter (warmup, count, csv_output,
// tab_separator, duplicate_count, num_files, compressed_inputs,
// single_output_buffer) is defined by run_benchmark_template(), which is not
// visible in this file -- consult benchmark_template_chunked.cuh.
void run_benchmark(
const std::vector<std::vector<char>>& data,
const bool warmup,
const size_t count,
const bool csv_output,
const bool tab_separator,
const size_t duplicate_count,
const size_t num_files,
const bool compressed_inputs,
const bool single_output_buffer)
{
// Argument order must match the template's parameter list: first the
// Deflate-specific callables and options, then the forwarded parameters.
run_benchmark_template(
nvcompBatchedDeflateCompressGetTempSize,
nvcompBatchedDeflateCompressGetMaxOutputChunkSize,
nvcompBatchedDeflateCompressAsync,
nvcompBatchedDeflateDecompressGetTempSize,
nvcompBatchedDeflateDecompressAsync,
nvcompBatchedDeflateGetDecompressSizeAsync,
isDeflateInputValid,
nvcompBatchedDeflateOpts,
data,
warmup,
count,
csv_output,
tab_separator,
duplicate_count,
num_files,
compressed_inputs,
single_output_buffer);
}