Skip to content

Commit

Permalink
back to more cases
Browse files Browse the repository at this point in the history
  • Loading branch information
vuule committed Nov 5, 2024
1 parent 1feca3b commit 714011a
Show file tree
Hide file tree
Showing 2 changed files with 25 additions and 19 deletions.
38 changes: 22 additions & 16 deletions cpp/benchmarks/io/parquet/parquet_reader_input.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -287,38 +287,44 @@ void BM_parquet_read_wide_tables_mixed(nvbench::state& state)
parquet_read_common(num_rows_written, n_col, source_sink, state, data_size_bytes);
}

// Data types for the type axis of benchmarks registered with NVBENCH_TYPE_AXES(d_type_list).
// NOTE(review): two definitions of this alias appear back to back because this text is a
// diff rendering without +/- markers; presumably the three-entry list is the removed
// version and the eight-entry list is the added one -- confirm against the commit.
using d_type_list =
nvbench::enum_type_list<data_type::FLOAT, data_type::DECIMAL, data_type::STRING>;
using d_type_list = nvbench::enum_type_list<data_type::INTEGRAL,
data_type::FLOAT,
data_type::DECIMAL,
data_type::TIMESTAMP,
data_type::DURATION,
data_type::STRING,
data_type::LIST,
data_type::STRUCT>;

// Registers BM_parquet_read_data under the name "parquet_read_decode", typed over
// d_type_list (type axis named "data_type"), with io_type limited to DEVICE_BUFFER and
// set_min_samples(4).
// NOTE(review): the cardinality/run_length axes are listed twice because this text is a
// diff rendering without +/- markers; presumably {0, 1000} / {1, 32} is the removed pair
// and {0, 2000} / {1, 16} is the added pair -- confirm against the commit.
NVBENCH_BENCH_TYPES(BM_parquet_read_data, NVBENCH_TYPE_AXES(d_type_list))
.set_name("parquet_read_decode")
.set_type_axes_names({"data_type"})
.add_string_axis("io_type", {"DEVICE_BUFFER"})
.set_min_samples(4)
.add_int64_axis("cardinality", {0, 1000})
.add_int64_axis("run_length", {1, 32});
.add_int64_axis("cardinality", {0, 2000})
.add_int64_axis("run_length", {1, 16});

// Registers BM_parquet_read_io_compression under the name "parquet_read_io_compression",
// with io_type limited to DEVICE_BUFFER and set_min_samples(4). No type axis is used here
// (NVBENCH_BENCH rather than NVBENCH_BENCH_TYPES).
// NOTE(review): the cardinality/run_length axes are listed twice because this text is a
// diff rendering without +/- markers; presumably the first pair is the removed version
// and the second pair is the added one -- confirm against the commit.
NVBENCH_BENCH(BM_parquet_read_io_compression)
.set_name("parquet_read_io_compression")
.add_string_axis("io_type", {"DEVICE_BUFFER"})
.set_min_samples(4)
.add_int64_axis("cardinality", {0, 1000})
.add_int64_axis("run_length", {1, 32});
.add_int64_axis("cardinality", {0, 2000})
.add_int64_axis("run_length", {1, 16});

// Registers BM_parquet_read_chunks under the name "parquet_read_chunks", typed over
// d_type_list, with io_type limited to DEVICE_BUFFER, set_min_samples(4), and an extra
// "byte_limit" axis with values 0 and 500'000.
// NOTE(review): the cardinality/run_length axes are listed twice because this text is a
// diff rendering without +/- markers; presumably the first pair is the removed version
// and the second pair is the added one -- confirm against the commit.
NVBENCH_BENCH_TYPES(BM_parquet_read_chunks, NVBENCH_TYPE_AXES(d_type_list))
.set_name("parquet_read_chunks")
.add_string_axis("io_type", {"DEVICE_BUFFER"})
.set_min_samples(4)
.add_int64_axis("cardinality", {0, 1000})
.add_int64_axis("run_length", {1, 32})
.add_int64_axis("cardinality", {0, 2000})
.add_int64_axis("run_length", {1, 16})
.add_int64_axis("byte_limit", {0, 500'000});

// Registers BM_parquet_read_io_small_mixed under the name "parquet_read_io_small_mixed",
// with io_type limited to DEVICE_BUFFER, set_min_samples(4), and a "num_string_cols"
// axis taking the values 1, 2 and 3.
// NOTE(review): the cardinality/run_length axes are listed twice because this text is a
// diff rendering without +/- markers; presumably the first pair is the removed version
// and the second pair is the added one -- confirm against the commit.
NVBENCH_BENCH(BM_parquet_read_io_small_mixed)
.set_name("parquet_read_io_small_mixed")
.add_string_axis("io_type", {"DEVICE_BUFFER"})
.set_min_samples(4)
.add_int64_axis("cardinality", {0, 1000})
.add_int64_axis("run_length", {1, 32})
.add_int64_axis("cardinality", {0, 2000})
.add_int64_axis("run_length", {1, 16})
.add_int64_axis("num_string_cols", {1, 2, 3});

// Two-entry type list (DECIMAL and STRING); judging by its name it is meant for the
// wide-table benchmarks -- the registration that consumes it is truncated in this view.
using d_type_list_wide_table = nvbench::enum_type_list<data_type::DECIMAL, data_type::STRING>;
Expand All @@ -329,17 +335,17 @@ NVBENCH_BENCH_TYPES(BM_parquet_read_wide_tables, NVBENCH_TYPE_AXES(d_type_list_w
.add_string_axis("io_type", {"DEVICE_BUFFER"})
.add_int64_axis("data_size_mb", {1024, 2048, 4096})
.add_int64_axis("num_cols", {256, 512, 1024})
.add_int64_axis("cardinality", {0, 1000})
.add_int64_axis("run_length", {1, 32});
.add_int64_axis("cardinality", {0, 2000})
.add_int64_axis("run_length", {1, 16});

// Registers BM_parquet_read_wide_tables_mixed under the name
// "parquet_read_wide_tables_mixed", with io_type limited to DEVICE_BUFFER,
// set_min_samples(4), a "data_size_mb" axis (1024, 2048, 4096) and a "num_cols" axis
// (256, 512, 1024).
// NOTE(review): the cardinality/run_length axes are listed twice because this text is a
// diff rendering without +/- markers; presumably the first pair is the removed version
// and the second pair is the added one -- confirm against the commit.
NVBENCH_BENCH(BM_parquet_read_wide_tables_mixed)
.set_name("parquet_read_wide_tables_mixed")
.add_string_axis("io_type", {"DEVICE_BUFFER"})
.set_min_samples(4)
.add_int64_axis("data_size_mb", {1024, 2048, 4096})
.add_int64_axis("num_cols", {256, 512, 1024})
.add_int64_axis("cardinality", {0, 1000})
.add_int64_axis("run_length", {1, 32});
.add_int64_axis("cardinality", {0, 2000})
.add_int64_axis("run_length", {1, 16});

// A benchmark for structs that only contain fixed-width types.
// The type list below has a single entry, data_type::STRUCT, so a benchmark typed over
// it is instantiated for that one data type only.
using d_type_list_struct_only = nvbench::enum_type_list<data_type::STRUCT>;
Expand All @@ -348,5 +354,5 @@ NVBENCH_BENCH_TYPES(BM_parquet_read_fixed_width_struct, NVBENCH_TYPE_AXES(d_type
.set_type_axes_names({"data_type"})
.add_string_axis("io_type", {"DEVICE_BUFFER"})
.set_min_samples(4)
.add_int64_axis("cardinality", {0, 1000})
.add_int64_axis("run_length", {1, 32});
.add_int64_axis("cardinality", {0, 2000})
.add_int64_axis("run_length", {1, 16});
6 changes: 3 additions & 3 deletions cpp/benchmarks/io/parquet/parquet_reader_options.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -148,7 +148,7 @@ NVBENCH_BENCH_TYPES(BM_parquet_read_options,
"str_to_categories",
"uses_pandas_metadata",
"timestamp_type"})
.add_string_axis("io_type", {"PINNED_BUFFER", "DEVICE_BUFFER"})
.add_string_axis("io_type", {"DEVICE_BUFFER"})
.set_min_samples(4);

using col_selections = nvbench::enum_type_list<column_selection::ALL,
Expand All @@ -167,7 +167,7 @@ NVBENCH_BENCH_TYPES(BM_parquet_read_options,
"str_to_categories",
"uses_pandas_metadata",
"timestamp_type"})
.add_string_axis("io_type", {"PINNED_BUFFER", "DEVICE_BUFFER"})
.add_string_axis("io_type", {"DEVICE_BUFFER"})
.set_min_samples(4);

NVBENCH_BENCH_TYPES(
Expand All @@ -183,5 +183,5 @@ NVBENCH_BENCH_TYPES(
"str_to_categories",
"uses_pandas_metadata",
"timestamp_type"})
.add_string_axis("io_type", {"PINNED_BUFFER", "DEVICE_BUFFER"})
.add_string_axis("io_type", {"DEVICE_BUFFER"})
.set_min_samples(4);

0 comments on commit 714011a

Please sign in to comment.