From 87a9621f2d710232c23cd8de1e1ddc0856d10482 Mon Sep 17 00:00:00 2001 From: Benjamin Kietzman Date: Mon, 21 Oct 2024 15:34:07 -0500 Subject: [PATCH 1/8] GH-44491: [C++] StatusConstant- cheaply copied const Status --- cpp/src/arrow/result.cc | 13 ++++++---- cpp/src/arrow/result.h | 6 +++-- cpp/src/arrow/status.cc | 25 ++++++++++++------- cpp/src/arrow/status.h | 31 ++++++++++++++---------- cpp/src/arrow/status_internal.h | 43 +++++++++++++++++++++++++++++++++ cpp/src/arrow/status_test.cc | 13 ++++++++++ 6 files changed, 102 insertions(+), 29 deletions(-) create mode 100644 cpp/src/arrow/status_internal.h diff --git a/cpp/src/arrow/result.cc b/cpp/src/arrow/result.cc index 0bb65acb83181..e76231a411d49 100644 --- a/cpp/src/arrow/result.cc +++ b/cpp/src/arrow/result.cc @@ -20,10 +20,9 @@ #include #include "arrow/util/logging.h" +#include "arrow/status_internal.h" -namespace arrow { - -namespace internal { +namespace arrow::internal { void DieWithMessage(const std::string& msg) { ARROW_LOG(FATAL) << msg; } @@ -31,6 +30,10 @@ void InvalidValueOrDie(const Status& st) { DieWithMessage(std::string("ValueOrDie called on an error: ") + st.ToString()); } -} // namespace internal +Status UninitializedResult() { + static StatusConstant uninitialized_result{StatusCode::UnknownError, + "Uninitialized Result"}; + return uninitialized_result; +} -} // namespace arrow +} // namespace arrow::internal diff --git a/cpp/src/arrow/result.h b/cpp/src/arrow/result.h index 091351154251e..bb3e49d0ca933 100644 --- a/cpp/src/arrow/result.h +++ b/cpp/src/arrow/result.h @@ -39,6 +39,8 @@ ARROW_EXPORT void DieWithMessage(const std::string& msg); ARROW_EXPORT void InvalidValueOrDie(const Status& st); +ARROW_EXPORT Status UninitializedResult(); + } // namespace internal /// A class for representing either a usable value, or an error. @@ -112,7 +114,7 @@ class [[nodiscard]] Result : public util::EqualityComparable> { /// an empty vector, it will actually invoke the default constructor of /// Result. explicit Result() noexcept // NOLINT(runtime/explicit) - : status_(Status::UnknownError("Uninitialized Result")) {} + : status_(internal::UninitializedResult()) {} ~Result() noexcept { Destroy(); } @@ -302,7 +304,7 @@ class [[nodiscard]] Result : public util::EqualityComparable> { /// has a value. Status status() && { if (ok()) return Status::OK(); - auto tmp = Status::UnknownError("Uninitialized Result"); + auto tmp = internal::UninitializedResult(); std::swap(status_, tmp); return tmp; } diff --git a/cpp/src/arrow/status.cc b/cpp/src/arrow/status.cc index 368e03cac0bd2..34b6336c72911 100644 --- a/cpp/src/arrow/status.cc +++ b/cpp/src/arrow/status.cc @@ -15,7 +15,9 @@ #include #include #include -#include +#ifdef ARROW_EXTRA_ERROR_CONTEXT +# include +#endif #include "arrow/util/logging.h" @@ -26,18 +28,19 @@ Status::Status(StatusCode code, const std::string& msg) Status::Status(StatusCode code, std::string msg, std::shared_ptr detail) { ARROW_CHECK_NE(code, StatusCode::OK) << "Cannot construct ok status with message"; - state_ = new State; - state_->code = code; - state_->msg = std::move(msg); - if (detail != nullptr) { - state_->detail = std::move(detail); - } + state_ = new State{code, std::move(msg), std::move(detail)}; } +// We would prefer that this destructor *not* be inlined, since the vast majority of +// Statuses are OK and so inlining would superflously increase binary size. +Status::State::~State() = default; + void Status::CopyFrom(const Status& s) { - delete state_; + DeleteState(); if (s.state_ == nullptr) { state_ = nullptr; + } else if (s.state_->is_constant) { + state_ = s.state_; } else { state_ = new State(*s.state_); } @@ -160,7 +163,11 @@ void Status::AddContextLine(const char* filename, int line, const char* expr) { ARROW_CHECK(!ok()) << "Cannot add context line to ok status"; std::stringstream ss; ss << "\n" << filename << ":" << line << " " << expr; - state_->msg += ss.str(); + if (state_->is_constant) { + // We can't add context lines to a StatusConstant's state, so copy it now + state_ = new State{code(), message(), detail()}; + } + const_cast(state_)->msg += ss.str(); } #endif diff --git a/cpp/src/arrow/status.h b/cpp/src/arrow/status.h index fb75d963f3a3c..a9570d8126e64 100644 --- a/cpp/src/arrow/status.h +++ b/cpp/src/arrow/status.h @@ -82,6 +82,9 @@ #endif namespace arrow { +namespace internal { +class StatusConstant; +} enum class StatusCode : char { OK = 0, @@ -134,13 +137,7 @@ class ARROW_EXPORT [[nodiscard]] Status : public util::EqualityComparable detail; + bool is_constant = false; + ~State(); }; // OK status has a `NULL` state_. Otherwise, `state_` points to // a `State` structure containing the error code and message(s) - State* state_; + const State* state_; void DeleteState() { - delete state_; - state_ = NULLPTR; + // ARROW-2400: On certain compilers, splitting off the slow path improves + // performance significantly. + if (ARROW_PREDICT_FALSE(state_ != NULLPTR)) { + if (!state_->is_constant) { + delete state_; + } + } } void CopyFrom(const Status& s); inline void MoveFrom(Status& s); + + friend class internal::StatusConstant; }; void Status::MoveFrom(Status& s) { - delete state_; + DeleteState(); state_ = s.state_; s.state_ = NULLPTR; } -Status::Status(const Status& s) - : state_((s.state_ == NULLPTR) ? NULLPTR : new State(*s.state_)) {} +Status::Status(const Status& s) : state_{NULLPTR} { CopyFrom(s); } Status& Status::operator=(const Status& s) { // The following condition catches both aliasing (when this == &s), diff --git a/cpp/src/arrow/status_internal.h b/cpp/src/arrow/status_internal.h new file mode 100644 index 0000000000000..9474716551ab2 --- /dev/null +++ b/cpp/src/arrow/status_internal.h @@ -0,0 +1,43 @@ +// Licensed to the Apache Software Foundation (ASF) under one +// or more contributor license agreements. See the NOTICE file +// distributed with this work for additional information +// regarding copyright ownership. The ASF licenses this file +// to you under the Apache License, Version 2.0 (the +// "License"); you may not use this file except in compliance +// with the License. You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, +// software distributed under the License is distributed on an +// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +// KIND, either express or implied. See the License for the +// specific language governing permissions and limitations +// under the License. + +#pragma once + +#include "arrow/status.h" +#include "arrow/util/logging.h" + +namespace arrow::internal { + +class StatusConstant { + public: + StatusConstant(StatusCode code, std::string msg, + std::shared_ptr detail = nullptr) + : state_{code, std::move(msg), std::move(detail), /*is_constant=*/true} { + ARROW_CHECK_NE(code, StatusCode::OK) << "Cannot construct ok status constant"; + } + + operator Status() const { // NOLINT(runtime/explicit) + Status st; + st.state_ = &state_; + return st; + } + + private: + Status::State state_; +}; + +} // namespace arrow::internal diff --git a/cpp/src/arrow/status_test.cc b/cpp/src/arrow/status_test.cc index b446705933285..990aadabec8d1 100644 --- a/cpp/src/arrow/status_test.cc +++ b/cpp/src/arrow/status_test.cc @@ -21,6 +21,7 @@ #include #include "arrow/status.h" +#include "arrow/status_internal.h" #include "arrow/testing/gtest_util.h" #include "arrow/testing/matchers.h" @@ -76,6 +77,18 @@ TEST(StatusTest, TestCoverageWarnNotOK) { ARROW_WARN_NOT_OK(Status::Invalid("invalid"), "Expected warning"); } +TEST(StatusTest, StatusConstant) { + internal::StatusConstant constant{StatusCode::Invalid, "default error"}; + Status st = constant; + + ASSERT_EQ(st.code(), StatusCode::Invalid); + ASSERT_EQ(st.message(), "default error"); + ASSERT_EQ(st.detail(), nullptr); + + Status copy = st; + ASSERT_EQ(&st.message(), ©.message()); +} + TEST(StatusTest, AndStatus) { Status a = Status::OK(); Status b = Status::OK(); From 3cfd338382766cfb6550ab0800eed0be40cb20d7 Mon Sep 17 00:00:00 2001 From: Benjamin Kietzman Date: Fri, 25 Oct 2024 10:22:54 -0500 Subject: [PATCH 2/8] DeleteState()->noexcept --- cpp/src/arrow/status.h | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cpp/src/arrow/status.h b/cpp/src/arrow/status.h index a9570d8126e64..1cfaf7cff2081 100644 --- a/cpp/src/arrow/status.h +++ b/cpp/src/arrow/status.h @@ -372,7 +372,7 @@ class ARROW_EXPORT [[nodiscard]] Status : public util::EqualityComparable Date: Fri, 25 Oct 2024 10:34:28 -0500 Subject: [PATCH 3/8] clang-format --- cpp/src/arrow/result.cc | 2 +- cpp/src/arrow/result.h | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/cpp/src/arrow/result.cc b/cpp/src/arrow/result.cc index e76231a411d49..e8c5a57ee7bc0 100644 --- a/cpp/src/arrow/result.cc +++ b/cpp/src/arrow/result.cc @@ -19,8 +19,8 @@ #include -#include "arrow/util/logging.h" #include "arrow/status_internal.h" +#include "arrow/util/logging.h" namespace arrow::internal { diff --git a/cpp/src/arrow/result.h b/cpp/src/arrow/result.h index bb3e49d0ca933..f8ae5b15d527c 100644 --- a/cpp/src/arrow/result.h +++ b/cpp/src/arrow/result.h @@ -303,7 +303,7 @@ class [[nodiscard]] Result : public util::EqualityComparable> { /// \return The stored non-OK status object, or an OK status if this object /// has a value. Status status() && { - if (ok()) return Status::OK(); + if (ARROW_PREDICT_TRUE(ok())) return Status::OK(); auto tmp = internal::UninitializedResult(); std::swap(status_, tmp); return tmp; From f0896ab2d063fea2a9f4a44fb66f9d6e8b21d090 Mon Sep 17 00:00:00 2001 From: Benjamin Kietzman Date: Fri, 25 Oct 2024 10:49:06 -0500 Subject: [PATCH 4/8] msvc: try fixing visibility for State::~State --- cpp/src/arrow/status.h | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cpp/src/arrow/status.h b/cpp/src/arrow/status.h index 1cfaf7cff2081..81b6175d3ce7d 100644 --- a/cpp/src/arrow/status.h +++ b/cpp/src/arrow/status.h @@ -361,7 +361,7 @@ class ARROW_EXPORT [[nodiscard]] Status : public util::EqualityComparable detail; From 8b0953864085c857f73481b3c25c1855d869a920 Mon Sep 17 00:00:00 2001 From: Benjamin Kietzman Date: Mon, 4 Nov 2024 11:32:22 -0600 Subject: [PATCH 5/8] review comments --- cpp/src/arrow/status.cc | 10 +++++----- cpp/src/arrow/status.h | 23 ++++++++++++++--------- cpp/src/arrow/status_internal.h | 3 ++- 3 files changed, 21 insertions(+), 15 deletions(-) diff --git a/cpp/src/arrow/status.cc b/cpp/src/arrow/status.cc index 34b6336c72911..de2955de4619e 100644 --- a/cpp/src/arrow/status.cc +++ b/cpp/src/arrow/status.cc @@ -31,12 +31,12 @@ Status::Status(StatusCode code, std::string msg, std::shared_ptr d state_ = new State{code, std::move(msg), std::move(detail)}; } -// We would prefer that this destructor *not* be inlined, since the vast majority of -// Statuses are OK and so inlining would superflously increase binary size. -Status::State::~State() = default; - void Status::CopyFrom(const Status& s) { - DeleteState(); + if (ARROW_PREDICT_FALSE(state_ != NULL)) { + if (!state_->is_constant) { + DeleteState(); + } + } if (s.state_ == nullptr) { state_ = nullptr; } else if (s.state_->is_constant) { diff --git a/cpp/src/arrow/status.h b/cpp/src/arrow/status.h index 81b6175d3ce7d..45d61a63c4f57 100644 --- a/cpp/src/arrow/status.h +++ b/cpp/src/arrow/status.h @@ -137,7 +137,13 @@ class ARROW_EXPORT [[nodiscard]] Status : public util::EqualityComparableis_constant) { + DeleteState(); + } + } + } Status(StatusCode code, const std::string& msg); /// \brief Pluggable constructor for use by sub-systems. detail cannot be null. @@ -361,12 +367,11 @@ class ARROW_EXPORT [[nodiscard]] Status : public util::EqualityComparable detail; bool is_constant = false; - ~State(); }; // OK status has a `NULL` state_. Otherwise, `state_` points to // a `State` structure containing the error code and message(s) @@ -375,11 +380,7 @@ class ARROW_EXPORT [[nodiscard]] Status : public util::EqualityComparableis_constant) { - delete state_; - } - } + delete state_; } void CopyFrom(const Status& s); inline void MoveFrom(Status& s); @@ -388,7 +389,11 @@ class ARROW_EXPORT [[nodiscard]] Status : public util::EqualityComparableis_constant) { + DeleteState(); + } + } state_ = s.state_; s.state_ = NULLPTR; } diff --git a/cpp/src/arrow/status_internal.h b/cpp/src/arrow/status_internal.h index 9474716551ab2..77474e389533f 100644 --- a/cpp/src/arrow/status_internal.h +++ b/cpp/src/arrow/status_internal.h @@ -27,7 +27,8 @@ class StatusConstant { StatusConstant(StatusCode code, std::string msg, std::shared_ptr detail = nullptr) : state_{code, std::move(msg), std::move(detail), /*is_constant=*/true} { - ARROW_CHECK_NE(code, StatusCode::OK) << "Cannot construct ok status constant"; + ARROW_CHECK_NE(code, StatusCode::OK) + << "StatusConstant is not intended for use with OK status codes"; } operator Status() const { // NOLINT(runtime/explicit) From 1be8452216a2ae80e92d5c746f5c4a57e12651e3 Mon Sep 17 00:00:00 2001 From: Benjamin Kietzman Date: Mon, 4 Nov 2024 11:53:42 -0600 Subject: [PATCH 6/8] Pack Struct::State a little with reordered is_constant --- cpp/src/arrow/status.cc | 4 ++-- cpp/src/arrow/status.h | 2 +- cpp/src/arrow/status_internal.h | 2 +- 3 files changed, 4 insertions(+), 4 deletions(-) diff --git a/cpp/src/arrow/status.cc b/cpp/src/arrow/status.cc index de2955de4619e..81f5f88e0f0d1 100644 --- a/cpp/src/arrow/status.cc +++ b/cpp/src/arrow/status.cc @@ -28,7 +28,7 @@ Status::Status(StatusCode code, const std::string& msg) Status::Status(StatusCode code, std::string msg, std::shared_ptr detail) { ARROW_CHECK_NE(code, StatusCode::OK) << "Cannot construct ok status with message"; - state_ = new State{code, std::move(msg), std::move(detail)}; + state_ = new State{code, /*is_constant=*/false, std::move(msg), std::move(detail)}; } void Status::CopyFrom(const Status& s) { @@ -165,7 +165,7 @@ void Status::AddContextLine(const char* filename, int line, const char* expr) { ss << "\n" << filename << ":" << line << " " << expr; if (state_->is_constant) { // We can't add context lines to a StatusConstant's state, so copy it now - state_ = new State{code(), message(), detail()}; + state_ = new State{code(), /*is_constant=*/false, message(), detail()}; } const_cast(state_)->msg += ss.str(); } diff --git a/cpp/src/arrow/status.h b/cpp/src/arrow/status.h index 45d61a63c4f57..a52a3600e434d 100644 --- a/cpp/src/arrow/status.h +++ b/cpp/src/arrow/status.h @@ -369,9 +369,9 @@ class ARROW_EXPORT [[nodiscard]] Status : public util::EqualityComparable detail; - bool is_constant = false; }; // OK status has a `NULL` state_. Otherwise, `state_` points to // a `State` structure containing the error code and message(s) diff --git a/cpp/src/arrow/status_internal.h b/cpp/src/arrow/status_internal.h index 77474e389533f..80e6cd2cd610f 100644 --- a/cpp/src/arrow/status_internal.h +++ b/cpp/src/arrow/status_internal.h @@ -26,7 +26,7 @@ class StatusConstant { public: StatusConstant(StatusCode code, std::string msg, std::shared_ptr detail = nullptr) - : state_{code, std::move(msg), std::move(detail), /*is_constant=*/true} { + : state_{code, /*is_constant=*/true, std::move(msg), std::move(detail)} { ARROW_CHECK_NE(code, StatusCode::OK) << "StatusConstant is not intended for use with OK status codes"; } From d552fa556077f94c415a716bbd6f05928f03f2a4 Mon Sep 17 00:00:00 2001 From: Antoine Pitrou Date: Thu, 14 Nov 2024 15:49:04 +0100 Subject: [PATCH 7/8] Remove const, improve test a bit --- cpp/src/arrow/status.cc | 2 +- cpp/src/arrow/status.h | 2 +- cpp/src/arrow/status_internal.h | 2 +- cpp/src/arrow/status_test.cc | 9 +++++++++ 4 files changed, 12 insertions(+), 3 deletions(-) diff --git a/cpp/src/arrow/status.cc b/cpp/src/arrow/status.cc index 81f5f88e0f0d1..8cbc6842c4bc3 100644 --- a/cpp/src/arrow/status.cc +++ b/cpp/src/arrow/status.cc @@ -167,7 +167,7 @@ void Status::AddContextLine(const char* filename, int line, const char* expr) { // We can't add context lines to a StatusConstant's state, so copy it now state_ = new State{code(), /*is_constant=*/false, message(), detail()}; } - const_cast(state_)->msg += ss.str(); + state_->msg += ss.str(); } #endif diff --git a/cpp/src/arrow/status.h b/cpp/src/arrow/status.h index a52a3600e434d..853fc284ee317 100644 --- a/cpp/src/arrow/status.h +++ b/cpp/src/arrow/status.h @@ -375,7 +375,7 @@ class ARROW_EXPORT [[nodiscard]] Status : public util::EqualityComparable Date: Thu, 14 Nov 2024 16:17:30 +0100 Subject: [PATCH 8/8] Fix unrelated CI failure --- cpp/src/arrow/buffer_test.cc | 9 ++------- 1 file changed, 2 insertions(+), 7 deletions(-) diff --git a/cpp/src/arrow/buffer_test.cc b/cpp/src/arrow/buffer_test.cc index 06ed0bfba0497..4dd210076ed10 100644 --- a/cpp/src/arrow/buffer_test.cc +++ b/cpp/src/arrow/buffer_test.cc @@ -511,13 +511,8 @@ TEST(TestBuffer, CopySliceEmpty) { } TEST(TestBuffer, ToHexString) { - const uint8_t data_array[] = "\a0hex string\xa9"; - std::basic_string data_str = data_array; - - auto data = reinterpret_cast(data_str.c_str()); - - Buffer buf(data, data_str.size()); - + const std::string data_str = "\a0hex string\xa9"; + Buffer buf(data_str); ASSERT_EQ(buf.ToHexString(), std::string("073068657820737472696E67A9")); }