// Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. #pragma once #include #include #include #include #include #include #include #include #include #include #include "arrow/array/builder_binary.h" #include "arrow/array/builder_primitive.h" #include "arrow/result.h" #include "arrow/status.h" #include "arrow/testing/gtest_compat.h" #include "arrow/testing/util.h" #include "arrow/testing/visibility.h" #include "arrow/type_fwd.h" #include "arrow/type_traits.h" #include "arrow/util/bit_util.h" #include "arrow/util/macros.h" // NOTE: failing must be inline in the macros below, to get correct file / line number // reporting on test failures. #define ASSERT_RAISES(ENUM, expr) \ do { \ auto _res = (expr); \ ::arrow::Status _st = ::arrow::internal::GenericToStatus(_res); \ if (!_st.Is##ENUM()) { \ FAIL() << "Expected '" ARROW_STRINGIFY(expr) "' to fail with " ARROW_STRINGIFY( \ ENUM) ", but got " \ << _st.ToString(); \ } \ } while (false) #define ASSERT_RAISES_WITH_MESSAGE(ENUM, message, expr) \ do { \ auto _res = (expr); \ ::arrow::Status _st = ::arrow::internal::GenericToStatus(_res); \ if (!_st.Is##ENUM()) { \ FAIL() << "Expected '" ARROW_STRINGIFY(expr) "' to fail with " ARROW_STRINGIFY( \ ENUM) ", but got " \ << _st.ToString(); \ } \ ASSERT_EQ((message), _st.ToString()); \ } while (false) #define EXPECT_RAISES_WITH_MESSAGE_THAT(ENUM, matcher, expr) \ do { \ auto _res = (expr); \ ::arrow::Status _st = ::arrow::internal::GenericToStatus(_res); \ if (!_st.Is##ENUM()) { \ FAIL() << "Expected '" ARROW_STRINGIFY(expr) "' to fail with " ARROW_STRINGIFY( \ ENUM) ", but got " \ << _st.ToString(); \ } \ EXPECT_THAT(_st.ToString(), (matcher)); \ } while (false) #define ASSERT_OK(expr) \ do { \ auto _res = (expr); \ ::arrow::Status _st = ::arrow::internal::GenericToStatus(_res); \ if (!_st.ok()) { \ FAIL() << "'" ARROW_STRINGIFY(expr) "' failed with " << _st.ToString(); \ } \ } while (false) #define ASSERT_OK_NO_THROW(expr) ASSERT_NO_THROW(ASSERT_OK(expr)) #define ARROW_EXPECT_OK(expr) \ do { \ auto _res = (expr); \ ::arrow::Status _st = ::arrow::internal::GenericToStatus(_res); \ EXPECT_TRUE(_st.ok()) << "'" ARROW_STRINGIFY(expr) "' failed with " \ << _st.ToString(); \ } while (false) #define ABORT_NOT_OK(expr) \ do { \ auto _res = (expr); \ ::arrow::Status _st = ::arrow::internal::GenericToStatus(_res); \ if (ARROW_PREDICT_FALSE(!_st.ok())) { \ _st.Abort(); \ } \ } while (false); #define ASSIGN_OR_HANDLE_ERROR_IMPL(handle_error, status_name, lhs, rexpr) \ auto&& status_name = (rexpr); \ handle_error(status_name.status()); \ lhs = std::move(status_name).ValueOrDie(); #define ASSERT_OK_AND_ASSIGN(lhs, rexpr) \ ASSIGN_OR_HANDLE_ERROR_IMPL( \ ASSERT_OK, ARROW_ASSIGN_OR_RAISE_NAME(_error_or_value, __COUNTER__), lhs, rexpr); #define ASSIGN_OR_ABORT(lhs, rexpr) \ ASSIGN_OR_HANDLE_ERROR_IMPL(ABORT_NOT_OK, \ ARROW_ASSIGN_OR_RAISE_NAME(_error_or_value, __COUNTER__), \ lhs, rexpr); #define EXPECT_OK_AND_ASSIGN(lhs, rexpr) \ ASSIGN_OR_HANDLE_ERROR_IMPL(ARROW_EXPECT_OK, \ ARROW_ASSIGN_OR_RAISE_NAME(_error_or_value, __COUNTER__), \ lhs, rexpr); #define ASSERT_OK_AND_EQ(expected, expr) \ do { \ ASSERT_OK_AND_ASSIGN(auto _actual, (expr)); \ ASSERT_EQ(expected, _actual); \ } while (0) namespace arrow { // ---------------------------------------------------------------------- // Useful testing::Types declarations using NumericArrowTypes = ::testing::Types; using RealArrowTypes = ::testing::Types; using IntegralArrowTypes = ::testing::Types; using TemporalArrowTypes = ::testing::Types; class Array; class ChunkedArray; class RecordBatch; class Table; struct Datum; ARROW_TESTING_EXPORT std::vector AllTypeIds(); #define ASSERT_ARRAYS_EQUAL(lhs, rhs) AssertArraysEqual((lhs), (rhs)) #define ASSERT_BATCHES_EQUAL(lhs, rhs) AssertBatchesEqual((lhs), (rhs)) #define ASSERT_BATCHES_APPROX_EQUAL(lhs, rhs) AssertBatchesApproxEqual((lhs), (rhs)) #define ASSERT_TABLES_EQUAL(lhs, rhs) AssertTablesEqual((lhs), (rhs)) // If verbose is true, then the arrays will be pretty printed ARROW_TESTING_EXPORT void AssertArraysEqual(const Array& expected, const Array& actual, bool verbose = false); ARROW_TESTING_EXPORT void AssertArraysApproxEqual( const Array& expected, const Array& actual, bool verbose = false, const EqualOptions& option = EqualOptions::Defaults()); // Returns true when values are both null ARROW_TESTING_EXPORT void AssertScalarsEqual( const Scalar& expected, const Scalar& actual, bool verbose = false, const EqualOptions& options = EqualOptions::Defaults()); ARROW_TESTING_EXPORT void AssertScalarsApproxEqual( const Scalar& expected, const Scalar& actual, bool verbose = false, const EqualOptions& options = EqualOptions::Defaults()); ARROW_TESTING_EXPORT void AssertBatchesEqual(const RecordBatch& expected, const RecordBatch& actual, bool check_metadata = false); ARROW_TESTING_EXPORT void AssertBatchesApproxEqual(const RecordBatch& expected, const RecordBatch& actual); ARROW_TESTING_EXPORT void AssertChunkedEqual(const ChunkedArray& expected, const ChunkedArray& actual); ARROW_TESTING_EXPORT void AssertChunkedEqual(const ChunkedArray& actual, const ArrayVector& expected); // Like ChunkedEqual, but permits different chunk layout ARROW_TESTING_EXPORT void AssertChunkedEquivalent(const ChunkedArray& expected, const ChunkedArray& actual); ARROW_TESTING_EXPORT void AssertBufferEqual(const Buffer& buffer, const std::vector& expected); ARROW_TESTING_EXPORT void AssertBufferEqual(const Buffer& buffer, const std::string& expected); ARROW_TESTING_EXPORT void AssertBufferEqual(const Buffer& buffer, const Buffer& expected); ARROW_TESTING_EXPORT void AssertTypeEqual(const DataType& lhs, const DataType& rhs, bool check_metadata = false); ARROW_TESTING_EXPORT void AssertTypeEqual(const std::shared_ptr& lhs, const std::shared_ptr& rhs, bool check_metadata = false); ARROW_TESTING_EXPORT void AssertFieldEqual(const Field& lhs, const Field& rhs, bool check_metadata = false); ARROW_TESTING_EXPORT void AssertFieldEqual(const std::shared_ptr& lhs, const std::shared_ptr& rhs, bool check_metadata = false); ARROW_TESTING_EXPORT void AssertSchemaEqual(const Schema& lhs, const Schema& rhs, bool check_metadata = false); ARROW_TESTING_EXPORT void AssertSchemaEqual(const std::shared_ptr& lhs, const std::shared_ptr& rhs, bool check_metadata = false); ARROW_TESTING_EXPORT void AssertTypeNotEqual(const DataType& lhs, const DataType& rhs, bool check_metadata = false); ARROW_TESTING_EXPORT void AssertTypeNotEqual(const std::shared_ptr& lhs, const std::shared_ptr& rhs, bool check_metadata = false); ARROW_TESTING_EXPORT void AssertFieldNotEqual(const Field& lhs, const Field& rhs, bool check_metadata = false); ARROW_TESTING_EXPORT void AssertFieldNotEqual(const std::shared_ptr& lhs, const std::shared_ptr& rhs, bool check_metadata = false); ARROW_TESTING_EXPORT void AssertSchemaNotEqual(const Schema& lhs, const Schema& rhs, bool check_metadata = false); ARROW_TESTING_EXPORT void AssertSchemaNotEqual(const std::shared_ptr& lhs, const std::shared_ptr& rhs, bool check_metadata = false); ARROW_TESTING_EXPORT Result> PrintArrayDiff( const ChunkedArray& expected, const ChunkedArray& actual); ARROW_TESTING_EXPORT void AssertTablesEqual(const Table& expected, const Table& actual, bool same_chunk_layout = true, bool flatten = false); ARROW_TESTING_EXPORT void AssertDatumsEqual(const Datum& expected, const Datum& actual, bool verbose = false); template void AssertNumericDataEqual(const C_TYPE* raw_data, const std::vector& expected_values) { for (auto expected : expected_values) { ASSERT_EQ(expected, *raw_data); ++raw_data; } } ARROW_TESTING_EXPORT void CompareBatch(const RecordBatch& left, const RecordBatch& right, bool compare_metadata = true); ARROW_TESTING_EXPORT void ApproxCompareBatch(const RecordBatch& left, const RecordBatch& right, bool compare_metadata = true); // Check if the padding of the buffers of the array is zero. // Also cause valgrind warnings if the padding bytes are uninitialized. ARROW_TESTING_EXPORT void AssertZeroPadded(const Array& array); // Check if the valid buffer bytes are initialized // and cause valgrind warnings otherwise. ARROW_TESTING_EXPORT void TestInitialized(const Array& array); template void FinishAndCheckPadding(BuilderType* builder, std::shared_ptr* out) { ASSERT_OK_AND_ASSIGN(*out, builder->Finish()); AssertZeroPadded(**out); TestInitialized(**out); } #define DECL_T() typedef typename TestFixture::T T; #define DECL_TYPE() typedef typename TestFixture::Type Type; // ArrayFromJSON: construct an Array from a simple JSON representation ARROW_TESTING_EXPORT std::shared_ptr ArrayFromJSON(const std::shared_ptr&, util::string_view json); ARROW_TESTING_EXPORT std::shared_ptr DictArrayFromJSON(const std::shared_ptr& type, util::string_view indices_json, util::string_view dictionary_json); ARROW_TESTING_EXPORT std::shared_ptr RecordBatchFromJSON(const std::shared_ptr&, util::string_view); ARROW_TESTING_EXPORT std::shared_ptr ChunkedArrayFromJSON(const std::shared_ptr&, const std::vector& json); ARROW_TESTING_EXPORT std::shared_ptr TableFromJSON(const std::shared_ptr&, const std::vector& json); // ArrayFromVector: construct an Array from vectors of C values template void ArrayFromVector(const std::shared_ptr& type, const std::vector& is_valid, const std::vector& values, std::shared_ptr* out) { auto type_id = TYPE::type_id; ASSERT_EQ(type_id, type->id()) << "template parameter and concrete DataType instance don't agree"; std::unique_ptr builder_ptr; ASSERT_OK(MakeBuilder(default_memory_pool(), type, &builder_ptr)); // Get the concrete builder class to access its Append() specializations auto& builder = dynamic_cast::BuilderType&>(*builder_ptr); for (size_t i = 0; i < values.size(); ++i) { if (is_valid[i]) { ASSERT_OK(builder.Append(values[i])); } else { ASSERT_OK(builder.AppendNull()); } } ASSERT_OK(builder.Finish(out)); } template void ArrayFromVector(const std::shared_ptr& type, const std::vector& values, std::shared_ptr* out) { auto type_id = TYPE::type_id; ASSERT_EQ(type_id, type->id()) << "template parameter and concrete DataType instance don't agree"; std::unique_ptr builder_ptr; ASSERT_OK(MakeBuilder(default_memory_pool(), type, &builder_ptr)); // Get the concrete builder class to access its Append() specializations auto& builder = dynamic_cast::BuilderType&>(*builder_ptr); for (size_t i = 0; i < values.size(); ++i) { ASSERT_OK(builder.Append(values[i])); } ASSERT_OK(builder.Finish(out)); } // Overloads without a DataType argument, for parameterless types template void ArrayFromVector(const std::vector& is_valid, const std::vector& values, std::shared_ptr* out) { auto type = TypeTraits::type_singleton(); ArrayFromVector(type, is_valid, values, out); } template void ArrayFromVector(const std::vector& values, std::shared_ptr* out) { auto type = TypeTraits::type_singleton(); ArrayFromVector(type, values, out); } // ChunkedArrayFromVector: construct a ChunkedArray from vectors of C values template void ChunkedArrayFromVector(const std::shared_ptr& type, const std::vector>& is_valid, const std::vector>& values, std::shared_ptr* out) { ArrayVector chunks; ASSERT_EQ(is_valid.size(), values.size()); for (size_t i = 0; i < values.size(); ++i) { std::shared_ptr array; ArrayFromVector(type, is_valid[i], values[i], &array); chunks.push_back(array); } *out = std::make_shared(chunks); } template void ChunkedArrayFromVector(const std::shared_ptr& type, const std::vector>& values, std::shared_ptr* out) { ArrayVector chunks; for (size_t i = 0; i < values.size(); ++i) { std::shared_ptr array; ArrayFromVector(type, values[i], &array); chunks.push_back(array); } *out = std::make_shared(chunks); } // Overloads without a DataType argument, for parameterless types template void ChunkedArrayFromVector(const std::vector>& is_valid, const std::vector>& values, std::shared_ptr* out) { auto type = TypeTraits::type_singleton(); ChunkedArrayFromVector(type, is_valid, values, out); } template void ChunkedArrayFromVector(const std::vector>& values, std::shared_ptr* out) { auto type = TypeTraits::type_singleton(); ChunkedArrayFromVector(type, values, out); } template static inline Status GetBitmapFromVector(const std::vector& is_valid, std::shared_ptr* result) { size_t length = is_valid.size(); ARROW_ASSIGN_OR_RAISE(auto buffer, AllocateEmptyBitmap(length)); uint8_t* bitmap = buffer->mutable_data(); for (size_t i = 0; i < static_cast(length); ++i) { if (is_valid[i]) { BitUtil::SetBit(bitmap, i); } } *result = buffer; return Status::OK(); } template inline void BitmapFromVector(const std::vector& is_valid, std::shared_ptr* out) { ASSERT_OK(GetBitmapFromVector(is_valid, out)); } template void AssertSortedEquals(std::vector u, std::vector v) { std::sort(u.begin(), u.end()); std::sort(v.begin(), v.end()); ASSERT_EQ(u, v); } ARROW_TESTING_EXPORT void SleepFor(double seconds); template std::vector IteratorToVector(Iterator iterator) { EXPECT_OK_AND_ASSIGN(auto out, iterator.ToVector()); return out; } // A RAII-style object that switches to a new locale, and switches back // to the old locale when going out of scope. Doesn't do anything if the // new locale doesn't exist on the local machine. // ATTENTION: may crash with an assertion failure on Windows debug builds. // See ARROW-6108, also https://gerrit.libreoffice.org/#/c/54110/ class ARROW_TESTING_EXPORT LocaleGuard { public: explicit LocaleGuard(const char* new_locale); ~LocaleGuard(); protected: class Impl; std::unique_ptr impl_; }; class ARROW_TESTING_EXPORT EnvVarGuard { public: EnvVarGuard(const std::string& name, const std::string& value); ~EnvVarGuard(); protected: const std::string name_; std::string old_value_; bool was_set_; }; #ifndef ARROW_LARGE_MEMORY_TESTS #define LARGE_MEMORY_TEST(name) DISABLED_##name #else #define LARGE_MEMORY_TEST(name) name #endif } // namespace arrow namespace nonstd { namespace sv_lite { // Without this hint, GTest will print string_views as a container of char template > void PrintTo(const basic_string_view& view, std::ostream* os) { *os << view; } } // namespace sv_lite namespace optional_lite { template void PrintTo(const optional& opt, std::ostream* os) { if (opt.has_value()) { *os << "{"; ::testing::internal::UniversalPrint(*opt, os); *os << "}"; } else { *os << "nullopt"; } } inline void PrintTo(const decltype(nullopt)&, std::ostream* os) { *os << "nullopt"; } } // namespace optional_lite } // namespace nonstd