// Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. #pragma once #include #include #include #include #include #include #include namespace arrow::internal { /// Create a vector containing the values from start up to stop template std::vector Iota(T start, T stop) { if (start > stop) { return {}; } std::vector result(static_cast(stop - start)); std::iota(result.begin(), result.end(), start); return result; } /// Create a vector containing the values from 0 up to length template std::vector Iota(T length) { return Iota(static_cast(0), length); } /// Create a range from a callable which takes a single index parameter /// and returns the value of iterator on each call and a length. /// Only iterators obtained from the same range should be compared, the /// behaviour generally similar to other STL containers. template class LazyRange { private: // callable which generates the values // has to be defined at the beginning of the class for type deduction const Generator gen_; // the length of the range int64_t length_; #ifdef _MSC_VER // workaround to VS2010 not supporting decltype properly // see https://stackoverflow.com/questions/21782846/decltype-for-class-member-function static Generator gen_static_; #endif public: #ifdef _MSC_VER using return_type = decltype(gen_static_(0)); #else using return_type = decltype(gen_(0)); #endif /// Construct a new range from a callable and length LazyRange(Generator gen, int64_t length) : gen_(gen), length_(length) {} // Class of the dependent iterator, created implicitly by begin and end class RangeIter { public: using difference_type = int64_t; using value_type = return_type; using reference = const value_type&; using pointer = const value_type*; using iterator_category = std::forward_iterator_tag; #ifdef _MSC_VER // msvc complains about unchecked iterators, // see https://stackoverflow.com/questions/21655496/error-c4996-checked-iterators using _Unchecked_type = typename LazyRange::RangeIter; #endif RangeIter() = delete; RangeIter(const RangeIter& other) = default; RangeIter& operator=(const RangeIter& other) = default; RangeIter(const LazyRange& range, int64_t index) : range_(&range), index_(index) {} const return_type operator*() const { return range_->gen_(index_); } RangeIter operator+(difference_type length) const { return RangeIter(*range_, index_ + length); } // pre-increment RangeIter& operator++() { ++index_; return *this; } // post-increment RangeIter operator++(int) { auto copy = RangeIter(*this); ++index_; return copy; } bool operator==(const typename LazyRange::RangeIter& other) const { return this->index_ == other.index_ && this->range_ == other.range_; } bool operator!=(const typename LazyRange::RangeIter& other) const { return this->index_ != other.index_ || this->range_ != other.range_; } int64_t operator-(const typename LazyRange::RangeIter& other) const { return this->index_ - other.index_; } bool operator<(const typename LazyRange::RangeIter& other) const { return this->index_ < other.index_; } private: // parent range reference const LazyRange* range_; // current index int64_t index_; }; friend class RangeIter; // Create a new begin const iterator RangeIter begin() { return RangeIter(*this, 0); } // Create a new end const iterator RangeIter end() { return RangeIter(*this, length_); } }; /// Helper function to create a lazy range from a callable (e.g. lambda) and length template LazyRange MakeLazyRange(Generator&& gen, int64_t length) { return LazyRange(std::forward(gen), length); } /// \brief A helper for iterating multiple ranges simultaneously, similar to C++23's /// zip() view adapter modelled after python's built-in zip() function. /// /// \code {.cpp} /// const std::vector& tables = ... /// std::function()> GetNames = ... /// for (auto [table, name] : Zip(tables, GetNames())) { /// static_assert(std::is_same_v); /// static_assert(std::is_same_v); /// // temporaries (like this vector of strings) are kept alive for the /// // duration of a loop and are safely movable). /// RegisterTableWithName(std::move(name), &table); /// } /// \endcode /// /// The zipped sequence ends as soon as any of its member ranges ends. /// /// Always use `auto` for the loop's declaration; it will always be a tuple /// of references so for example using `const auto&` will compile but will /// *look* like forcing const-ness even though the members of the tuple are /// still mutable references. /// /// NOTE: we *could* make Zip a more full fledged range and enable things like /// - gtest recognizing it as a container; it currently doesn't since Zip is /// always mutable so this breaks: /// EXPECT_THAT(Zip(std::vector{0}, std::vector{1}), /// ElementsAre(std::tuple{0, 1})); /// - letting it be random access when possible so we can do things like *sort* /// parallel ranges /// - ... /// /// However doing this will increase the compile time overhead of using Zip as /// long as we're still using headers. Therefore until we can use c++20 modules: /// *don't* extend Zip. template struct Zip; template Zip(Ranges&&...) -> Zip, std::index_sequence_for>; template struct Zip, std::index_sequence> { explicit Zip(Ranges... ranges) : ranges_(std::forward(ranges)...) {} std::tuple ranges_; using sentinel = std::tuple(ranges_)))...>; constexpr sentinel end() { return {std::end(std::get(ranges_))...}; } struct iterator : std::tuple(ranges_)))...> { using std::tuple(ranges_)))...>::tuple; constexpr auto operator*() { return std::tuple(*this))...>{*std::get(*this)...}; } constexpr iterator& operator++() { (++std::get(*this), ...); return *this; } constexpr bool operator!=(const sentinel& s) const { bool all_iterators_valid = (... && (std::get(*this) != std::get(s))); return all_iterators_valid; } }; constexpr iterator begin() { return {std::begin(std::get(ranges_))...}; } }; /// \brief A lazy sequence of integers which starts from 0 and never stops. /// /// This can be used in conjunction with Zip() to emulate python's built-in /// enumerate() function: /// /// \code {.cpp} /// const std::vector& tables = ... /// for (auto [i, table] : Zip(Enumerate<>, tables)) { /// std::cout << "#" << i << ": " << table.name() << std::endl; /// } /// \endcode template constexpr auto Enumerate = [] { struct { struct sentinel {}; constexpr sentinel end() const { return {}; } struct iterator { I value{0}; constexpr I operator*() { return value; } constexpr iterator& operator++() { ++value; return *this; } constexpr std::true_type operator!=(sentinel) const { return {}; } }; constexpr iterator begin() const { return {}; } } out; return out; }(); } // namespace arrow::internal