Skip to content

Commit

Permalink
Automerge: [libc++] Optimize ranges::move{,_backward} for vector<bool…
Browse files Browse the repository at this point in the history
…>::iterator (#121109)

As a follow-up to #121013 (which optimized `ranges::copy`) and #121026
(which optimized `ranges::copy_backward`), this PR enhances the
performance of `std::ranges::{move, move_backward}` for
`vector<bool>::iterator`, addressing a subtask outlined in issue #64038.

The optimizations bring performance improvements analogous to those
achieved for the `{copy, copy_backward}` algorithms: up to 2000x for
aligned moves and 60x for unaligned moves. Moreover, comprehensive
tests covering up to 4 storage words (256 bits) with odd and even bit
sizes are provided, which validate the proposed optimizations in this
patch.
  • Loading branch information
winner245 authored and github-actions[bot] committed Feb 19, 2025
2 parents b487d48 + ab3d793 commit 9a005b8
Show file tree
Hide file tree
Showing 10 changed files with 414 additions and 112 deletions.
4 changes: 2 additions & 2 deletions libcxx/docs/ReleaseNotes/21.rst
Original file line number Diff line number Diff line change
Expand Up @@ -43,8 +43,8 @@ Implemented Papers
Improvements and New Features
-----------------------------

- The ``std::ranges::{copy, copy_n, copy_backward}`` algorithms have been optimized for ``std::vector<bool>::iterator``\s,
resulting in a performance improvement of up to 2000x.
- The ``std::ranges::{copy, copy_n, copy_backward, move, move_backward}`` algorithms have been optimized for
``std::vector<bool>::iterator``, resulting in a performance improvement of up to 2000x.

- Updated formatting library to Unicode 16.0.0.

Expand Down
10 changes: 10 additions & 0 deletions libcxx/include/__algorithm/move.h
Original file line number Diff line number Diff line change
Expand Up @@ -9,11 +9,13 @@
#ifndef _LIBCPP___ALGORITHM_MOVE_H
#define _LIBCPP___ALGORITHM_MOVE_H

#include <__algorithm/copy.h>
#include <__algorithm/copy_move_common.h>
#include <__algorithm/for_each_segment.h>
#include <__algorithm/iterator_operations.h>
#include <__algorithm/min.h>
#include <__config>
#include <__fwd/bit_reference.h>
#include <__iterator/iterator_traits.h>
#include <__iterator/segmented_iterator.h>
#include <__type_traits/common_type.h>
Expand Down Expand Up @@ -98,6 +100,14 @@ struct __move_impl {
}
}

// Overload taken when the source range and the destination are all `__bit_iterator`s over the same
// `_Cp`; the source may be const or non-const, the destination must be the non-const flavour.
// The three iterators are forwarded unchanged to `std::__copy` and its result is returned, i.e. a
// move of a bit range is carried out as a copy of that range.
template <class _Cp, bool _IsConst>
_LIBCPP_HIDE_FROM_ABI _LIBCPP_CONSTEXPR_SINCE_CXX20 pair<__bit_iterator<_Cp, _IsConst>, __bit_iterator<_Cp, false> >
operator()(__bit_iterator<_Cp, _IsConst> __first,
__bit_iterator<_Cp, _IsConst> __last,
__bit_iterator<_Cp, false> __result) {
return std::__copy(__first, __last, __result);
}

// At this point, the iterators have been unwrapped so any `contiguous_iterator` has been unwrapped to a pointer.
template <class _In, class _Out, __enable_if_t<__can_lower_move_assignment_to_memmove<_In, _Out>::value, int> = 0>
_LIBCPP_HIDE_FROM_ABI _LIBCPP_CONSTEXPR_SINCE_CXX14 pair<_In*, _Out*>
Expand Down
10 changes: 10 additions & 0 deletions libcxx/include/__algorithm/move_backward.h
Original file line number Diff line number Diff line change
Expand Up @@ -9,10 +9,12 @@
#ifndef _LIBCPP___ALGORITHM_MOVE_BACKWARD_H
#define _LIBCPP___ALGORITHM_MOVE_BACKWARD_H

#include <__algorithm/copy_backward.h>
#include <__algorithm/copy_move_common.h>
#include <__algorithm/iterator_operations.h>
#include <__algorithm/min.h>
#include <__config>
#include <__fwd/bit_reference.h>
#include <__iterator/iterator_traits.h>
#include <__iterator/segmented_iterator.h>
#include <__type_traits/common_type.h>
Expand Down Expand Up @@ -107,6 +109,14 @@ struct __move_backward_impl {
}
}

// Overload taken when the source range and the destination are all `__bit_iterator`s over the same
// `_Cp`; the source may be const or non-const, the destination must be the non-const flavour.
// The three iterators are forwarded unchanged to `std::__copy_backward<_ClassicAlgPolicy>` and its
// result is returned, i.e. a backward move of a bit range is carried out as a backward copy.
template <class _Cp, bool _IsConst>
_LIBCPP_HIDE_FROM_ABI _LIBCPP_CONSTEXPR_SINCE_CXX20 pair<__bit_iterator<_Cp, _IsConst>, __bit_iterator<_Cp, false> >
operator()(__bit_iterator<_Cp, _IsConst> __first,
__bit_iterator<_Cp, _IsConst> __last,
__bit_iterator<_Cp, false> __result) {
return std::__copy_backward<_ClassicAlgPolicy>(__first, __last, __result);
}

// At this point, the iterators have been unwrapped so any `contiguous_iterator` has been unwrapped to a pointer.
template <class _In, class _Out, __enable_if_t<__can_lower_move_assignment_to_memmove<_In, _Out>::value, int> = 0>
_LIBCPP_HIDE_FROM_ABI _LIBCPP_CONSTEXPR_SINCE_CXX14 pair<_In*, _Out*>
Expand Down
16 changes: 0 additions & 16 deletions libcxx/include/__bit_reference
Original file line number Diff line number Diff line change
Expand Up @@ -210,22 +210,6 @@ private:
__mask_(__m) {}
};

// move
//
// `move` overload for `__bit_iterator` ranges. The source iterators may be const or non-const,
// the destination must be a non-const `__bit_iterator`. The call is forwarded unchanged to
// `std::copy`, whose result is returned.

template <class _Cp, bool _IsConst>
inline _LIBCPP_HIDE_FROM_ABI __bit_iterator<_Cp, false>
move(__bit_iterator<_Cp, _IsConst> __first, __bit_iterator<_Cp, _IsConst> __last, __bit_iterator<_Cp, false> __result) {
return std::copy(__first, __last, __result);
}

// move_backward
//
// `move_backward` overload for `__bit_iterator` ranges. The source iterators may be const or
// non-const, the destination must be a non-const `__bit_iterator`. The call is forwarded
// unchanged to `std::copy_backward`, whose result is returned.

template <class _Cp, bool _IsConst>
inline _LIBCPP_HIDE_FROM_ABI __bit_iterator<_Cp, false> move_backward(
__bit_iterator<_Cp, _IsConst> __first, __bit_iterator<_Cp, _IsConst> __last, __bit_iterator<_Cp, false> __result) {
return std::copy_backward(__first, __last, __result);
}

// swap_ranges

template <class _Cl, class _Cr>
Expand Down
71 changes: 71 additions & 0 deletions libcxx/test/benchmarks/algorithms/move.bench.cpp
Original file line number Diff line number Diff line change
@@ -0,0 +1,71 @@
//===----------------------------------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//

// UNSUPPORTED: c++03, c++11, c++14, c++17, c++20

#include <algorithm>
#include <benchmark/benchmark.h>
#include <ranges>
#include <vector>

// Benchmarks std::ranges::move between two std::vector<bool> buffers of state.range() bits each.
//
// aligned == true : the whole source vector is moved to the beginning of the destination.
// aligned == false: the source range starts 4 bits into the source vector (n - 4 bits are moved),
//                   while the destination still starts at its beginning.
//
// The source and destination roles are exchanged after every iteration.
template <bool aligned>
void bm_ranges_move_vb(benchmark::State& state) {
  const auto bit_count = state.range();
  std::vector<bool> buf_a(bit_count, true);
  std::vector<bool> buf_b(bit_count, false);
  benchmark::DoNotOptimize(buf_a);
  benchmark::DoNotOptimize(buf_b);

  std::vector<bool>* src = &buf_a;
  std::vector<bool>* dst = &buf_b;
  for (auto _ : state) {
    if constexpr (!aligned) {
      // Skip the first 4 source bits so source and destination start at different bit offsets.
      benchmark::DoNotOptimize(
          std::ranges::move(std::views::counted(src->begin() + 4, bit_count - 4), std::ranges::begin(*dst)));
    } else {
      benchmark::DoNotOptimize(std::ranges::move(*src, std::ranges::begin(*dst)));
    }

    // Ping-pong the buffers and keep both pointers observable.
    std::swap(src, dst);
    benchmark::DoNotOptimize(src);
    benchmark::DoNotOptimize(dst);
  }
}

// Benchmarks the iterator-based std::move algorithm between two std::vector<bool> buffers of
// state.range() bits each.
//
// aligned == true : [begin, end) of the source is moved to the beginning of the destination.
// aligned == false: [begin + 4, end) of the source is moved to the beginning of the destination.
//
// The source and destination roles are exchanged after every iteration.
template <bool aligned>
void bm_move_vb(benchmark::State& state) {
  const auto bit_count = state.range();
  std::vector<bool> buf_a(bit_count, true);
  std::vector<bool> buf_b(bit_count, false);
  benchmark::DoNotOptimize(buf_a);
  benchmark::DoNotOptimize(buf_b);

  std::vector<bool>* src = &buf_a;
  std::vector<bool>* dst = &buf_b;
  for (auto _ : state) {
    if constexpr (!aligned) {
      // Start 4 bits into the source so source and destination bit offsets differ.
      benchmark::DoNotOptimize(std::move(src->begin() + 4, src->end(), dst->begin()));
    } else {
      benchmark::DoNotOptimize(std::move(src->begin(), src->end(), dst->begin()));
    }

    // Ping-pong the buffers and keep both pointers observable.
    std::swap(src, dst);
    benchmark::DoNotOptimize(src);
    benchmark::DoNotOptimize(dst);
  }
}

// Registration of the std::ranges::move benchmarks. The aligned variant is run over
// Range(8, 1 << 16) plus a dense sweep from 102400 to 204800 in steps of 4096; the unaligned
// variant is run over Range(8, 1 << 20). The smallest size is 8, so `n - 4` in the unaligned
// code path stays positive.
BENCHMARK(bm_ranges_move_vb<true>)
->Name("bm_ranges_move_vb_aligned")
->Range(8, 1 << 16)
->DenseRange(102400, 204800, 4096);
BENCHMARK(bm_ranges_move_vb<false>)->Name("bm_ranges_move_vb_unaligned")->Range(8, 1 << 20);

// Registration of the iterator-based std::move benchmarks, both over Range(8, 1 << 20).
BENCHMARK(bm_move_vb<true>)->Name("bm_move_vb_aligned")->Range(8, 1 << 20);
BENCHMARK(bm_move_vb<false>)->Name("bm_move_vb_unaligned")->Range(8, 1 << 20);

BENCHMARK_MAIN();
71 changes: 71 additions & 0 deletions libcxx/test/benchmarks/algorithms/move_backward.bench.cpp
Original file line number Diff line number Diff line change
@@ -0,0 +1,71 @@
//===----------------------------------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//

// UNSUPPORTED: c++03, c++11, c++14, c++17, c++20

#include <algorithm>
#include <benchmark/benchmark.h>
#include <ranges>
#include <vector>

// Benchmarks std::ranges::move_backward between two std::vector<bool> buffers of state.range()
// bits each.
//
// aligned == true : the whole source vector is moved so that it ends at the end of the destination.
// aligned == false: only the first n - 4 source bits are moved, still ending at the end of the
//                   destination.
//
// The source and destination roles are exchanged after every iteration.
template <bool aligned>
void bm_ranges_move_backward_vb(benchmark::State& state) {
  const auto bit_count = state.range();
  std::vector<bool> buf_a(bit_count, true);
  std::vector<bool> buf_b(bit_count, false);
  benchmark::DoNotOptimize(buf_a);
  benchmark::DoNotOptimize(buf_b);

  std::vector<bool>* src = &buf_a;
  std::vector<bool>* dst = &buf_b;
  for (auto _ : state) {
    if constexpr (!aligned) {
      // The source range stops 4 bits short, so source and destination end at different bit offsets.
      benchmark::DoNotOptimize(
          std::ranges::move_backward(std::views::counted(src->begin(), bit_count - 4), std::ranges::end(*dst)));
    } else {
      benchmark::DoNotOptimize(std::ranges::move_backward(*src, std::ranges::end(*dst)));
    }

    // Ping-pong the buffers and keep both pointers observable.
    std::swap(src, dst);
    benchmark::DoNotOptimize(src);
    benchmark::DoNotOptimize(dst);
  }
}

// Benchmarks the iterator-based std::move_backward algorithm between two std::vector<bool>
// buffers of state.range() bits each.
//
// aligned == true : [begin, end) of the source is moved so that it ends at the destination's end.
// aligned == false: [begin, end - 4) of the source is moved so that it ends at the destination's end.
//
// The source and destination roles are exchanged after every iteration.
template <bool aligned>
void bm_move_backward_vb(benchmark::State& state) {
  const auto bit_count = state.range();
  std::vector<bool> buf_a(bit_count, true);
  std::vector<bool> buf_b(bit_count, false);
  benchmark::DoNotOptimize(buf_a);
  benchmark::DoNotOptimize(buf_b);

  std::vector<bool>* src = &buf_a;
  std::vector<bool>* dst = &buf_b;
  for (auto _ : state) {
    if constexpr (!aligned) {
      // Stop 4 bits before the source's end so source and destination end offsets differ.
      benchmark::DoNotOptimize(std::move_backward(src->begin(), src->end() - 4, dst->end()));
    } else {
      benchmark::DoNotOptimize(std::move_backward(src->begin(), src->end(), dst->end()));
    }

    // Ping-pong the buffers and keep both pointers observable.
    std::swap(src, dst);
    benchmark::DoNotOptimize(src);
    benchmark::DoNotOptimize(dst);
  }
}

// Registration of the std::ranges::move_backward benchmarks. The aligned variant is run over
// Range(8, 1 << 16) plus a dense sweep from 102400 to 204800 in steps of 4096; the unaligned
// variant is run over Range(8, 1 << 20). The smallest size is 8, so `n - 4` in the unaligned
// code path stays positive.
BENCHMARK(bm_ranges_move_backward_vb<true>)
->Name("bm_ranges_move_backward_vb_aligned")
->Range(8, 1 << 16)
->DenseRange(102400, 204800, 4096);
BENCHMARK(bm_ranges_move_backward_vb<false>)->Name("bm_ranges_move_backward_vb_unaligned")->Range(8, 1 << 20);

// Registration of the iterator-based std::move_backward benchmarks, both over Range(8, 1 << 20).
BENCHMARK(bm_move_backward_vb<true>)->Name("bm_move_backward_vb_aligned")->Range(8, 1 << 20);
BENCHMARK(bm_move_backward_vb<false>)->Name("bm_move_backward_vb_unaligned")->Range(8, 1 << 20);

BENCHMARK_MAIN();
Original file line number Diff line number Diff line change
Expand Up @@ -20,6 +20,7 @@
#include <cassert>
#include <iterator>
#include <memory>
#include <vector>

#include "MoveOnly.h"
#include "test_iterators.h"
Expand All @@ -45,15 +46,15 @@ struct Test {
template <class OutIter>
TEST_CONSTEXPR_CXX20 void operator()() {
const unsigned N = 1000;
int ia[N] = {};
int ia[N] = {};
for (unsigned i = 0; i < N; ++i)
ia[i] = i;
ia[i] = i;
int ib[N] = {0};

OutIter r = std::move(InIter(ia), InIter(ia+N), OutIter(ib));
assert(base(r) == ib+N);
OutIter r = std::move(InIter(ia), InIter(ia + N), OutIter(ib));
assert(base(r) == ib + N);
for (unsigned i = 0; i < N; ++i)
assert(ia[i] == ib[i]);
assert(ia[i] == ib[i]);
}
};

Expand All @@ -73,13 +74,13 @@ struct Test1 {
const unsigned N = 100;
std::unique_ptr<int> ia[N];
for (unsigned i = 0; i < N; ++i)
ia[i].reset(new int(i));
ia[i].reset(new int(i));
std::unique_ptr<int> ib[N];

OutIter r = std::move(InIter(ia), InIter(ia+N), OutIter(ib));
assert(base(r) == ib+N);
OutIter r = std::move(InIter(ia), InIter(ia + N), OutIter(ib));
assert(base(r) == ib + N);
for (unsigned i = 0; i < N; ++i)
assert(*ib[i] == static_cast<int>(i));
assert(*ib[i] == static_cast<int>(i));
}
};

Expand All @@ -92,6 +93,28 @@ struct Test1OutIters {
}
};

// Exercises std::move on std::vector<bool> iterators for a vector of N bits that holds an
// alternating pattern (even indices true, odd indices false).
//
// Two cases are checked:
//  - the source range starts at in.begin(), i.e. at the same bit offset as the destination;
//  - the source range starts 4 bits into `in`, so source and destination bit offsets differ.
//
// For each case the moved values and the returned iterator are verified. The second case also
// verifies that the 4 destination bits past the moved range keep their initial value, which
// catches an implementation that writes beyond the end of the output range.
//
// Requires N >= 4. Always returns true so that the call can be wrapped in assert().
TEST_CONSTEXPR_CXX20 bool test_vector_bool(std::size_t N) {
  assert(N >= 4); // the second case skips 4 source bits; `N - 4` would wrap around otherwise

  std::vector<bool> v(N, false);
  for (std::size_t i = 0; i < N; i += 2)
    v[i] = true;

  { // Test move when source and destination start at the same bit offset
    std::vector<bool> in(v);
    std::vector<bool> out(N);
    std::vector<bool>::iterator r = std::move(in.begin(), in.end(), out.begin());
    assert(r == out.end());
    assert(out == v);
  }
  { // Test move when the source starts 4 bits in, so the bit offsets differ
    std::vector<bool> in(v);
    std::vector<bool> out(N);
    std::vector<bool>::iterator r = std::move(in.begin() + 4, in.end(), out.begin());
    assert(r == out.end() - 4);
    for (std::size_t i = 0; i < N - 4; ++i)
      assert(v[i + 4] == out[i]);
    // Only N - 4 bits were moved: the last 4 destination bits must still be false.
    for (std::size_t i = N - 4; i < N; ++i)
      assert(!out[i]);
  }

  return true;
}

TEST_CONSTEXPR_CXX20 bool test() {
types::for_each(types::cpp17_input_iterator_list<int*>(), TestOutIters());
if (TEST_STD_AT_LEAST_23_OR_RUNTIME_EVALUATED)
Expand All @@ -118,7 +141,7 @@ TEST_CONSTEXPR_CXX20 bool test() {
// When non-trivial
{
MoveOnly from[3] = {1, 2, 3};
MoveOnly to[3] = {};
MoveOnly to[3] = {};
std::move(std::begin(from), std::end(from), std::begin(to));
assert(to[0] == MoveOnly(1));
assert(to[1] == MoveOnly(2));
Expand All @@ -127,14 +150,24 @@ TEST_CONSTEXPR_CXX20 bool test() {
// When trivial
{
TrivialMoveOnly from[3] = {1, 2, 3};
TrivialMoveOnly to[3] = {};
TrivialMoveOnly to[3] = {};
std::move(std::begin(from), std::end(from), std::begin(to));
assert(to[0] == TrivialMoveOnly(1));
assert(to[1] == TrivialMoveOnly(2));
assert(to[2] == TrivialMoveOnly(3));
}
}

{ // Test vector<bool>::iterator optimization
assert(test_vector_bool(8));
assert(test_vector_bool(19));
assert(test_vector_bool(32));
assert(test_vector_bool(49));
assert(test_vector_bool(64));
assert(test_vector_bool(199));
assert(test_vector_bool(256));
}

return true;
}

Expand Down
Loading

0 comments on commit 9a005b8

Please sign in to comment.