如何避免std :: vector<>初始化其所有元素？ [英] How can I avoid std::vector<> to initialize all its elements?

查看：616 发布时间：2016/10/23 13:30:40 c++ optimization gcc default-value

本文介绍了如何避免std :: vector<>初始化其所有元素？的处理方法，对大家解决问题具有一定的参考价值，需要的朋友们下面随着小编来一起学习吧！

问题描述

EDIT：我更精确地编辑了问题及其标题。

考虑下列源代码：

  #include< vector> 
 struct xyz {
 xyz（）{} //空构造函数，但编译器不关心
 xyz（const xyz& o）：v（ov）{} 
 xyz& operator =（const xyz& o）{v = o.v; return * this; } 
 int v; //<将被初始化为int（），这意味着0 
}; 
 
 std :: vector< xyz> test（）{
 return std :: vector< xyz>（1024） //将做一个memset（）:-( 
}

我避免了向量<>分配的内存要用其第一个元素的副本进行初始化，这是一个O（n）操作，我宁愿跳过为了速度，因为我的默认构造函数什么都不做？

一个g ++特定的解决方案将做，如果没有通用的存在（但我找不到任何属性这样做）。

EDIT ：生成的代码如下（命令行：arm-elf-g ++ - 4.5 -O3 -S -fno-verbose-asm -o - test.cpp | arm-elf-c ++ filt | grep -vE'^ [[：space：]] + [。@]。* $'）

  test ：
 mov r3，＃0 
 stmfd sp !, {r4，lr} 
 mov r4，r0 
 str r3，[r0，＃0] 
 str r3 ，[r0，＃4] 
 str r3，[r0，＃8] 
 mov r0，＃4096 
 bl运算符new（unsigned long）
 add r1，r0， 4096 
 add r2，r0，＃4080 
 str r0，[r4，＃0] 
 stmib r4，{r0，r1} 
 add r2，r2，＃12 
b .L4 @ 
 .L8：@ 
 add r0，r0，＃4 @ 
 .L4：@ 
 cmp r0，＃0 @填写内存
 movne r3，＃0 @ 
 strne r3，[r0，＃0] @ 
 cmp r0，r2 @ 
 bne .L8 @ 
 str r1，[r4，＃4] 
 mov r0，r4 
 ldmfd sp !, {r4，pc}

EDIT：为了完整起见，下面是x86_64的程序集：

  .globl test ）
 test（）：
 LFB450：
 pushq％rbp 
 LCFI0：
 movq％rsp，％rbp 
 LCFI1：
 rbx 
 LCFI2：
 movq％rdi，％rbx 
 subq $ 8，％rsp 
 LCFI3：
 movq $ 0（％rdi）
 movq $ 0， 8（％rdi）
 movq $ 0，16（％rdi）
 movl $ 4096，％edi 
调用操作符new（unsigned long）
 leaq 4096（％rax），％rcx 
 movq％rax，（％rbx）
 movq％rax，8（％rbx）
 leaq 4092（％rax），％rdx 
 movq％rcx，16 ）
 jmp L4 @ 
 L8：@ 
 addq $ 4，％rax @ 
 L4：@ 
 testq％rax，％rax @ memory-filling loop 
 je L2 @ 
 movl $ 0，（％rax）@ 
 L2：@ 
 cmpq％rdx，％rax @ 
 jne L8 @ 
 movq％rcx，8 （％rbx）
 movq％rbx，％rax 
 addq $ 8，％rsp 
 popq％rbx 
 leave 
 LCFI4：
 ret 
 LFE450：
 EH_frame1：
 LSCIE1：
 LECIE1：
 LSFDE1：
 LASFDE1：
 LEFDE1：

EDIT：我认为结论是不要使用 std :: vector<> 当你想避免不必要的初始化。我最后展开了我自己的模板容器，它执行得更好（并有氖和armv7的专门版本）。

解决方案

的分配的元素由Allocator模板参数控制，如果您需要定制它，请自定义它。但请记住，这可以很容易地结束在肮脏的黑客的领域，所以谨慎使用。例如，这里是一个很脏的解决方案。它将避免初始化，但它最可能会更糟的性能，但为了示范的缘故（因为人们说这是不可能的...不可能不是一个C ++程序员的词汇！）：

  template< typename T> 
 class switch_init_allocator：public std :: allocator< T> {
 private：
 bool * should_init; 
 public：
 template< typename U> 
 struct rebind {
 typedef switch_init_allocator< U>其他; 
}; 
 
 //提供所需的no-throw构造函数/析构函数：
 switch_init_allocator（bool * aShouldInit = NULL）throw（）：std :: allocator< xyz>（），should_init（aShouldInit） {}; 
 switch_init_allocator（const switch_init_allocator< T>&rhs）throw（）：std :: allocator< T>（rhs），should_init（rhs.should_init）{}; 
 template< typename U> 
 switch_init_allocator（const switch_init_allocator< U>& rhs，bool * aShouldInit = NULL）throw（）：std :: allocator< T>（rhs），should_init（aShouldInit）{}; 
〜switch_init_allocator（）throw（）{}; 
 
 //导入所需的typedefs：
 typedef typename std :: allocator< T> :: value_type value_type; 
 typedef typename std :: allocator< T> :: pointer pointer; 
 typedef typename std :: allocator< T> :: reference reference; 
 typedef typename std :: allocator< T> :: const_pointer const_pointer; 
 typedef typename std :: allocator< T> :: const_reference const_reference; 
 typedef typename std :: allocator< T> :: size_type size_type; 
 typedef typename std :: allocator< T> :: difference_type difference_type; 
 
 //重新定义构造函数（隐藏基类版本）：
 void construct（pointer p，const_reference）{
 if（（should_init）&& * should_init））
 new（（void *）p）T（const_reference）; 
 // else，do nothing。 
}; 
}; 
 
 template< typename T> 
 class my_vector：public std :: vector< T，switch_init_allocator< T> > {
 public：
 typedef switch_init_allocator< T> allocator_type; 
 typedef std :: vector< T，allocator_type> vector_type; 
 typedef base_type :: size_type size_type; 
 private：
 bool switch_flag; //这里的顺序非常重要！ 
 vector_type vec; 
 public：
 my_vector（size_type aCount）：switch_flag（false），vec（aCount，allocator_type（& switch_flag））{}; 
 // ...和这个包装类的其余部分... 
 vector_type& get_vector（）{return vec; }; 
 const vector_type& get_vector（）const {return vec; }; 
 void set_switch（bool value）{switch_flag = value; }; 
}; 
 
 int main（）{
 my_vector< xyz> v（1024）。 //这将不会初始化内存。 
 v.set_switch（true）; //设置为true以重新启动初始化（需要调整大小等）
 return 0; 
};

当然，上面是尴尬，不推荐，肯定不会比实际让内存充满第一个元素的副本（特别是因为使用这个标志检查将阻碍每个元素的构造）。但是，它是一个探索当寻求优化在STL容器中的元素的分配和初始化时的一个途径，所以我想展示它。关键是，你可以注入代码，停止std :: vector容器调用复制构造函数来初始化你的元素是在向量的allocator对象的构造函数中。

此外，你可以取消switch，只需要做一个no-init-allocator，然后，你还关闭在调整大小时复制数据所需的拷贝构造将使这个向量类更不有用）。

EDIT: I edited both the question and its title to be more precise.

Considering the following source code:

#include <vector>
struct xyz {
    xyz() { } // empty constructor, but the compiler doesn't care
    xyz(const xyz& o): v(o.v) { } 
    xyz& operator=(const xyz& o) { v=o.v; return *this; }
    int v; // <will be initialized to int(), which means 0
};

std::vector<xyz> test() {
    return std::vector<xyz>(1024); // will do a memset() :-(
}

...how can I avoid the memory allocated by the vector<> to be initialized with copies of its first element, which is a O(n) operation I'd rather skip for the sake of speed, since my default constructor does nothing ?

A g++ specific solution will do, if no generic one exists (but I couldn't find any attribute to do that).

EDIT: generated code follows (command line: arm-elf-g++-4.5 -O3 -S -fno-verbose-asm -o - test.cpp | arm-elf-c++filt | grep -vE '^[[:space:]]+[.@].*$' )

test():
    mov r3, #0
    stmfd   sp!, {r4, lr}
    mov r4, r0
    str r3, [r0, #0]
    str r3, [r0, #4]
    str r3, [r0, #8]
    mov r0, #4096
    bl  operator new(unsigned long)
    add r1, r0, #4096
    add r2, r0, #4080
    str r0, [r4, #0]
    stmib   r4, {r0, r1}
    add r2, r2, #12
    b       .L4          @
.L8:                     @
    add     r0, r0, #4   @
.L4:                     @
    cmp     r0, #0       @  fill the memory
    movne   r3, #0       @
    strne   r3, [r0, #0] @
    cmp     r0, r2       @
    bne     .L8          @
    str r1, [r4, #4]
    mov r0, r4
    ldmfd   sp!, {r4, pc}

EDIT: For the sake of completeness, here is the assembly for x86_64:

.globl test()
test():
LFB450:
    pushq   %rbp
LCFI0:
    movq    %rsp, %rbp
LCFI1:
    pushq   %rbx
LCFI2:
    movq    %rdi, %rbx
    subq    $8, %rsp
LCFI3:
    movq    $0, (%rdi)
    movq    $0, 8(%rdi)
    movq    $0, 16(%rdi)
    movl    $4096, %edi
    call    operator new(unsigned long)
    leaq    4096(%rax), %rcx
    movq    %rax, (%rbx)
    movq    %rax, 8(%rbx)
    leaq    4092(%rax), %rdx
    movq    %rcx, 16(%rbx)
    jmp     L4          @
L8:                     @
    addq    $4, %rax    @
L4:                     @
    testq   %rax, %rax  @ memory-filling loop
    je      L2          @
    movl    $0, (%rax)  @
L2:                     @
    cmpq    %rdx, %rax  @
    jne     L8          @
    movq    %rcx, 8(%rbx)
    movq    %rbx, %rax
    addq    $8, %rsp
    popq    %rbx
    leave
LCFI4:
    ret
LFE450:
EH_frame1:
LSCIE1:
LECIE1:
LSFDE1:
LASFDE1:
LEFDE1:

EDIT: I think the conclusion is to not use std::vector<> when you want to avoid unneeded initialization. I ended up unrolling my own templated container, which performs better (and has specialized versions for neon and armv7).

解决方案

The initialization of the elements allocated is controlled by the Allocator template argument, if you need it customized, customize it. But remember that this can get easily wind-up in the realm of dirty hacking, so use with caution. For instance, here is a pretty dirty solution. It will avoid the initialization, but it most probably will be worse in performance, but for demonstration's sake (as people have said this is impossible!... impossible is not in a C++ programmer's vocabulary!):

template <typename T>
class switch_init_allocator : public std::allocator< T > {
  private:
    bool* should_init;
  public:
    template <typename U>
    struct rebind {
      typedef switch_init_allocator<U> other;
    };

    //provide the required no-throw constructors / destructors:
    switch_init_allocator(bool* aShouldInit = NULL) throw() : std::allocator<xyz>(), should_init(aShouldInit) { };
    switch_init_allocator(const switch_init_allocator<T>& rhs) throw() : std::allocator<T>(rhs), should_init(rhs.should_init) { };
    template <typename U>
    switch_init_allocator(const switch_init_allocator<U>& rhs, bool* aShouldInit = NULL) throw() : std::allocator<T>(rhs), should_init(aShouldInit) { };
    ~switch_init_allocator() throw() { };

    //import the required typedefs:
    typedef typename std::allocator<T>::value_type value_type;
    typedef typename std::allocator<T>::pointer pointer;
    typedef typename std::allocator<T>::reference reference;
    typedef typename std::allocator<T>::const_pointer const_pointer;
    typedef typename std::allocator<T>::const_reference const_reference;
    typedef typename std::allocator<T>::size_type size_type;
    typedef typename std::allocator<T>::difference_type difference_type;

    //redefine the construct function (hiding the base-class version):
    void construct( pointer p, const_reference ) {
      if((should_init) && (*should_init))
        new ((void*)p) T ( const_reference );
      //else, do nothing.
    };
};

template <typename T>
class my_vector : public std::vector<T, switch_init_allocator<T> > {
  public:
    typedef switch_init_allocator<T> allocator_type;
    typedef std::vector<T, allocator_type > vector_type;
    typedef base_type::size_type size_type;
  private:
    bool switch_flag; //the order here is very important!!
    vector_type vec;
  public:  
    my_vector(size_type aCount) : switch_flag(false), vec(aCount, allocator_type(&switch_flag)) { };
    //... and the rest of this wrapper class...
    vector_type& get_vector() { return vec; };
    const vector_type& get_vector() const { return vec; };
    void set_switch(bool value) { switch_flag = value; };
};

int main() {
  my_vector<xyz> v(1024); //this won't initialize the memory at all.
  v.set_switch(true); //set back to true to turn initialization back on (needed for resizing and such)
  return 0;
};

Of course, the above is awkward and not recommended, and certainly won't be any better than actually letting the memory get filled with copies of the first element (especially since the use of this flag-checking will impede on each element-construction). But it is an avenue to explore when looking to optimize the allocation and initialization of elements in an STL container, so I wanted to show it. The point is that the only place you can inject code that will stop the std::vector container from calling the copy-constructor to initialize your elements is in the construct function of the vector's allocator object.

Also, you could do away with the "switch" and simply do a "no-init-allocator", but then, you also turn off copy-construction which is needed to copy the data during resizing (which would make this vector class much less useful).

这篇关于如何避免std :: vector<>初始化其所有元素？的文章就介绍到这了，希望我们推荐的答案对大家有所帮助，也希望大家多多支持IT屋！

查看全文

如何避免std :: vector<>初始化其所有元素？ [英] How can I avoid std::vector<> to initialize all its elements?

问题描述

相关文章

C/C++开发最新文章

热门教程

热门工具

登录关闭

如何避免std :: vector&lt;&gt;初始化其所有元素？ [英] How can I avoid std::vector&lt;&gt; to initialize all its elements?

问题描述

相关文章

C/C++开发最新文章

热门教程

热门工具

登录 关闭

如何避免std :: vector<>初始化其所有元素？ [英] How can I avoid std::vector<> to initialize all its elements?

登录关闭