libc ++中短字符串优化的机制是什么？

// short string: (s)ize and 3 bytes of char (d)atasssssss0;dddddddd;dddddddd;dddddddd ^- is_long = 0// long string: (c)apacityccccccc1;cccccccc;cccccccc;cccccccc ^- is_long = 1

在libc中++实现有点复杂，我会忽略它的替代性设计，并假设小端计算机：template <...>class basic_string {/* many many things */    struct __long    {        size_type __cap_;        size_type __size_;        pointer   __data_;    };    enum {__short_mask = 0x01};    enum {__long_mask  = 0x1ul};    enum {__min_cap = (sizeof(__long) - 1)/sizeof(value_type) > 2 ?                      (sizeof(__long) - 1)/sizeof(value_type) : 2};    struct __short    {        union        {            unsigned char __size_;            value_type __lx;        };        value_type __data_[__min_cap];    };    union __ulx{__long __lx; __short __lxx;};    enum {__n_words = sizeof(__ulx) / sizeof(size_type)};    struct __raw    {        size_type __words[__n_words];    };    struct __rep    {        union        {            __long  __l;            __short __s;            __raw   __r;        };    };    __compressed_pair<__rep, allocator_type> __r_;}; // basic_string注意：__compressed_pair基本上是针对空基优化而优化的一对，又称template <T1, T2> struct __compressed_pair: T1, T2 {};; 对于所有意图和目的，你可以认为它是一个常规对。它的重要性刚刚出现，因为它std::allocator是无国籍的，因此是空的。好的，这是相当原始的，所以让我们检查一下这些机制！在内部，许多函数将调用__get_pointer()自己调用__is_long以确定字符串是否使用__long或__short表示：bool __is_long() const _NOEXCEPT    { return bool(__r_.first().__s.__size_ & __short_mask); }// __r_.first() -> __rep const&//     .__s     -> __short const&//     .__size_ -> unsigned char说实话，我不太确定这是标准C ++（我知道最初的子序列规定，union但不知道它是如何与匿名联合和别名一起抛出的），但是允许标准库利用定义的实现无论如何。

libc ++中短字符串优化的机制是什么？

2回答