RetroSearch Browse

++] = 0 + sub_octet;

461

bits[

++] = 1 + sub_octet;

464

bits[

] = 0 + sub_octet;

465

bits[

+1] = 1 + sub_octet;

469

bits[

++] = 2 + sub_octet;

472

bits[

+0] = 0 + sub_octet;

473

bits[

+1] = 2 + sub_octet;

477

bits[

+0] = 1 + sub_octet;

478

bits[

+1] = 2 + sub_octet;

482

bits[

+0] = 0 + sub_octet;

483

bits[

+1] = 1 + sub_octet;

484

bits[

+2] = 2 + sub_octet;

488

bits[

++] = 3 + sub_octet;

491

bits[

+0] = 0 + sub_octet;

492

bits[

+1] = 3 + sub_octet;

496

bits[

+0] = 1 + sub_octet;

497

bits[

+1] = 3 + sub_octet;

501

bits[

+0] = 0 + sub_octet;

502

bits[

+1] = 1 + sub_octet;

503

bits[

+2] = 3 + sub_octet;

507

bits[

+0] = 2 + sub_octet;

508

bits[

+1] = 3 + sub_octet;

512

bits[

+0] = 0 + sub_octet;

513

bits[

+1] = 2 + sub_octet;

514

bits[

+2] = 3 + sub_octet;

518

bits[

+0] = 1 + sub_octet;

519

bits[

+1] = 2 + sub_octet;

520

bits[

+2] = 3 + sub_octet;

524

bits[

+0] = 0 + sub_octet;

525

bits[

+1] = 1 + sub_octet;

526

bits[

+2] = 2 + sub_octet;

527

bits[

+3] = 3 + sub_octet;

537 #ifdef BM_NONSTANDARD_EXTENTIONS 545 unsigned

bitscan_nibble_gcc(

unsigned

* bits)

BMNOEXCEPT 547 static void

* d_table[] = { &&l0,

548

&&l1, &&l3_1, &&l3, &&l7_1, &&l5, &&l7_0, &&l7, &&l15_1,

549

&&l9, &&l11_0, &&l11, &&l15_0, &&l13, &&l14, &&l15 };

552 for

(

unsigned

sub_octet = 0; w; w >>= 4, sub_octet+=4)

554 goto

*d_table[w & 15];

556

bits[

++] = sub_octet;

559

bits[

++] = sub_octet;

561

bits[

++] = 1 + sub_octet;

564

bits[

++] = sub_octet;

567

bits[

++] = sub_octet;

569

bits[

++] = 1 + sub_octet;

571

bits[

++] = 2 + sub_octet;

574

bits[

++] = sub_octet;

578

bits[

++] = sub_octet;

580

bits[

++] = 1 + sub_octet;

581

bits[

++] = 3 + sub_octet;

584

bits[

++] = sub_octet;

587

bits[

++] = 1 + sub_octet;

590

bits[

++] = 0 + sub_octet;

591

bits[

++] = 1 + sub_octet;

593

bits[

++] = 2 + sub_octet;

595

bits[

++] = 3 + sub_octet;

608 template

typename

622 bp_

[0] = (

)bit_idx0;

[1] = (

)bit_idx1;

630 bp_

[0] = (

)bit_idx0;

[1] = (

)bit_idx1;

[2] = (

)bit_idx2;

639 bp_

[0] = (

)bit_idx0;

[1] = (

)bit_idx1;

640 bp_

[2] = (

)bit_idx2;

[3] = (

)bit_idx3;

663

dest[nword] |= unsigned(1u << nbit);

676

dest[nword] &= ~(unsigned(1u << nbit));

690 return

(block[nword] >> nbit) & 1u;

704 template

typename

709 return

(

unsigned

)(func.

ptr

() - bits);

722 template

typename

727 return

(

unsigned

)(func.

ptr

() - bits);

740 template

typename

751 return

(

unsigned short

)pos;

763 template

typename

773 return

(

unsigned short

)pos;

784 template

typename

787 unsigned short

pos = 0;

806 template

typename

809 unsigned short

pos = 0;

818 template

typename

OT>

821 unsigned short

pos = 0;

839 template

typename

842 unsigned short

pos = 0;

860 template

typename

864 unsigned short

pos = 0;

878 template

typename

882 #if (defined(__arm__) || defined(__aarch64__)) 883 if

constexpr (

sizeof

(V) == 8)

888 if

constexpr (

sizeof

(V) == 8)

914 for

(

unsigned count

= 0; w; w >>=1ull, ++

)

916

rank -= unsigned(w & 1ull);

1006 unsigned t

= w & -w;

1050 #if defined(BMI2_SELECT64) 1051 return

BMI2_SELECT64(w, rank);

1053 #if defined(BMI1_SELECT64) 1054 return

BMI2_SELECT64(w, rank);

1056 #if (defined(__arm__) || defined(__aarch64__)) 1077 #if defined(BMI2_SELECT64) 1078 return

BMI2_SELECT64(w, rank);

1080 #if defined(BMI1_SELECT64) 1081 return

BMI2_SELECT64(w, rank);

1083 #if (defined(__arm__) || defined(__aarch64__)) 1120 for

(

unsigned i

= from;

<= to; ++

)

1121

m |= (1ull << (

/ 1024));

1143

((~0ull) >> (63 - (digest_to - digest_from))) << digest_from;

1165 unsigned

bitpos_from,

unsigned

bitpos_to)

BMNOEXCEPT 1168 return

!(digest &

);

1185 bool

curr = digest &

;

1186 if

(curr && curr !=

)

1204 for

(

unsigned i

= 0;

< 64; ++

)

1209 #if defined(VECT_BLOCK_SET_DIGEST) 1214

block[off] = block[off+1] = block[off+2] = block[off+3] =

;

1235 for

(

unsigned i

= 0;

< 64; ++

)

1238 #if defined(VECT_IS_DIGEST_ZERO) 1245 bm::word_t

w = block[off+j+0] | block[off+j+1] |

1246

block[off+j+2] | block[off+j+3];

1249

digest0 |= (

);

1285 #if defined(VECT_IS_DIGEST_ZERO) 1287

digest &= all_zero ? ~(

<< wave) : digest;

1296

src_u->w64[j+0] | src_u->w64[j+1] | src_u->w64[j+2] | src_u->w64[j+3];

1299

digest &= w64 ? digest : ~(

<< wave);

1326 unsigned

t_wave = 0;

1341 for

(; sub_block < sub_block_end; t_sub_block+=4, sub_block+=4)

1343

t_sub_block[0] = sub_block[0];

1344

t_sub_block[1] = sub_block[1];

1345

t_sub_block[2] = sub_block[2];

1346

t_sub_block[3] = sub_block[3];

1363 for

(; t_sub_block < t_sub_block_end; t_sub_block+=4)

1393 unsigned

s_wave = 0;

1400 const bm::word_t

* sub_block = block + s_off;

1407 for

(; sub_block < sub_block_end; t_sub_block+=4, sub_block+=4)

1409

t_sub_block[0] = sub_block[0];

1410

t_sub_block[1] = sub_block[1];

1411

t_sub_block[2] = sub_block[2];

1412

t_sub_block[3] = sub_block[3];

1423 for

(; t_sub_block < t_sub_block_end; t_sub_block+=4)

1425

t_sub_block[0] = 0; t_sub_block[1] = 0;

1426

t_sub_block[2] = 0; t_sub_block[3] = 0;

1442 return

(

int

(op) >=

int

(

set_COUNT

));

1475

::memset(_p, 0xFF,

sizeof

(_p));

1476 if

constexpr (

sizeof

(

void

*) == 8)

1478 const unsigned long long

magic_mask = 0xFFFFfffeFFFFfffe;

1479

::memcpy(&_p_fullp, &magic_mask,

sizeof

(magic_mask));

1481

_s[

] =

reinterpret_cast<bm::word_t

>

(magic_mask);

1485 const unsigned

magic_mask = 0xFFFFfffe;

1486

::memcpy(&_p_fullp, &magic_mask,

sizeof

(magic_mask));

1488

_s[

] =

reinterpret_cast<bm::word_t

>

(magic_mask);

1499 if

constexpr (

sizeof

(

void

*) == 8)

1501 bm::id64_t

w =

reinterpret_cast<unsigned long long>

(bp);

1508 unsigned

w =

reinterpret_cast<unsigned long>

(bp);

1536 template

typename

1545 const unsigned

unroll_factor = 4;

1546 const unsigned len

= (

- start);

1547 const unsigned

len_unr =

- (

% unroll_factor);

1551 for

(k = 0; k < len_unr; k+=unroll_factor)

1562

*pos = k + start + 1;

1567

*pos = k + start + 2;

1572

*pos = k + start + 3;

1578 for

(; k <

; ++k)

1587 for

(; start <

; ++start)

1617 int

res = (w1 & 1) - (w2 & 1);

1618 if

(res != 0)

return

res;

1645 return

diff? ( (

& diff & -diff)? 1 : -1 ) : 0;

1662 #if defined(VECT_IS_ZERO_BLOCK) 1669 if

(blk[0] | blk[1] | blk[2] | blk[3])

1672

}

while

(blk < blk_end);

1727 template

typename

1731 return

glevel_len[(*

>> 1) & 3];

1743 template

typename

1747 return

glevel_len[(*

>> 1) & 3]-4;

1758 template

typename

1761 return T

((*

>> 1) & 3u);

1775 template

typename

1781 T

is_set = (*buf) & 1u;

1782 T

end =

((*

) >> 3u);

1786

is_set ^=

((end-1) & 1u);

1806 template

typename

1812 T

is_set = (*buf) & 1u;

1834 template

typename

1840 #if defined(VECT_GAP_BFIND) 1844 unsigned

end = ((*buf) >> 3);

1846 unsigned size

= end - start;

1847 for

(;

>= 64;

= end - start)

1849 unsigned

mid = (start + end) >> 1;

1850 if

(

[mid] < pos)

1854 if

(

[mid = (start + end) >> 1] < pos)

1858 if

(

[mid = (start + end) >> 1] < pos)

1862 if

(

[mid = (start + end) >> 1] < pos)

1868 for

(;

>= 16;

= end - start)

1870 if

(

unsigned

mid = (start + end) >> 1;

[mid] < pos)

1874 if

(

unsigned

mid = (start + end) >> 1;

[mid] < pos)

1880 for

(;

true

; ++start)

1881 if

(

[start] >= pos)

1884

*is_set = ((*buf) & 1) ^ ((start-1) & 1);

1899 template

typename

1905 unsigned

end = 1 + ((*buf) >> 3);

1906 if

(end - start < 10)

1908 unsigned

sv = *

& 1;

1909 unsigned

sv1= sv ^ 1;

1910 if

(

[1] >= pos)

return

sv;

1911 if

(

[2] >= pos)

return

sv1;

1912 if

(

[3] >= pos)

return

sv;

1913 if

(

[4] >= pos)

return

sv1;

1914 if

(

[5] >= pos)

return

sv;

1915 if

(

[6] >= pos)

return

sv1;

1916 if

(

[7] >= pos)

return

sv;

1917 if

(

[8] >= pos)

return

sv1;

1926 if

(

unsigned

mid = (start + end) >> 1;

[mid] < pos)

1930

}

while

(start != end);

1932 return

((*

) & 1) ^ ((--start) & 1);

1942 template

typename

1948 #if defined(VECT_GAP_TEST) 1960 template

typename

1965 if

(nb_from > nb_to)

1972 if

(i_from >= top_size)

1974 if

(i_to >= top_size)

1976

i_to = unsigned(top_size-1);

1980 for

(

unsigned i

= i_from;

<= i_to; ++

)

1982 T

** blk_blk = root[

];

1987 unsigned

j = (

== i_from) ? j_from : 0;

1988 if

(!j && (

!= i_to))

1995 if

((

== i_to) && (j == j_to))

2002 unsigned

j = (

== i_from) ? j_from : 0;

2007 if

((

== i_to) && (j == j_to))

2017 template

class

2020 typedef typename

F::size_type size_type;

2021 for

(

unsigned i

= 0;

< size1; ++

)

2023 T

** blk_blk = root[

];

2026 f

.on_empty_top(

);

2029 f

.on_non_empty_top(

);

2041 unsigned

non_empty_top = 0;

2046 #if defined(BM64_AVX2) || defined(BM64_AVX512) 2050 T

* blk0 = blk_blk[j + 0];

2051 T

* blk1 = blk_blk[j + 1];

2052 T

* blk2 = blk_blk[j + 2];

2053 T

* blk3 = blk_blk[j + 3];

2055

size_type block_idx =

+ j + 0;

2057 f

(blk0, block_idx);

2059 f

.on_empty_block(block_idx);

2062 f

(blk1, block_idx + 1);

2064 f

.on_empty_block(block_idx + 1);

2067 f

(blk2, block_idx + 2);

2069 f

.on_empty_block(block_idx + 2);

2072 f

(blk3, block_idx + 3);

2074 f

.on_empty_block(block_idx + 3);

2078 f

.on_empty_block(

+ j + 0);

.on_empty_block(

+ j + 1);

2079 f

.on_empty_block(

+ j + 2);

.on_empty_block(

+ j + 3);

2082 #elif defined(BM64_SSE4) 2086 T

* blk0 = blk_blk[j + 0];

2087 T

* blk1 = blk_blk[j + 1];

2089

size_type block_idx =

+ j + 0;

2091 f

(blk0, block_idx);

2093 f

.on_empty_block(block_idx);

2097 f

(blk1, block_idx);

2099 f

.on_empty_block(block_idx);

2103 f

.on_empty_block(

+ j + 0);

2104 f

.on_empty_block(

+ j + 1);

2110 f

(blk_blk[j],

+ j);

2114 f

.on_empty_block(

+ j);

2119 if

(non_empty_top == 0)

2120 f

.on_empty_top(

);

2126 template

class

2130 for

(

unsigned i

= 0;

< size1; ++

)

2133 if

((blk_blk = root[

])!=0)

2150 T

* blk0 = blk_blk[j + 0];

2151 T

* blk1 = blk_blk[j + 1];

2161 T

* blk0 = blk_blk[j + 2];

2162 T

* blk1 = blk_blk[j + 3];

2172 #elif defined(BM64_AVX2) || defined(BM64_AVX512) 2173 for

(

unsigned i

= 0;

< size1; ++

)

2176 if

((blk_blk = root[

]) != 0)

2189

__m256i w0 = _mm256_loadu_si256((__m256i*)(blk_blk + j));

2190 if

(!_mm256_testz_si256(w0, w0))

2194 T

* blk0 = blk_blk[j + 0];

2195 T

* blk1 = blk_blk[j + 1];

2196 T

* blk2 = blk_blk[j + 2];

2197 T

* blk3 = blk_blk[j + 3];

2213 for

(

unsigned i

= 0;

< size1; ++

)

2216 if

((blk_blk = root[

])!=0)

2248 template

typename

BI,

typename

2252 for

(BI

= 0;

< size1; ++

)

2254 T

** blk_blk = root[

];

2273 if

(

(blk_blk[j], block_idx))

2282 template

class

typename

BLOCK_IDX>

2285

BLOCK_IDX block_idx = start;

2286 for

(

unsigned i

= 0;

< size1; ++

)

2288 T

** blk_blk = root[

];

2301 f

(blk_blk[j], block_idx);

2330 template

typename

2349 template

typename

2358 for

(

unsigned i

= 1;

< arr_len; ++

)

2388 template

typename

2395 if

(arr_len <= wlen)

2397 unsigned

min_w_prev = ~0u;

2399 for

(

unsigned i

= 1;

< wlen; ++

)

2403

min_w_prev =

;

2405

min_w_prev -=

(min_w_prev);

2409 for

(

unsigned i

= wlen;

< arr_len; ++wave,

+=wlen)

2411 if

(

+ wlen > arr_len)

2413 unsigned r

= arr_len % wlen;

2418 unsigned

min_w = ~0u;

2419 for

(

unsigned

j = 0; j < wlen; ++j)

2424 if

(

<= min_w_prev)

2432 if

(min_w_prev && (min_w > min0))

2439

min_w_prev = (min_w > min0) ? min_w - 1 : min0;

2449 template

typename

2460 T

min_w_prev =

(~0u);

2462 for

(

unsigned i

= 1;

< wlen; ++

)

2467

min_w_prev =

;

2471

tarr[

] =

[

] - min0 - delta_acc;

2475

min_w_prev -=

(min_w_prev);

2478 for

(

unsigned

wave = 1,

=wlen;

< arr_len;

+=wlen, ++wave)

2480 if

(

+ wlen > arr_len)

2482 unsigned r

= arr_len % wlen;

2488 for

(

unsigned

j = 0; j < wlen; ++j)

2497

tarr[

+j] =

[

+j] - min_w_prev - delta_acc;

2498

delta_acc += min_w_prev;

2502

tarr[

+j] =

[

+j] - min0 - delta_acc;

2507

min_w_prev = (min_w > min0) ? min_w - 1 : min0;

2516 template

typename

2526 unsigned

min_w_prev = ~0u;

2528 for

(

unsigned i

= 1;

< wlen; ++

)

2531 arr

[

] += min0 + delta_acc;

2537

min_w_prev =

;

2541

min_w_prev -=

(min_w_prev);

2545 for

(

unsigned i

= wlen;

< arr_len; ++wave,

+=wlen)

2547 if

(

+ wlen > arr_len)

2549 unsigned r

= arr_len % wlen;

2554 unsigned

min_w = ~0u;

2555 for

(

unsigned

j = 0; j < wlen; ++j)

2559 arr

[

+j] += (

)(min_w_prev + delta_acc);

2560

delta_acc += (

)min_w_prev;

2564 arr

[

+j] += min0 + delta_acc;

2571

min_w_prev = (min_w > min0) ? min_w - 1 : min0;

2583 template

typename

2585 unsigned

* hist,

unsigned

hist_len)

BMNOEXCEPT 2588 for

(

unsigned i

= 1;

< arr_len; ++

)

2594 if

(

< hist_len)

2604 template

typename

2606 T

* arr_dst,

unsigned

& dst_len,

2607 const T

unsigned

arr_len,

2612

d1_len = dst_len = 0;

2613

arr_dst[dst_len] =

[dst_len];

2616 for

(

unsigned i

= 1;

< arr_len; ++

)

2620 if

(

<= ex_max_delta)

2621

arr_d1[d1_len++] =

[

];

2623

arr_dst[dst_len++] =

[

];

2631 template

typename

2634

tarr[0] =

[0] - delta_acc;

2635 for

(

unsigned i

= 1;

< arr_len; ++

)

2637

tarr[

] =

[

] - min0 - delta_acc;

2647 template

typename

2650 arr

[0] =

[0] + delta_acc;

2651 for

(

unsigned i

= 1;

< arr_len; ++

)

2653 arr

[

] += min0 + delta_acc;

2665 template

typename

2668 const T

* pcurr =

;

2669 auto

dsize = (*pcurr >> 3);

2671 const T

* pend = pcurr + dsize;

2676 for

(++pcurr; pcurr <= pend; pcurr++)

2678 T delta

= *pcurr - *(pcurr-1);

2684 delta

= *pcurr - *(pcurr-1);

2702 template

typename

2704 unsigned

* hist0,

unsigned

* hist1,

unsigned

hist_len

2707 const T

* pcurr =

;

2710 unsigned

is_set = (*pcurr & 1u);

2712 const T

* pend = pcurr + dsize;

2716 if

(

< hist_len)

2721 for

(++pcurr; pcurr <= pend; pcurr++, is_set ^= 1u)

2723 delta

= *pcurr - *(pcurr-1);

2724 if

(

< hist_len)

2728

++pcurr; is_set ^= 1u;

2731 delta

= *pcurr - *(pcurr-1);

2732 if

(

< hist_len)

2741 template

typename

2790 template

typename

2793 const unsigned

* hist0,

const unsigned

* hist1,

2794 T

* tbuf,

* ex0_arr,

* ex1_arr,

2795 unsigned

& ex0_cnt,

unsigned

& ex1_cnt)

BMNOEXCEPT 2797 bool

ex0_first =

true

;

2798

ex0_cnt = ex1_cnt = 0;

2799 unsigned

dsize =

;

2801

::memcpy(tbuf,

, (1+dsize) *

sizeof

(

));

2804 for

(

T i

= 1;

< h_limit; ++

)

2806 unsigned

ex0_cnt_s {ex0_cnt}, ex1_cnt_s {ex1_cnt};

2808 bool

h0_flag{0}, h1_flag{0};

2809 if

(hist0[

] < hist1[

])

2819 if

(hist0[

] == 0)

2823 const T

* pcurr = tbuf+1;

2824

dsize = (*tbuf >> 3);

2825 const T

* pend = pcurr + dsize;

2826 unsigned

is_set = (*tbuf & 1u);

2829 if

(

&& !is_set)

2830 for

(

unsigned

j = 0; j <= *pcurr; ++j)

2831

ex0_arr[ex0_cnt++] = (

)j;

2832 for

(++pcurr, is_set ^= 1u; pcurr <= pend; ++pcurr,is_set ^= 1u)

2834 delta

= *pcurr - *(pcurr-1);

2835 if

(

&& !is_set)

2836 for

(

unsigned

j = *(pcurr-1)+1; j <= *pcurr; ++j)

2837

ex0_arr[ex0_cnt++] = (

)j;

2839

++pcurr; is_set ^= 1u;

2842 delta

= *pcurr - *(pcurr-1);

2843 if

(

&& !is_set)

2844 for

(

unsigned

j = *(pcurr-1)+1; j <= *pcurr; ++j)

2845

ex0_arr[ex0_cnt++] = (

)j;

2848 auto

new_len = dsize;

2849 for

(

unsigned

k = ex0_cnt_s; k < ex0_cnt; ++k)

2867 if

(hist1[

] == 0)

2871 const T

* pcurr = tbuf+1;

2873 const T

* pend = pcurr + (*tbuf >> 3);

2874 unsigned

is_set = (*tbuf & 1u);

2877 if

(

&& is_set)

2878 for

(

unsigned

j = 0; j <= *pcurr; ++j)

2879

ex1_arr[ex1_cnt++] = (

)j;

2881 for

(++pcurr; pcurr <= pend; ++pcurr,is_set ^= 1u)

2883 delta

= *pcurr - *(pcurr-1);

2884 if

(

&& is_set)

2885 for

(

unsigned

j = *(pcurr-1)+1; j <= *pcurr; ++j)

2886

ex1_arr[ex1_cnt++] = (

)j;

2888

++pcurr; is_set ^= 1u;

2891 delta

= *pcurr - *(pcurr-1);

2892 if

(

&& is_set)

2893 for

(

unsigned

j = *(pcurr-1)+1; j <= *pcurr; ++j)

2894

ex1_arr[ex1_cnt++] = (

)j;

2897 auto

new_len = dsize;

2898 for

(

unsigned

k = ex1_cnt_s; k < ex1_cnt; ++k)

2904 BM_ASSERT

(dsize >= new_len); (void) new_len;

2925 unsigned

ex_limit,

unsigned

* ex_sum)

BMNOEXCEPT 2930 for

(

= 0; (

< hist_len) && (*ex_sum < ex_limit); ++

)

2932

*ex_sum += hist0[

] + hist1[

];

2945 template

typename

2948 const T

* pcurr =

;

2949 auto

dsize = (*pcurr >> 3);

2950 const T

* pend = pcurr + dsize;

2957 T prev

= *tcurr = (*pcurr - min0); (void)

;

2961 for

(; pcurr <= pend; )

2972 prev

= *tcurr = *pcurr - min1 - delta_acc;

2979 prev

= *tcurr = *pcurr - min0 - delta_acc;

2999 template

typename

3003 auto

dsize = (*pcurr >> 3);

3004 const T

* pend = pcurr + dsize;

3008

*pcurr = (*pcurr + min0);

3011 for

(++pcurr; pcurr <= pend; )

3019

*pcurr = *pcurr + min1 + delta_acc;

3024

*pcurr = *pcurr + min0 + delta_acc;

3042 template

typename

3045 const T

* pcurr =

;

3047

dsize = (*pcurr >> 3);

3048 const T

* pend = pcurr + dsize;

3053 for

(; pcurr <= pend; pcurr++)

3069 template

typename

3072 const T

* pcurr =

;

3074

dsize = (*pcurr >> 3);

3076 const T

* pend = pcurr + dsize;

3078 unsigned

bits_counter = 0;

3083

bits_counter += *pcurr + 1;

3086 for

(++pcurr; pcurr <= pend; pcurr += 2)

3087

bits_counter += *pcurr - *(pcurr-1);

3088 return

bits_counter;

3097 template

typename

3100 const T

* pcurr =

;

3101 unsigned

dsize = (*pcurr >> 3);

3105 T

first_one = *

& 1;

3113 #if defined(BMAVX2OPT) || defined(BMAVX512OPT) 3116 const unsigned

unr_factor = 32;

3117 unsigned

waves = (dsize-2) / unr_factor;

3120 #elif defined(BMSSE42OPT) || defined(BMSSE2OPT) 3123 const unsigned

unr_factor = 16;

3124 unsigned

waves = (dsize - 2) / unr_factor;

3130 const unsigned

unr_factor = 8;

3131 unsigned

waves = (dsize - 2) / unr_factor;

3132 for

(

unsigned i

= 0;

< waves;

+= unr_factor)

3134 cnt

+= pcurr[0] - pcurr[0 - 1];

3135 cnt

+= pcurr[2] - pcurr[2 - 1];

3136 cnt

+= pcurr[4] - pcurr[4 - 1];

3137 cnt

+= pcurr[6] - pcurr[6 - 1];

3139

pcurr += unr_factor;

3144 const T

* pend =

+ dsize;

3145 for

( ; pcurr <= pend ; pcurr+=2)

3146 cnt

+= *pcurr - *(pcurr - 1);

3163 template

typename

bool

RIGHT_END = false>

3170 unsigned

is_set, bits_counter, prev_gap;

3172

is_set = ~(is_set - 1u);

3174 const T

* pcurr =

+ start_pos;

3175 if

(right <= *pcurr)

3176

bits_counter = unsigned(right - left + 1u) & is_set;

3179

bits_counter = unsigned(*pcurr - left + 1u) & is_set;

3180 if

constexpr (RIGHT_END)

3183 for

(prev_gap = *pcurr++ ;

true

; prev_gap = *pcurr++)

3185

bits_counter += (is_set ^= ~0u) & (*pcurr - prev_gap);

3192 for

(prev_gap = *pcurr++; right > *pcurr; prev_gap = *pcurr++)

3193

bits_counter += (is_set ^= ~0u) & (*pcurr - prev_gap);

3194

bits_counter += unsigned(right - prev_gap) & (is_set ^ ~0u);

3197 return

bits_counter;

3206 template

typename

3208 const unsigned

start_pos,

3211 unsigned

is_set_c, pos;

3213 bool r

= (pos == (start_pos) &&

bool

(is_set) ==

(is_set_c));

3214 BM_ASSERT

(

bool

(is_set) ==

bool

(is_set_c));

3230 template

typename

3232 unsigned

left,

unsigned

right,

unsigned

hint)

BMNOEXCEPT 3237 unsigned

is_set, bits_counter, prev_gap;

3241

is_set = ~(is_set - 1u);

3242 unsigned

start_pos = hint >> 1;

3254 const T

* pcurr =

+ start_pos;

3255 if

(right <= *pcurr)

3256

bits_counter = unsigned(right - left + 1u) & is_set;

3259

bits_counter = unsigned(*pcurr - left + 1u) & is_set;

3260 for

(prev_gap = *pcurr++; right > *pcurr; prev_gap = *pcurr++)

3261

bits_counter += (is_set ^= ~0u) & (*pcurr - prev_gap);

3262

bits_counter += unsigned(right - prev_gap) & (is_set ^ ~0u);

3264 return

bits_counter;

3276 template

typename

3287 const T

const

pcurr =

+ start_pos;

3288 return

(right <= *pcurr);

3299 template

typename

3308 const T

const

pcurr =

+ start_pos;

3312 if

(right <= *pcurr)

3328 template

typename

3339 const T

* pcurr =

+ start_pos;

3340 if

(!is_set || (right != *pcurr) || (start_pos <= 1))

3343 if

(*pcurr != left-1)

3357 template

typename

3368

*pos =

[start_pos];

3382 template

typename

3397

*pos =

[start_pos]+1;

3410 template

typename

3428

*pos =

[start_pos];

3447 template

typename

SIZE_TYPE>

3456 const T

* pcurr = block;

3457 const T

* pend = pcurr + (*pcurr >> 3);

3459 unsigned

bits_counter = 0;

3461 unsigned

start_pos =

bm::gap_bfind

(block, nbit_from, &is_set);

3462

is_set = ~(is_set - 1u);

3464

pcurr = block + start_pos;

3465

bits_counter += unsigned(*pcurr - nbit_from + 1u) & is_set;

3466 if

(bits_counter >= rank)

3468

nbit_pos = nbit_from + unsigned(rank) - 1u;

3471

rank -= bits_counter;

3472 unsigned

prev_gap = *pcurr++;

3473 for

(is_set ^= ~0u; pcurr <= pend; is_set ^= ~0u)

3475

bits_counter = (*pcurr - prev_gap) & is_set;

3476 if

(bits_counter >= rank)

3478

nbit_pos = prev_gap + unsigned(rank);

3481

rank -= bits_counter;

3482

prev_gap = *pcurr++;

3489 template

typename

bool

TCORRECT=false>

3494 unsigned

bits_counter, prev_gap;

3496 unsigned

is_set = ~((unsigned(*

) & 1u) - 1u);

3497 const T

* pcurr =

+ 1;

3498 if

(right <= *pcurr)

3500

bits_counter = (right + 1u) & is_set;

3504

bits_counter = (*pcurr + 1u) & is_set;

3505

prev_gap = *pcurr++;

3506 for

(is_set ^= ~0u; right > *pcurr; is_set ^= ~0u, prev_gap = *pcurr++)

3508

bits_counter += (*pcurr - prev_gap) & is_set;

3512

bits_counter += (right - prev_gap) & is_set;

3516 if

constexpr (TCORRECT)

3517

bits_counter -= (is_set & unsigned(TCORRECT));

3518 return

bits_counter;

3532 template

class

Func>

3535 const T

* pcurr = gap_buf;

3536 const T

* pend = pcurr + (*pcurr >> 3);

3540

func((

)(

+ 1));

3544

func((

)(*pcurr -

));

3546

}

while

(++pcurr < pend);

3573 template

typename

3579

*dgap_buf++ = *gap_buf;

3583

for_each_dgap<T, d_copy_func<T> >(gap_buf, copy_func);

3599 template

typename

3603 const T

* pcurr = dgap_buf;

3608

*gap_buf++ = *pcurr++;

3612 len

= gap_header >> 3;

3613

*gap_buf++ = gap_header;

3616 const T

* pend = pcurr +

;

3618

*gap_buf = *pcurr++;

3622

*gap_buf =

(*gap_buf - 1);

3624 for

(++gap_buf; pcurr < pend; ++pcurr)

3626 T prev

= *(gap_buf-1);

3627

*gap_buf++ =

(*pcurr +

);

3641 template

typename

3644 const T

* pcurr1 = buf1;

3645 const T

* pend1 = pcurr1 + (*pcurr1 >> 3);

3646 unsigned

bitval1 = *buf1 & 1;

3649 const T

* pcurr2 = buf2;

3650 unsigned

bitval2 = *buf2 & 1;

3653 while

(pcurr1 <= pend1)

3655 if

(*pcurr1 == *pcurr2)

3657 if

(bitval1 != bitval2)

3659 return

(bitval1) ? 1 : -1;

3664 if

(bitval1 == bitval2)

3668 return

(*pcurr1 < *pcurr2) ? -1 : 1;

3672 return

(*pcurr1 < *pcurr2) ? 1 : -1;

3677 return

(bitval1) ? 1 : -1;

3697 template

typename

3704 const T

* pcurr1 = buf1;

3705 const T

* pend1 = pcurr1 + (*pcurr1 >> 3);

3706 const T

* pcurr2 = buf2;

3707 for

(++pcurr1, ++pcurr2; pcurr1 <= pend1; ++pcurr1, ++pcurr2)

3709 if

(*pcurr1 != *pcurr2)

3711

*pos = 1 + ((*pcurr1 < *pcurr2) ? *pcurr1 : *pcurr2);

3737 template

typename

class

3740 unsigned

vect1_mask,

3742 unsigned

vect2_mask,

3745 const T

* cur1 = vect1;

3746 const T

* cur2 = vect2;

3748 T

bitval1 = (

)((*cur1++ & 1) ^ vect1_mask);

3749 T

bitval2 = (

)((*cur2++ & 1) ^ vect2_mask);

3751 T

bitval = (

) F::op(bitval1, bitval2);

3752 T

bitval_prev = bitval;

3758 T

c1 = *cur1;

c2 = *cur2;

3761

bitval = (

) F::op(bitval1, bitval2);

3766

res += (bitval != bitval_prev);

3767

bitval_prev = bitval;

3787

bitval1 ^= 1; bitval2 ^= 1;

3793

dlen = (unsigned)(res - dest);

3794

*dest = (

)((*dest & 7) + (dlen << 3));

3812 template

typename

class

3814 unsigned

vect1_mask,

3818 const T

* cur1 = vect1;

3819 const T

* cur2 = vect2;

3821 unsigned

bitval1 = (*cur1++ & 1) ^ vect1_mask;

3822 unsigned

bitval2 = (*cur2++ & 1) ^ vect2_mask;

3824 unsigned

bitval = F::op(bitval1, bitval2);

3827 unsigned

bitval_prev = bitval;

3831

bitval = F::op(bitval1, bitval2);

3835 if

(bitval != bitval_prev)

3836

bitval_prev = bitval;

3856

bitval1 ^= 1; bitval2 ^= 1;

3877 template

typename

class

3881 const T

* cur1 = vect1;

3882 const T

* cur2 = vect2;

3884 unsigned

bitval1 = (*cur1++ & 1);

3885 unsigned

bitval2 = (*cur2++ & 1);

3886 unsigned

bitval =

= F::op(bitval1, bitval2);

3887 unsigned

bitval_prev = bitval;

3894

bitval = F::op(bitval1, bitval2);

3897 if

(bitval != bitval_prev)

3899

bitval_prev = bitval;

3908 count

+= res - res_prev;

3911

++cur1; bitval1 ^= 1;

3918 count

+= res - res_prev;

3931

bitval1 ^= 1; bitval2 ^= 1;

3943 #pragma GCC diagnostic push 3944 #pragma GCC diagnostic ignored "-Wconversion" 3961 template

typename

3968 T

end = (

)(*

>> 3);

3969 if

(*is_set ==

)

3976 T

* pcurr =

+ curr;

3977 T

* pprev = pcurr - 1;

3978 T

* pend =

+ end;

3993

pprev =

+ 1; pcurr = pprev + 1;

3998 if

(curr > 1 && ((

unsigned

)(*pprev))+1 == pos)

4001 if

(*pprev == *pcurr)

4009 do

{ *pprev++ = *pcurr++; }

while

(pcurr < pend);

4017

end += (pcurr == pend);

4022 ::memmove

(pcurr+2, pcurr, (end - curr + 1)*(

sizeof

(

)));

4024

pcurr[0] = (

)(pos-1);

4025

pcurr[1] = (

)pos;

4029

= (

)((*

& 7) + (end << 3));

4047 template

typename

4074 template

typename

4082 T

end = (

) (*

>> 3);

4086 T

* pcurr =

+ curr;

4087 T

* pprev = pcurr - 1;

4088 T

* pend =

+ end;

4103

pprev =

+ 1; pcurr = pprev + 1;

4108 if

(curr > 1 && ((

unsigned

)(*pprev))+1 == pos)

4111 if

(*pprev == *pcurr)

4119 do

{ *pprev++ = *pcurr++; }

while

(pcurr < pend);

4127

end += (pcurr == pend);

4132 ::memmove

(pcurr+2, pcurr, (end - curr + 1)*(

sizeof

(

)));

4134

pcurr[0] = (

)(pos-1);

4135

pcurr[1] = (

)pos;

4139

= (

)((*

& 7) + (end << 3));

4152 template

typename

4157 T

end = (

)(*

>> 3);

4159 T

* pcurr =

+ end;

4161 T

* pprev = pcurr - 1;

4176

pprev =

+ 1; pcurr = pprev + 1;

4178 do

{ *pprev++ = *pcurr++; }

while

(pcurr < pend);

4181 else if

(((

unsigned

)(*pprev))+1 == pos && (curr > 1) )

4184 if

(*pprev == *pcurr)

4190 else if

(*pcurr == pos)

4193

end += (pcurr == pend);

4197

pcurr[0] = (

)(pos-1);

4198

pcurr[1] = (

)pos;

4203

= (

)((*

& 7) + (end << 3));

4209 #pragma GCC diagnostic pop 4222 template

typename

4229 bool

co, gap_set_flag;

4230 unsigned len

= (*

>> 3);

4233 unsigned

bitval = *

& 1;

4234

gap_set_flag = (bitval != co_flag);

4240 for

(;

; ++

)

4275 template

typename

4282 bool

co, gap_set_flag;

4287

gap_set_flag = (

!= is_set);

4288 unsigned len

= (*

>> 3);

4298 for

(;

; ++

)

4331 template

typename

4342 unsigned

bitval = *

& 1;

4364 unsigned len

= (*

>> 3);

4366 for

(;

; ++

)

4392 template

typename

4395

= (

)((*

& 6u) + (1u << 3));

4397 T

* pcurr =

+ 1;

4403

*pcurr = (

)(curr - 1);

4413 for

(

= 1;

; ++

)

4416 if

(curr ==

+ 1)

4425

*pcurr++ = (

)(curr-1);

4436 unsigned

gap_len = unsigned(pcurr -

);

4437 BM_ASSERT

(gap_len == ((gap_len << 3) >> 3));

4439

= (

)((*

& 7) + (gap_len << 3));

4453 template

typename

4456 unsigned

gap_count = 1;

4460 for

(

unsigned i

= 1;

; ++

)

4463 if

(curr !=

+ 1)

4485 template

typename

4500 unsigned val

[gap_idx] + 1;

4520 const unsigned

maskFF = ~0u;

4527

*dest |= (1u << bitpos);

4532 unsigned

mask_r = maskFF << bitpos;

4533 if

(

unsigned

right_margin = bitpos + bitcount; right_margin < 32)

4535

*dest |= (maskFF >> (32 - right_margin)) & mask_r;

4539

bitcount -= 32 - bitpos;

4541 for

( ;bitcount >= 64; bitcount-=64, dest+=2)

4542

dest[0] = dest[1] = maskFF;

4544

{ *dest++ = maskFF; bitcount -= 32; }

4546

*dest |= (maskFF >> (32 - bitcount));

4567

*dest &= ~(bitcount << bitpos);

4570 const unsigned

maskFF = ~0u;

4573 unsigned

mask_r = maskFF << bitpos;

4574 if

(

unsigned

right_margin = bitpos + bitcount; right_margin < 32)

4576

*dest &= ~((maskFF >> (32 - right_margin)) & mask_r);

4580

bitcount -= 32 - bitpos;

4582 for

( ;bitcount >= 64; bitcount-=64, dest+=2)

4583

dest[0] = dest[1] = 0u;

4586

*dest++ = 0u; bitcount -= 32;

4589

*dest &= ~(maskFF >> (32 - bitcount));

4614

*word ^= unsigned(1 << nbit);

4620 unsigned

right_margin = nbit + bitcount;

4625 if

(right_margin < 32)

4629 unsigned mask

= mask_r & mask_l;

4634

bitcount -= 32 - nbit;

4637 for

( ;bitcount >= 64; bitcount-=64, word+=2)

4639

word[0] ^= ~0u; word[1] ^= ~0u;

4643

*word++ ^= ~0u; bitcount -= 32;

4659 template

typename

4665 const T

* pend = pcurr + (*pcurr >> 3);

4671 for

(pcurr += 2; pcurr <= pend; pcurr += 2)

4690 template

typename

4697 const unsigned len

= (*pcurr >> 3);

4716 unsigned

found_pos =

bm::gap_bfind

(pbuf, start_pos, &is_set);

4719

found_pos += !is_set;

4720

pcurr = pbuf + found_pos;

4722 BM_ASSERT

(pcurr > pend || *pcurr >= start_pos);

4726 for

(; pcurr <= pend; pcurr += 2)

4727 if

(*pcurr >= start_pos)

4735 for

(

T prev

; pcurr <= pend; pcurr += 2)

4739 unsigned

pos = 1u +

;

4758 template

typename

4764 const T

* pend = pcurr + (*pcurr >> 3);

4770 for

(pcurr += 2; pcurr <= pend; pcurr += 2)

4786 template

typename

4792 const T

* pend = pcurr +

;

4803 for

(; pcurr <= pend; )

4806

pos = 1u + pcurr[-1];

4807

bc = *pcurr - pcurr[-1];

4821 template

typename

4825 unsigned len

= (*pcurr >> 3);

4837 template

typename

4843 const T

* pend = pcurr + (*pcurr >> 3);

4853 for

(; pcurr <= pend; )

4856

pos = 1u + pcurr[-1];

4857

bc = *pcurr - pcurr[-1];

4874 template

typename

4882 const unsigned len

= (*pcurr >> 3);

4901 unsigned

found_pos =

bm::gap_bfind

(pbuf, start_pos, &is_set);

4904

found_pos += is_set;

4905

pcurr = pbuf + found_pos;

4907 BM_ASSERT

(pcurr > pend || *pcurr >= start_pos);

4911 for

(; pcurr <= pend; pcurr += 2)

4912 if

(*pcurr >= start_pos)

4921 for

(

T prev

; pcurr <= pend; pcurr += 2)

4925 unsigned

pos = 1u +

;

4945 template

typename

4950 const T

* pend = pcurr + (*pcurr >> 3);

4957 for

(pcurr +=2 ;pcurr <= pend; pcurr += 2)

4973 template

typename

4979 const T

* pend = pcurr + (*pcurr >> 3);

4986 for

(pcurr +=2 ;!

&& pcurr <= pend; pcurr += 2)

5003 template

typename

5009 const T

* pcurr =

;

5010 const T

* pend = pcurr + (*pcurr >> 3);

5022 for

(;pcurr <= pend; pcurr+=2)

5038 template

typename

5044 const T

* pcurr =

;

5045 const T

* pend = pcurr + (*pcurr >> 3);

5059 for

(; !

&& pcurr <= pend; pcurr+=2)

5076 template

typename

5082 const T

* pcurr =

;

5083 const T

* pend = pcurr + (*pcurr >> 3);

5086 unsigned

bitval = *

& 1;

5094 for

(bitval^=1, ++pcurr; pcurr <= pend; bitval^=1, ++pcurr)

5096 T prev

= (

)(*(pcurr-1)+1);

5100

c = (*pcurr -

+ 1) - c;

5114 template

typename

5120 const T

* pcurr =

;

5121 const T

* pend = pcurr + (*pcurr >> 3);

5124 unsigned

bitval = *

& 1;

5130 for

(bitval^=1, ++pcurr; !

&& pcurr <= pend; bitval^=1, ++pcurr)

5132 T prev

= (

)(*(pcurr-1)+1);

5136

c = (*pcurr -

+ 1) - c;

5152 template

typename

5157 const T

* pcurr =

;

5158 const T

* pend = pcurr + (*pcurr >> 3);

5161 unsigned

bitval = *

& 1;

5165 for

(bitval^=1, ++pcurr; pcurr <= pend; bitval^=1, ++pcurr)

5167 T prev

= (

)(*(pcurr-1)+1);

5169

bitval ? (*pcurr -

+ 1)

5184 template

typename

5222 template

typename

5247 template

typename

5252 if

(

[1] == set_max - 1)

5268 template

typename

5271 unsigned

end = *

>> 3;

5273 const T

* pcurr =

;

5274 const T

* pend = pcurr + (*pcurr >> 3);

5282 while

(pcurr <= pend)

5304

*(++

) = (

)(set_max - 1);

5329 if

(to == set_max - 1)

5337 buf

[2] = (

)(set_max - 1);

5338 buf

[0] = (

)((*

& 6u) + (gap_len << 3) +

value

);

5345 if

(to == set_max - 1)

5348 buf

[1] = (

)(from - 1);

5349 buf

[2] = (

)(set_max - 1);

5354 buf

[1] = (

) (from - 1);

5356 buf

[3] = (

)(set_max - 1);

5358 buf

[0] = (

)((*

& 6u) + (gap_len << 3) +

value

);

5375 #pragma GCC diagnostic push 5376 #pragma GCC diagnostic ignored "-Wconversion" 5386 template

typename

5392

= (

)(((level & 3) << 1) | (*

& 1) | (*

& ~7));

5395 #pragma GCC diagnostic pop 5408 template

typename

5411 if

(

unsigned

(glevel_len[0]-4))

return

5412 if

(

unsigned

(glevel_len[1]-4))

return

5413 if

(

unsigned

(glevel_len[2]-4))

return

5414 if

(

unsigned

(glevel_len[3]-4))

return

5429 template

typename

5435 return

capacity -

;

5447 template

typename

5451 const T

* pend1 = buf1 +

;

5458 return

(w1 & diff & -diff) ? 1 : -1;

5459

}

while

(buf1 < pend1);

5478 #ifdef VECT_BIT_FIND_DIFF 5498

*pos = unsigned(idx + (

* 8u *

unsigned

(

sizeof

(

bm::wordop_t

))));

5510

*pos = unsigned(idx + (

* 8u *

sizeof

(

)));

5541 unsigned

bitval = (*block) & 1u;

5544 unsigned

bit_idx = 0;

5548 unsigned val

= *block;

5549 while

== ~0u)

5551 if

(bitval !=

unsigned

(

bool

(

)))

5555 BM_ASSERT

((pcurr-1) == (dest+1) || *(pcurr-1) > *(pcurr-2));

5558

bit_idx += unsigned(

sizeof

(*block) * 8);

5559 if

(++block >= block_end)

5566 unsigned

bits_consumed = 0;

5570 if

(bitval != (

& 1u))

5574 BM_ASSERT

((pcurr-1) == (dest+1) || *(pcurr-1) > *(pcurr-2));

5584

bits_consumed += tz;

5590 if

(bits_consumed < 32u)

5594

bit_idx += 32u - bits_consumed;

5595 BM_ASSERT

((pcurr-1) == (dest+1) || *(pcurr-1) > *(pcurr-2));

5602

}

while

(++block < block_end);

5606 unsigned len

= (unsigned)(pcurr - dest);

5622 #if defined(VECT_BIT_TO_GAP) 5634 template

class

5637 const T

* pcurr =

;

5638 const T

* pend = pcurr + (*pcurr >> 3);

5648 unsigned

to = *pcurr;

5649 for

(

unsigned i

= 0;

<= to; ++

)

5662 while

(pcurr <= pend)

5664 unsigned

from = *(pcurr-1)+1;

5665 unsigned

to = *pcurr;

5668

func(from -

+ first_inc);

5676 for

(

unsigned i

= from+1;

<= to; ++

)

5689 template

typename

5696 const T

* pend = pcurr + (*pcurr >> 3);

5701 int

bitval = (*buf) & 1;

5707 if

(

unsigned

(*pcurr + 1) >= dest_len)

5711 for

(

T i

= 0; ;++

)

5714 if

(

== to)

break

;

5720 while

(pcurr <= pend)

5722 unsigned

pending = *pcurr - *(pcurr-1);

5723 if

(pending >= dest_len)

5725

dest_len -= pending;

5726 T

from = (

)(*(pcurr-1)+1);

5728 for

(

T i

= from; ;++

)

5731 if

(

== to)

break

;

5735 return

(

) (dest_curr - dest);

5757 #if defined(BM_USE_GCC_BUILD) 5758 count

+= unsigned(__builtin_popcountll(x) + __builtin_popcountll(y)

5759

+ __builtin_popcountll(u) + __builtin_popcountll(v));

5771

}

while

(block < block_end);

5782

}

while

(block < block_end);

5821 #ifdef VECT_BIT_COUNT_DIGEST 5844 #if defined(BM_USE_GCC_BUILD) 5845 count

+= unsigned(__builtin_popcountll(x) + __builtin_popcountll(y)

5846

+ __builtin_popcountll(u) + __builtin_popcountll(v));

5871

}

while

(blk < blk_end);

5899 count

-= (w >> ((

sizeof

(w) * 8) - 1));

5912 unsigned

gap_count = 1;

5917 const int

w_shift =

int

(

sizeof

(w) * 8 - 1);

5920

gap_count -= (w_prev = (w0 >> w_shift));

5923 for

(++block; block < block_end; ++block)

5929

gap_count -= !w_prev;

5937

gap_count -= (w0 >> w_shift);

5938

gap_count -= !(w_prev ^ w_l);

5940

w_prev = (w0 >> w_shift);

5954 unsigned

gap_count = 1;

5960 const int

w_shift =

int

(

sizeof

(w) * 8 - 1);

5963

gap_count -= unsigned(w_prev = (w0 >> w_shift));

5966 for

(++block; block < block_end; ++block)

5972

gap_count -= !w_prev;

5980

gap_count -= unsigned(w0 >> w_shift);

5981

gap_count -= !(w_prev ^ w_l);

5982

w_prev = (w0 >> w_shift);

6006 #ifdef VECT_BLOCK_CHANGE_BC 6033 #if defined(VECT_BLOCK_CHANGE) 6056 unsigned

nbit, bitcount, temp;

6061 return

(*word >> nbit) & 1u;

6065 unsigned

right_margin = nbit + right - left;

6066 if

(right_margin < 32)

6070 unsigned mask

= mask_r & mask_l;

6075

temp = *word & mask_r;

6078

bitcount = (right - left + 1u) - (32 - nbit);

6083

bitcount = right - left + 1u;

6090 #if defined(BM64OPT) || defined(BM64_SSE4) || defined(BMAVX2OPT) || defined(BMAVX512OPT) 6092 for

( ;bitcount >= 128; bitcount-=128, word+=4)

6096 if

((w64_0 ^ maskFF64) | (w64_1 ^ maskFF64))

6100 for

( ;bitcount >= 128; bitcount-=128, word+=4)

6102 bm::word_t

m = (word[0] != maskFF) || (word[1] != maskFF) |

6103

(word[2] != maskFF) || (word[3] != maskFF);

6109 for

( ;bitcount >= 32; bitcount-=32, ++word)

6111 if

(*word != maskFF)

6118

temp = *word & mask_l;

6137 template

bool

LWA,

bool

RWA>

6145 unsigned

nword, nbit, bitcount,

, right_margin;

6149 return

(*block >> nbit) & 1u;

6151

bitcount = 1u + (right_margin = (right - left));

6160

right_margin += nbit;

6162 if

(right_margin < 32)

6168

bitcount -= 32 - nbit;

6175 #if defined(BM64_SSE4) || defined(BM64_AVX2) || defined(BM64_AVX512) 6176 for

( ;bitcount >= 128; bitcount-=128)

6185 for

( ;bitcount >= 64; bitcount-=64)

6197 for

( ;bitcount >= 32; bitcount-=32)

6232 unsigned

bitcount = right + 1;

6235 #if defined(BMAVX2OPT) || defined(BMAVX512OPT) 6238

__m256i

= _mm256_setzero_si256();

6241 for

( ;bitcount >= 256; bitcount -= 256)

6243 const

__m256i* src = (__m256i*)block;

6244

__m256i xmm256 = _mm256_load_si256(src);

6246 cnt

= _mm256_add_epi64(

, bc);

6251 count

+= (unsigned)(cnt64[0] + cnt64[1] + cnt64[2] + cnt64[3]);

6254 for

( ;bitcount >= 64; bitcount -= 64)

6286

block[

] = (block[

] << 1) | (block[

+ 1] >> 31);

6300 const unsigned

unroll_factor = 4;

6306

w0 = block[

+ 1] >> 31;

6307

w1 = block[

+ 2] >> 31;

6308

w2 = block[

+ 3] >> 31;

6309

w3 = block[

+ 4] >> 31;

6311

block[0 +

] = (block[0 +

] << 1) | w0;

6312

block[1 +

] = (block[1 +

] << 1) | w1;

6313

block[2 +

] = (block[2 +

] << 1) | w2;

6314

block[3 +

] = (block[3 +

] << 1) | w3;

6316

block[

] = (block[

] << 1) | (block[

+ 1] >> 31);

6317

block[

+ 1] = (block[

+ 1] << 1) | (block[

+ 2] >> 31);

6318

block[

+ 2] = (block[

+ 2] << 1) | (block[

+ 3] >> 31);

6351

block[nword] = w | (unsigned(

value

) << nbit) | wl;

6363

w = (w << 1u) | co_flag;

6394

acc |= w = (w << 1u) | co_flag;

6418 #if defined(BM64OPT) 6430

acc0 |= w = (w << 1u) | co_flag;

6431

b_u->w64[

++] = w;

6436

acc1 |= w = (w << 1u) | co_flag;

6441

*empty_acc =

(acc0 | acc1);

6465 #if defined(VECT_SHIFT_R1) 6495

acc |= w = (w >> 1u) | (co_flag << 31u);

6523

w0 = block[

]; w1 = block[

-1];

6525

acc |= w0 = (w0 >> 1u) | (co_flag << 31u);

6529

acc |= w1 = (w1 >> 1u) | (co_flag << 31u);

6534

w0 = block[

]; w1 = block[

-1];

6536

acc |= w0 = (w0 >> 1u) | (co_flag << 31u);

6540

acc |= w1 = (w1 >> 1u) | (co_flag << 31u);

6565 #if defined(VECT_SHIFT_L1) 6605

w = (w >> 1u) | (co_flag << 31u);

6617

w |= wl | (co_flag << 31u);

6622

block[nword] = (block[nword] >> 1u) | (co_flag << 31u);

6657 for

(; di < 64; ++di)

6670

w = (w << 1u) | co_flag;

6671

acc |= block[

] = w & mask_block[

];

6687

block[d_base] = co_flag & mask_block[d_base];

6719 #if defined(VECT_SHIFT_R1_AND) 6741 unsigned

nbit = left;

6749 return

(*word >> nbit) & 1;

6752 unsigned

bitcount = right - left + 1;

6756 unsigned

right_margin = nbit + (right - left);

6757 if

(right_margin < 32)

6761 unsigned mask

= mask_r & mask_l;

6762 return

*word &

;

6767

acc = *word & mask_r;

6770

bitcount -= 32 - nbit;

6778 for

( ;bitcount >= 128; bitcount-=128, word+=4)

6780

acc = word[0] | word[1] | word[2] | word[3];

6786 for

( ;bitcount >= 32; bitcount -= 32)

6794

acc |= (*word) & mask_l;

6804 template

typename

6814

start[0] = ~start[0];

6815

start[1] = ~start[1];

6816

start[2] = ~start[2];

6817

start[3] = ~start[3];

6819

}

while

(start < end);

6831 #if defined(VECT_IS_ONE_BLOCK) 6839

start[0] & start[1] & start[2] & start[3];

6843

}

while

(start < end);

6884 bool

is_left, is_right, all_one;

6897 if

(is_left ==

false

)

6901 if

(is_right ==

false

)

6934

w &= (1u << bit_pos);

6949

w = (~block[nword]) >> bit_pos;

6954

*pos = unsigned(bit_pos + (nword * 8u *

unsigned

(

sizeof

(

)))-1);

6964

*pos = unsigned(bit_pos + (nword * 8u *

unsigned

(

sizeof

(

)))-1);

7030

w &= (1u << bit_pos);

7046

w = (~block[nword]) & mask_l;

7050

*pos = unsigned(bit_pos + (nword * 8u *

unsigned

(

sizeof

(

)))+1);

7056 for

(--nword;

true

; --nword)

7062

*pos = unsigned(bit_pos + (nword * 8u *

unsigned

(

sizeof

(

)))+1);

7094

w &= (1u << bit_pos);

7097

*pos = unsigned(bit_pos + (nword * 8u *

unsigned

(

sizeof

(

))));

7109

w = block[nword] & mask_l;

7113

*pos = unsigned(bit_pos + (nword * 8u *

unsigned

(

sizeof

(

))));

7119 for

(--nword;

true

; --nword)

7126

unsigned(bit_pos + (nword * 8u *

unsigned

(

sizeof

(

))));

7155 if

(

&& *found_nbit == 0)

7166 if

(

&& *found_nbit == 0)

7194

*found_nbit = nbit_from;

7271

bm::gap_buff_op<bm::gap_word_t, bm::and_func>(

7272

tmp_buf, vect1, 0, vect2, 0, dsize);

7294 return

gap_buff_any_op<bm::gap_word_t, bm::and_func>(vect1, 0, vect2, 0);

7311 return

bm::gap_buff_count_op<bm::gap_word_t, bm::and_func>(vect1, vect2);

7338

bm::gap_buff_op<bm::gap_word_t, bm::xor_func>(

7339

tmp_buf, vect1, 0, vect2, 0, dsize);

7376 return

gap_buff_any_op<bm::gap_word_t, bm::xor_func>(vect1, 0, vect2, 0);

7392 return

bm::gap_buff_count_op<bm::gap_word_t, bm::xor_func>(vect1, vect2);

7419

bm::gap_buff_op<bm::gap_word_t, bm::and_func>(tmp_buf, vect1, 1, vect2, 1, dsize);

7437 return

gap_buff_count_op<bm::gap_word_t, bm::or_func>(vect1, vect2);

7465

bm::gap_buff_op<bm::gap_word_t, bm::and_func>(

7466

tmp_buf, vect1, 0, vect2, 1, dsize);

7490

bm::gap_buff_any_op<bm::gap_word_t, bm::and_func>(

7491

vect1, 0, vect2, 1);

7508 return

bm::gap_buff_count_op<bm::gap_word_t, bm::sub_func>(vect1, vect2);

7546 #ifdef VECT_COPY_BLOCK_UNALIGN 7567 #ifdef VECT_STREAM_BLOCK 7585 #ifdef VECT_STREAM_BLOCK_UNALIGN 7620 for

(

unsigned i

= 0;

< arr_sz;

+=4)

7622

acc |= (dst_u->w64[

] &= src_u->w64[

]) |

7623

(dst_u->w64[

+1] &= src_u->w64[

+1]) |

7624

(dst_u->w64[

+2] &= src_u->w64[

+2]) |

7625

(dst_u->w64[

+3] &= src_u->w64[

+3]);

7661 #if defined(VECT_AND_DIGEST) 7664

digest &= ~(

<< wave);

7673

acc |= dst_u->w64[j+0] &= src_u->w64[j+0];

7674

acc |= dst_u->w64[j+1] &= src_u->w64[j+1];

7675

acc |= dst_u->w64[j+2] &= src_u->w64[j+2];

7676

acc |= dst_u->w64[j+3] &= src_u->w64[j+3];

7681

digest &= ~(

<< wave);

7705 BM_ASSERT

(src0 && src1 && src2 && src3);

7716 #if defined(VECT_AND_DIGEST_5WAY) 7717 bool

all_zero =

VECT_AND_DIGEST_5WAY

(&dst[off], &src0[off], &src1[off], &src2[off], &src3[off]);

7719

digest &= ~(

<< wave);

7731

acc |= dst_u->w64[j + 0] &= src_u0->w64[j + 0] & src_u1->w64[j + 0] & src_u2->w64[j + 0] & src_u3->w64[j + 0];

7732

acc |= dst_u->w64[j + 1] &= src_u0->w64[j + 1] & src_u1->w64[j + 1] & src_u2->w64[j + 1] & src_u3->w64[j + 1];

7733

acc |= dst_u->w64[j + 2] &= src_u0->w64[j + 2] & src_u1->w64[j + 2] & src_u2->w64[j + 2] & src_u3->w64[j + 2];

7734

acc |= dst_u->w64[j + 3] &= src_u0->w64[j + 3] & src_u1->w64[j + 3] & src_u2->w64[j + 3] & src_u3->w64[j + 3];

7738

digest &= ~(

<< wave);

7778 #if defined(VECT_AND_DIGEST_3WAY) 7781

digest &= ~(

<< wave);

7792

acc |= dst_u->w64[j] &= src_u1->w64[j] & src_u2->w64[j];

7793

acc |= dst_u->w64[j+1] &= src_u1->w64[j+1] & src_u2->w64[j+1];

7794

acc |= dst_u->w64[j+2] &= src_u1->w64[j+2] & src_u2->w64[j+2];

7795

acc |= dst_u->w64[j+3] &= src_u1->w64[j+3] & src_u2->w64[j+3];

7800

digest &= ~(

<< wave);

7843 #if defined(VECT_AND_DIGEST_2WAY) 7846

digest &= ~(

<< wave);

7857

acc |= dst_u->w64[j] = src_u1->w64[j] & src_u2->w64[j];

7858

acc |= dst_u->w64[j+1] = src_u1->w64[j+1] & src_u2->w64[j+1];

7859

acc |= dst_u->w64[j+2] = src_u1->w64[j+2] & src_u2->w64[j+2];

7860

acc |= dst_u->w64[j+3] = src_u1->w64[j+3] & src_u2->w64[j+3];

7865

digest &= ~(

<< wave);

7895 for

(

unsigned i

= 0;

< 64; ++

)

7900 #if defined(VECT_AND_DIGEST_2WAY) 7915

acc |= dst_u->w64[j] = src_u1->w64[j] & src_u2->w64[j];

7916

acc |= dst_u->w64[j+1] = src_u1->w64[j+1] & src_u2->w64[j+1];

7917

acc |= dst_u->w64[j+2] = src_u1->w64[j+2] & src_u2->w64[j+2];

7918

acc |= dst_u->w64[j+3] = src_u1->w64[j+3] & src_u2->w64[j+3];

7929 #if defined(VECT_BLOCK_SET_DIGEST) 7934

dst[off] = dst[off+1] = dst[off+2] = dst[off+3] = 0u;

7976 #if defined(VECT_AND_OR_DIGEST_2WAY) 7980

digest &= ~(

<< wave);

7993

acc |= dst_u->w64[j+0] |= src_u1->w64[j+0] & src_u2->w64[j+0];

7994

acc |= dst_u->w64[j+1] |= src_u1->w64[j+1] & src_u2->w64[j+1];

7995

acc |= dst_u->w64[j+2] |= src_u1->w64[j+2] & src_u2->w64[j+2];

7996

acc |= dst_u->w64[j+3] |= src_u1->w64[j+3] & src_u2->w64[j+3];

8001

digest &= ~(

<< wave);

8042

}

while

(b1 < b1_end);

8052

}

while

(src1 < src1_end);

8076 count

= (src1[0] & src2[0]) |

8077

(src1[1] & src2[1]) |

8078

(src1[2] & src2[2]) |

8079

(src1[3] & src2[3]);

8081

}

while

((src1 < src1_end) && !

);

8119

}

while

(b1 < b1_end);

8129

}

while

(src1 < src1_end);

8153 count

= (src1[0] ^ src2[0]) |

8154

(src1[1] ^ src2[1]) |

8155

(src1[2] ^ src2[2]) |

8156

(src1[3] ^ src2[3]);

8158

}

while

&& (src1 < src1_end));

8192

}

while

(b1 < b1_end);

8202

}

while

(src1 < src1_end);

8226 count

= (src1[0] & ~src2[0]) |

8227

(src1[1] & ~src2[1]) |

8228

(src1[2] & ~src2[2]) |

8229

(src1[3] & ~src2[3]);

8231

}

while

((src1 < src1_end) && (

== 0));

8267

}

while

(b1 < b1_end);

8277

}

while

(src1 < src1_end);

8300 count

= (src1[0] | src2[0]) |

8301

(src1[1] | src2[1]) |

8302

(src1[2] | src2[2]) |

8303

(src1[3] | src2[3]);

8306

}

while

&& (src1 < src1_end));

8598

acc &= (dst_ptr[0] |= wrd_ptr[0]);

8599

acc &= (dst_ptr[1] |= wrd_ptr[1]);

8600

acc &= (dst_ptr[2] |= wrd_ptr[2]);

8601

acc &= (dst_ptr[3] |= wrd_ptr[3]);

8603

dst_ptr+=4;wrd_ptr+=4;

8605

}

while

(wrd_ptr < wrd_end);

8606 return

acc == not_acc;

8636

acc &= (dst_ptr[0] = wrd_ptr1[0] | wrd_ptr2[0]);

8637

acc &= (dst_ptr[1] = wrd_ptr1[1] | wrd_ptr2[1]);

8638

acc &= (dst_ptr[2] = wrd_ptr1[2] | wrd_ptr2[2]);

8639

acc &= (dst_ptr[3] = wrd_ptr1[3] | wrd_ptr2[3]);

8641

dst_ptr+=4; wrd_ptr1+=4; wrd_ptr2+=4;

8643

}

while

(wrd_ptr1 < wrd_end1);

8644 return

acc == not_acc;

8674

acc |= (dst_ptr[0] = wrd_ptr1[0] ^ wrd_ptr2[0]);

8675

acc |= (dst_ptr[1] = wrd_ptr1[1] ^ wrd_ptr2[1]);

8676

acc |= (dst_ptr[2] = wrd_ptr1[2] ^ wrd_ptr2[2]);

8677

acc |= (dst_ptr[3] = wrd_ptr1[3] ^ wrd_ptr2[3]);

8679

dst_ptr+=4; wrd_ptr1+=4; wrd_ptr2+=4;

8681

}

while

(wrd_ptr1 < wrd_end1);

8716

acc &= (dst_ptr[0] |= wrd_ptr1[0] | wrd_ptr2[0]);

8717

acc &= (dst_ptr[1] |= wrd_ptr1[1] | wrd_ptr2[1]);

8718

acc &= (dst_ptr[2] |= wrd_ptr1[2] | wrd_ptr2[2]);

8719

acc &= (dst_ptr[3] |= wrd_ptr1[3] | wrd_ptr2[3]);

8721

dst_ptr+=4; wrd_ptr1+=4;wrd_ptr2+=4;

8723

}

while

(wrd_ptr1 < wrd_end1);

8724 return

acc == not_acc;

8764

acc &= (dst_ptr[0] |= wrd_ptr1[0] | wrd_ptr2[0] | wrd_ptr3[0] | wrd_ptr4[0]);

8765

acc &= (dst_ptr[1] |= wrd_ptr1[1] | wrd_ptr2[1] | wrd_ptr3[1] | wrd_ptr4[1]);

8766

acc &= (dst_ptr[2] |= wrd_ptr1[2] | wrd_ptr2[2] | wrd_ptr3[2] | wrd_ptr4[2]);

8767

acc &= (dst_ptr[3] |= wrd_ptr1[3] | wrd_ptr2[3] | wrd_ptr3[3] | wrd_ptr4[3]);

8770

wrd_ptr1+=4;wrd_ptr2+=4;wrd_ptr3+=4;wrd_ptr4+=4;

8772

}

while

(wrd_ptr1 < wrd_end1);

8773 return

acc == not_acc;

8866 for

(

unsigned i

= 0;

< arr_sz;

+=4)

8868

acc |= (dst_u->w64[

] &= ~src_u->w64[

]) |

8869

(dst_u->w64[

+1] &= ~src_u->w64[

+1]) |

8870

(dst_u->w64[

+2] &= ~src_u->w64[

+2]) |

8871

(dst_u->w64[

+3] &= ~src_u->w64[

+3]);

8908 #if defined(VECT_SUB_DIGEST) 8911

digest &= ~(

<< wave);

8920

acc |= dst_u->w64[j+0] &= ~src_u->w64[j+0];

8921

acc |= dst_u->w64[j+1] &= ~src_u->w64[j+1];

8922

acc |= dst_u->w64[j+2] &= ~src_u->w64[j+2];

8923

acc |= dst_u->w64[j+3] &= ~src_u->w64[j+3];

8928

digest &= ~(

<< wave);

8969 #if defined(VECT_SUB_DIGEST_2WAY) 8972

digest &= ~(

<< wave);

8985

acc |= dst_u->w64[j+0] = src_u1->w64[j+0] & ~src_u2->w64[j+0];

8986

acc |= dst_u->w64[j+1] = src_u1->w64[j+1] & ~src_u2->w64[j+1];

8987

acc |= dst_u->w64[j+2] = src_u1->w64[j+2] & ~src_u2->w64[j+2];

8988

acc |= dst_u->w64[j+3] = src_u1->w64[j+3] & ~src_u2->w64[j+3];

8993

digest &= ~(

<< wave);

9015 BM_ASSERT

(src0 && src1 && src2 && src3);

9027 #if defined(VECT_SUB_DIGEST_5WAY) 9028 bool

all_zero =

VECT_SUB_DIGEST_5WAY

(&dst[off], &src0[off], &src1[off], &src2[off], &src3[off]);

9030

digest &= ~(

<< wave);

9042

acc |= dst_u->w64[j + 0] &= ~src_u0->w64[j + 0] & ~src_u1->w64[j + 0] & ~src_u2->w64[j + 0] & ~src_u3->w64[j + 0];

9043

acc |= dst_u->w64[j + 1] &= ~src_u0->w64[j + 1] & ~src_u1->w64[j + 1] & ~src_u2->w64[j + 1] & ~src_u3->w64[j + 1];

9044

acc |= dst_u->w64[j + 2] &= ~src_u0->w64[j + 2] & ~src_u1->w64[j + 2] & ~src_u2->w64[j + 2] & ~src_u3->w64[j + 2];

9045

acc |= dst_u->w64[j + 3] &= ~src_u0->w64[j + 3] & ~src_u1->w64[j + 3] & ~src_u2->w64[j + 3] & ~src_u3->w64[j + 3];

9050

digest &= ~(

<< wave);

9082 #if defined(VECT_SUB_DIGEST_3WAY) 9085

digest &= ~(

<< wave);

9095

acc |= dst_u->w64[j + 0] &= ~src_u0->w64[j + 0] & ~src_u1->w64[j + 0];

9096

acc |= dst_u->w64[j + 1] &= ~src_u0->w64[j + 1] & ~src_u1->w64[j + 1];

9097

acc |= dst_u->w64[j + 2] &= ~src_u0->w64[j + 2] & ~src_u1->w64[j + 2];

9098

acc |= dst_u->w64[j + 3] &= ~src_u0->w64[j + 3] & ~src_u1->w64[j + 3];

9103

digest &= ~(

<< wave);

9198 for

(

unsigned i

= 0;

< arr_sz;

+=4)

9200

acc |= dst_u->w64[

] ^= src_u->w64[

];

9201

acc |= dst_u->w64[

+1] ^= src_u->w64[

+1];

9202

acc |= dst_u->w64[

+2] ^= src_u->w64[

+2];

9203

acc |= dst_u->w64[

+3] ^= src_u->w64[

+3];

9235

dst_ptr+=4; wrd_ptr+=4;

9236

}

while

(wrd_ptr < wrd_end);

9257 if

(src == dst)

return

9263 if

(!src)

return

dst;

9269 if

(!src)

return

dst;

9353 const T

* blk_end = blk + data_size - 2;

9358 const T

* blk_j = blk + 1;

9359 for

(; blk_j < blk_end; ++blk_j)

9369 const T

* blk_j = blk + 1;

9370 for

( ; blk_j < blk_end; ++blk_j)

9374 if

(blk_j[1] | blk_j[2])

9384 count

+= unsigned(blk_j - blk) * unsigned(

sizeof

(

));

9389 while

(blk < blk_end);

9390 return count

+ unsigned(2 *

sizeof

(

));

9415

w &= (1u << bit_pos);

9421

w = block[nword] >> bit_pos;

9426

*pos = unsigned(bit_pos + (nword * 8u *

unsigned

(

sizeof

(

))));

9436

*pos = unsigned(bit_pos + (

* 8u *

unsigned

(

sizeof

(

))));

9470

last

= unsigned(idx + (

* 8u *

unsigned

(

sizeof

(

))));

9496 #ifdef VECT_BIT_FIND_FIRST 9505

*pos = unsigned(idx + (

* 8u *

unsigned

(

sizeof

(

))));

9537 #ifdef VECT_BIT_FIND_FIRST 9545 unsigned

base =

* 8u * unsigned(

sizeof

(

));

9555

w64 = block[

] | block[

+1];

9558 unsigned

base =

* 8u * unsigned(

sizeof

(

));

9598 #if defined(BMSSE42OPT) || defined(BMAVX2OPT) || defined(BMAVX512OPT) 9604 const unsigned cnt

+ 4;

9613 for

(++

;

; ++

)

9620

}

while

(++

);

9633 if

(

auto

w = block[

])

9663 template

typename

SIZE_TYPE>

9675 unsigned

pos = nbit_from;

9685

rank -= bc; pos += unsigned(32u - nbit);

9691

nbit_pos = pos + idx;

9696 #if defined(BM64OPT) || defined(BM64_SSE4) || defined(BMAVX2OPT) || defined(BMAVX512OPT) 9706

nbit_pos = pos + idx;

9721

rank -= bc; pos += 32u;

9725

nbit_pos = pos + idx;

9744 template

typename

SIZE_TYPE>

9770 unsigned

total_possible_bitcount,

9778 if

((gap_size < block_size) && (gap_size < arr_size) && (gap_size < inv_arr_size))

9783 if

(arr_size < inv_arr_size)

9785 if

((arr_size < block_size) && (arr_size < gap_size))

9792 if

((inv_arr_size < block_size) && (inv_arr_size < gap_size))

9811 template

typename

9816 const bm::id64_t

imask64 = inverted ? ~0ull : 0;

9819

src+=2, bit_idx += unsigned(

sizeof

(*src) * 8 * 2))

9830 return

(

unsigned

)(pcurr - dest);

9834 template

typename

9838 for

(

unsigned i

= 1;

< sz; ++

)

9841 unsigned

d =

[

] -

[

-1];

9855 template

typename

9864 unsigned

bitpos = 0;

9865 unsigned

w = block[nword];

9872 b

= (~w) & (1 << 1);

9875

arr_ex0[ex0_cnt] = 0; ++ex0_cnt;

9880 for

(;

<= 65534; ++

)

9885 b

= w & (1 << bitpos);

9893 bool

b_prev = w & (1 << bitpos);

9900 bool

b_next = w & (1 << bitpos);

9909

w &= ~(1 << bitpos);

9911

arr_ex0[ex0_cnt] = (

)

; ++ex0_cnt;

9925

arr_ex0[ex0_cnt] = 0; ++ex0_cnt;

9931 for

(;

<= 65534; ++

)

9936 b

= w & (1 << bitpos);

9944 bool

b_prev = w & (1 << bitpos);

9951 bool

b_next = w & (1 << bitpos);

9962

arr_ex0[ex0_cnt] = (

)

; ++ex0_cnt;

9975 template

typename

9981 for

(

unsigned

k = 0; k < ex0_cnt; ++k)

10007 template

typename

10016 const bm::id64_t

imask64 = inverted ? ~0ull : 0;

10024

src+=2, bit_idx += unsigned(

sizeof

(*src) * 8 * 2))

10032 if

(idx !=

+1)

10036

*pcurr_r++ =

(

- rl);

10040

*pcurr_s++ =

(idx);

10044 if

(!rl && (pcurr_s != dst_s))

10055

*pcurr_r++ =

(

- rl);

10059

s_cnt = (unsigned)(pcurr_s - dst_s);

10060

r_cnt = (unsigned)(pcurr_r - dst_r);

10068 template

typename

10076 for

(

unsigned i

= 0;

< s_cnt; ++

)

10080 for

(

unsigned i

= 0;

< r_cnt; ++

)

10098 if

(!blk)

return true

;

10122 if

(blk == 0)

return false

;

10142 template

typename

10144 const T

* length_end,

10147 BM_ASSERT

(length && length_end && glevel_len);

10149 unsigned

overhead = 0;

10150 for

(;length < length_end; ++length)

10152 unsigned len

= *length;

10155 unsigned

capacity = glevel_len[level];

10157

overhead += capacity -

;

10169 template

typename

10171 const T

* length_end,

10174 BM_ASSERT

(length && length_end && glevel_len);

10176 size_t

lsize = size_t(length_end - length);

10182 for

(

= 0;

< lsize; ++

)

10184 if

(length[

] > max_len)

10185

max_len = length[

];

10189

glevel_len[0] =

(max_len + 4);

10199 unsigned

min_overhead =

gap_overhead

(length, length_end, glevel_len);

10200 bool

is_improved =

false

;

10208 bool

imp_flag =

false

;

10210 for

(j = 0; j < lsize; ++j)

10212

glevel_len[

] =

(length[j] + 4);

10213 unsigned

ov =

gap_overhead

(length, length_end, glevel_len);

10214 if

(ov <= min_overhead)

10224

is_improved =

true

;

10228

glevel_len[

] = gap_saved_value;

10236 T val

= *glevel_len;

10237 T

* gp = glevel_len;

10238 T

* res = glevel_len;

10255 return

is_improved;

10275 if

(!blk || !arg_blk)

10307 if

(arg_gap != gap)

10418 if

(cnt_ < from_ || cnt_ >

to_

)

10420

cnt_

;

return

10438 template

class

It1,

class

It2,

class

BinaryOp,

class

Encoder>

10444 for

(

unsigned i

= 0;

< block_size; ++

)

10449

enc.push_back( w );

10583

&gap_and_to_bitset<bm::gap_word_t>,

10584

&gap_add_to_bitset<bm::gap_word_t>,

10585

&gap_sub_to_bitset<bm::gap_word_t>,

10586

&gap_xor_to_bitset<bm::gap_word_t>,

10641

w0 = w_ptr[0]; w1 = w_ptr[1];

10643 #if defined(BMAVX512OPT) || defined(BMAVX2OPT) || defined(BM64OPT) || defined(BM64_SSE4) 10648

w0 = w_ptr[2]; w1 = w_ptr[3];

10652 #if (defined(__arm__) || defined(__aarch64__)) 10656

w0 = w_ptr[2]; w1 = w_ptr[3];

10658

cnt0 +=

bm::bitscan_bsf

(w1, bits + cnt0, (

unsigned short

)(64+32));

10664

w0 = w_ptr[2]; w1 = w_ptr[3];

10669 return static_cast<unsigned short>

(cnt0);

10672 #if defined (BM64_SSE4) || defined(BM64_AVX2) || defined(BM64_AVX512) 10682 unsigned size

unsigned

start,

10685 typedef unsigned

TRGW;

10686 typedef unsigned IDX

;

10687 #if defined(BM64_SSE4) 10690 if

constexpr (

sizeof

(TRGW)==4 &&

sizeof

(

IDX

)==4)

10695 #elif defined(BM64_AVX2) || defined(BM64_AVX512) 10696 if

constexpr (

sizeof

(TRGW)==4 &&

sizeof

(

IDX

)==4)

10712 template

typename

TRGW,

typename

IDX,

typename

SZ>

10721 const

= (

- start);

10722 const

SZ len_unr =

- (

% 2);

10724 for

(; k < len_unr; k+=2)

10726 const

SZ base = start + k;

10734 for

(; k <

; ++k)

10762 for

(;(start <

) &&

10787 #if defined(VECT_ARR_BLOCK_LOOKUP) 10790 for

(;(start <

) &&

10825

block[nword] |= (1u << nbit);

10849 #if defined(VECT_SET_BLOCK_BITS) 10854 unsigned n

= idx[start++];

10858

block[nword] |= (1u << nbit);

10859

}

while

(start < stop);

10873 unsigned

& left,

unsigned

& right)

BMNOEXCEPT 10911 #if defined(VECT_LOWER_BOUND_SCAN_U32) 10914 for

(; from <= to; ++from)

10916 if

(

[from] >= target)

10929 unsigned long long

target,

10936 for

(; from <= to; ++from)

10938 if

(

[from] >= target)

10958 const unsigned

linear_cutoff = 32;

10960 unsigned l

= from;

unsigned r

= to;

10961 unsigned

dist =

;

10962 if

(dist < linear_cutoff)

10969 unsigned

mid = (

)/2+

;

10970 if

(

[mid] < target)

10975 if

(dist < linear_cutoff)

10989 unsigned long long

target,

10994 const unsigned

linear_cutoff = 32;

10996 unsigned l

= from;

unsigned r

= to;

10997 unsigned

dist =

;

10998 if

(dist < linear_cutoff)

11005 unsigned

mid = (

) / 2 +

;

11006 if

(

[mid] < target)

11011 if

(dist < linear_cutoff)

11025 bool find_ptr

(

const void

const

* p_arr,

size_t

arr_size,

11029 for

(

size_t i

= 0;

< arr_size; ++

)

11030 if

(ptr == p_arr[

])

11032

*idx =

;

return true

;

11050 return

block_idx + base_idx;

11059 return

block_idx + base_idx;

11073 unsigned

md =

[1] -

[0];

11074 for

(

size_t i

= 1;

< arr_size; ++

)

11077 unsigned

curr =

[

];

11102 for

(

size_t i

= 1;

< arr_size; ++

)

11113 template

typename

VT,

typename

SZ>

11116 bool

found =

false

;

11118 for

(SZ

= 0;

< arr_size; ++

)

11123

max_v = v; *found_idx =

;

11134 template

typename

VT,

typename

SZ>

11137 for

(SZ

= 0;

< arr_size; ++

)

11153 template

typename

VT,

typename

SZ>

11157 for

(SZ

= 0;

< arr_size; ++

)

11194 float

bie_bits_per_int,

11202 if

(bc == max_bits)

11208 unsigned

ibc = max_bits - bc;

11214 float

cost_in_bits = float(gc) * bie_bits_per_int;

11215 if

(cost_in_bits >=

float

(max_bits))

11225 float

cost_in_bits = float(bc) * bie_bits_per_int;

11226 if

(cost_in_bits >=

float

(max_bits))

11231

*best_metric = ibc;

11232 float

cost_in_bits = float(ibc) * bie_bits_per_int;

11233 if

(cost_in_bits >=

float

(max_bits))

11239 template

typename

11242 unsigned

& win_size,

float

& best_save)

11244 bool

use_wdr =

false

;

11247 for

(

unsigned

w_size = 20; w_size <= 78; w_size += 2)

11258 unsigned

total_windows = (sz + w_size - 1) / w_size;

11259 float

bits_extra = float(total_windows + 1 + 8 + 8);

11260 float

save_per_window = 0.15f * w_size;

11261 float

total_save = save_per_window * wcnt;

11262

total_save -= bits_extra;

11263 if

(total_save > 0.0f)

11267

use_wdr =

true

; win_size = w_size; best_save = total_save;

11270 if

(total_save >= best_save)

11272

win_size = w_size; best_save = total_save;

11300 template

typename

11303 T

temp = *

; *

= *

; *

= temp;

11309 template

typename

11322 while

(

[j] >

[pivot])

11353 unsigned

arr_idx = idx >> 1;

11356 unsigned char

old_val =

[arr_idx];

11358 arr

[arr_idx] = (

unsigned

char)(old_val | (v << 4));

11362 unsigned char

old_val =

[arr_idx];

11364 arr

[arr_idx] = (

unsigned

char)(old_val | (v & 0xF));

11380 unsigned char

v =