diff options
Diffstat (limited to 'subversion/libsvn_subr/bit_array.c')
-rw-r--r-- | subversion/libsvn_subr/bit_array.c | 194 |
1 files changed, 194 insertions, 0 deletions
diff --git a/subversion/libsvn_subr/bit_array.c b/subversion/libsvn_subr/bit_array.c new file mode 100644 index 000000000000..c239d1c9dde7 --- /dev/null +++ b/subversion/libsvn_subr/bit_array.c @@ -0,0 +1,194 @@ +/* + * bit_array.c : implement a simple packed bit array + * + * ==================================================================== + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + * ==================================================================== + */ + + +#include "svn_sorts.h" +#include "private/svn_subr_private.h" + +/* We allocate our data buffer in blocks of this size (in bytes). + * For performance reasons, this shall be a power of two. + * It should also not exceed 80kB (to prevent APR pool fragmentation) and + * not be too small (to keep the number of OS-side memory allocations low - + * avoiding hitting system-specific limits). + */ +#define BLOCK_SIZE 0x10000 + +/* Number of bits in each block. + */ +#define BLOCK_SIZE_BITS (8 * BLOCK_SIZE) + +/* Initial array size (covers INITIAL_BLOCK_COUNT * BLOCK_SIZE_BITS bits). + * For performance reasons, this shall be a power of two. + */ +#define INITIAL_BLOCK_COUNT 16 + +/* We store the bits in a lazily allocated two-dimensional array. + * For every BLOCK_SIZE_BITS range of indexes, there is one entry in the + * BLOCKS array. If index / BLOCK_SIZE_BITS exceeds BLOCK_COUNT-1, the + * blocks are implicitly empty. Only if a bit will be set to 1, will the + * BLOCKS array be auto-expanded. + * + * As long as no bit got set in a particular block, the respective entry in + * BLOCKS entry will be NULL, implying that all block contents is 0. + */ +struct svn_bit_array__t +{ + /* Data buffer of BLOCK_COUNT blocks, BLOCK_SIZE_BITS each. Never NULL. + * Every block may be NULL, though. */ + unsigned char **blocks; + + /* Number of bytes allocated to DATA. Never shrinks. */ + apr_size_t block_count; + + /* Reallocate DATA form this POOL when growing. */ + apr_pool_t *pool; +}; + +/* Given that MAX shall be an actual bit index in a packed bit array, + * return the number of blocks entries to allocate for the data buffer. */ +static apr_size_t +select_data_size(apr_size_t max) +{ + /* We allocate a power of two of bytes but at least 16 blocks. */ + apr_size_t size = INITIAL_BLOCK_COUNT; + + /* Caution: + * MAX / BLOCK_SIZE_BITS == SIZE still means that MAX is out of bounds. + * OTOH, 2 * (MAX/BLOCK_SIZE_BITS) is always within the value range of + * APR_SIZE_T. */ + while (size <= max / BLOCK_SIZE_BITS) + size *= 2; + + return size; +} + +svn_bit_array__t * +svn_bit_array__create(apr_size_t max, + apr_pool_t *pool) +{ + svn_bit_array__t *array = apr_pcalloc(pool, sizeof(*array)); + + array->block_count = select_data_size(max); + array->pool = pool; + array->blocks = apr_pcalloc(pool, + array->block_count * sizeof(*array->blocks)); + + return array; +} + +void +svn_bit_array__set(svn_bit_array__t *array, + apr_size_t idx, + svn_boolean_t value) +{ + unsigned char *block; + + /* Index within ARRAY->BLOCKS for the block containing bit IDX. */ + apr_size_t block_idx = idx / BLOCK_SIZE_BITS; + + /* Within that block, index of the byte containing IDX. */ + apr_size_t byte_idx = (idx % BLOCK_SIZE_BITS) / 8; + + /* Within that byte, index of the bit corresponding to IDX. */ + apr_size_t bit_idx = (idx % BLOCK_SIZE_BITS) % 8; + + /* If IDX is outside the allocated range, we _may_ have to grow it. + * + * Be sure to use division instead of multiplication as we need to cover + * the full value range of APR_SIZE_T for the bit indexes. + */ + if (block_idx >= array->block_count) + { + apr_size_t new_count; + unsigned char **new_blocks; + + /* Unallocated indexes are implicitly 0, so no actual allocation + * required in that case. + */ + if (!value) + return; + + /* Grow block list to cover IDX. + * Clear the new entries to guarantee our array[idx]==0 default. + */ + new_count = select_data_size(idx); + new_blocks = apr_pcalloc(array->pool, new_count * sizeof(*new_blocks)); + memcpy(new_blocks, array->blocks, + array->block_count * sizeof(*new_blocks)); + array->blocks = new_blocks; + array->block_count = new_count; + } + + /* IDX is covered by ARRAY->BLOCKS now. */ + + /* Get the block that contains IDX. Auto-allocate it if missing. */ + block = array->blocks[block_idx]; + if (block == NULL) + { + /* Unallocated indexes are implicitly 0, so no actual allocation + * required in that case. + */ + if (!value) + return; + + /* Allocate the previously missing block and clear it for our + * array[idx] == 0 default. */ + block = apr_pcalloc(array->pool, BLOCK_SIZE); + array->blocks[block_idx] = block; + } + + /* Set / reset one bit. Be sure to use unsigned shifts. */ + if (value) + block[byte_idx] |= (unsigned char)(1u << bit_idx); + else + block[byte_idx] &= ~(unsigned char)(1u << bit_idx); +} + +svn_boolean_t +svn_bit_array__get(svn_bit_array__t *array, + apr_size_t idx) +{ + unsigned char *block; + + /* Index within ARRAY->BLOCKS for the block containing bit IDX. */ + apr_size_t block_idx = idx / BLOCK_SIZE_BITS; + + /* Within that block, index of the byte containing IDX. */ + apr_size_t byte_idx = (idx % BLOCK_SIZE_BITS) / 8; + + /* Within that byte, index of the bit corresponding to IDX. */ + apr_size_t bit_idx = (idx % BLOCK_SIZE_BITS) % 8; + + /* Indexes outside the allocated range are implicitly 0. */ + if (block_idx >= array->block_count) + return 0; + + /* Same if the respective block has not been allocated. */ + block = array->blocks[block_idx]; + if (block == NULL) + return 0; + + /* Extract one bit (get the byte, shift bit to LSB, extract it). */ + return (block[byte_idx] >> bit_idx) & 1; +} + |