| 1 | #include <stdio.h> | 
|---|
| 2 |  | 
|---|
| 3 | #include <roaring/bitset_util.h> | 
|---|
| 4 | #include <roaring/containers/containers.h> | 
|---|
| 5 | #include <roaring/containers/convert.h> | 
|---|
| 6 | #include <roaring/containers/perfparameters.h> | 
|---|
| 7 |  | 
|---|
| 8 | // file contains grubby stuff that must know impl. details of all container | 
|---|
| 9 | // types. | 
|---|
| 10 | bitset_container_t *bitset_container_from_array(const array_container_t *a) { | 
|---|
| 11 | bitset_container_t *ans = bitset_container_create(); | 
|---|
| 12 | int limit = array_container_cardinality(a); | 
|---|
| 13 | for (int i = 0; i < limit; ++i) bitset_container_set(ans, a->array[i]); | 
|---|
| 14 | return ans; | 
|---|
| 15 | } | 
|---|
| 16 |  | 
|---|
| 17 | bitset_container_t *bitset_container_from_run(const run_container_t *arr) { | 
|---|
| 18 | int card = run_container_cardinality(arr); | 
|---|
| 19 | bitset_container_t *answer = bitset_container_create(); | 
|---|
| 20 | for (int rlepos = 0; rlepos < arr->n_runs; ++rlepos) { | 
|---|
| 21 | rle16_t vl = arr->runs[rlepos]; | 
|---|
| 22 | bitset_set_lenrange(answer->array, vl.value, vl.length); | 
|---|
| 23 | } | 
|---|
| 24 | answer->cardinality = card; | 
|---|
| 25 | return answer; | 
|---|
| 26 | } | 
|---|
| 27 |  | 
|---|
| 28 | array_container_t *array_container_from_run(const run_container_t *arr) { | 
|---|
| 29 | array_container_t *answer = | 
|---|
| 30 | array_container_create_given_capacity(run_container_cardinality(arr)); | 
|---|
| 31 | answer->cardinality = 0; | 
|---|
| 32 | for (int rlepos = 0; rlepos < arr->n_runs; ++rlepos) { | 
|---|
| 33 | int run_start = arr->runs[rlepos].value; | 
|---|
| 34 | int run_end = run_start + arr->runs[rlepos].length; | 
|---|
| 35 |  | 
|---|
| 36 | for (int run_value = run_start; run_value <= run_end; ++run_value) { | 
|---|
| 37 | answer->array[answer->cardinality++] = (uint16_t)run_value; | 
|---|
| 38 | } | 
|---|
| 39 | } | 
|---|
| 40 | return answer; | 
|---|
| 41 | } | 
|---|
| 42 |  | 
|---|
| 43 | array_container_t *array_container_from_bitset(const bitset_container_t *bits) { | 
|---|
| 44 | array_container_t *result = | 
|---|
| 45 | array_container_create_given_capacity(bits->cardinality); | 
|---|
| 46 | result->cardinality = bits->cardinality; | 
|---|
| 47 | //  sse version ends up being slower here | 
|---|
| 48 | // (bitset_extract_setbits_sse_uint16) | 
|---|
| 49 | // because of the sparsity of the data | 
|---|
| 50 | bitset_extract_setbits_uint16(bits->array, BITSET_CONTAINER_SIZE_IN_WORDS, | 
|---|
| 51 | result->array, 0); | 
|---|
| 52 | return result; | 
|---|
| 53 | } | 
|---|
| 54 |  | 
|---|
| 55 | /* assumes that container has adequate space.  Run from [s,e] (inclusive) */ | 
|---|
| 56 | static void add_run(run_container_t *r, int s, int e) { | 
|---|
| 57 | r->runs[r->n_runs].value = s; | 
|---|
| 58 | r->runs[r->n_runs].length = e - s; | 
|---|
| 59 | r->n_runs++; | 
|---|
| 60 | } | 
|---|
| 61 |  | 
|---|
| 62 | run_container_t *run_container_from_array(const array_container_t *c) { | 
|---|
| 63 | int32_t n_runs = array_container_number_of_runs(c); | 
|---|
| 64 | run_container_t *answer = run_container_create_given_capacity(n_runs); | 
|---|
| 65 | int prev = -2; | 
|---|
| 66 | int run_start = -1; | 
|---|
| 67 | int32_t card = c->cardinality; | 
|---|
| 68 | if (card == 0) return answer; | 
|---|
| 69 | for (int i = 0; i < card; ++i) { | 
|---|
| 70 | const uint16_t cur_val = c->array[i]; | 
|---|
| 71 | if (cur_val != prev + 1) { | 
|---|
| 72 | // new run starts; flush old one, if any | 
|---|
| 73 | if (run_start != -1) add_run(answer, run_start, prev); | 
|---|
| 74 | run_start = cur_val; | 
|---|
| 75 | } | 
|---|
| 76 | prev = c->array[i]; | 
|---|
| 77 | } | 
|---|
| 78 | // now prev is the last seen value | 
|---|
| 79 | add_run(answer, run_start, prev); | 
|---|
| 80 | // assert(run_container_cardinality(answer) == c->cardinality); | 
|---|
| 81 | return answer; | 
|---|
| 82 | } | 
|---|
| 83 |  | 
|---|
| 84 | /** | 
|---|
| 85 | * Convert the runcontainer to either a Bitmap or an Array Container, depending | 
|---|
| 86 | * on the cardinality.  Frees the container. | 
|---|
| 87 | * Allocates and returns new container, which caller is responsible for freeing | 
|---|
| 88 | */ | 
|---|
| 89 |  | 
|---|
| 90 | void *convert_to_bitset_or_array_container(run_container_t *r, int32_t card, | 
|---|
| 91 | uint8_t *resulttype) { | 
|---|
| 92 | if (card <= DEFAULT_MAX_SIZE) { | 
|---|
| 93 | array_container_t *answer = array_container_create_given_capacity(card); | 
|---|
| 94 | answer->cardinality = 0; | 
|---|
| 95 | for (int rlepos = 0; rlepos < r->n_runs; ++rlepos) { | 
|---|
| 96 | uint16_t run_start = r->runs[rlepos].value; | 
|---|
| 97 | uint16_t run_end = run_start + r->runs[rlepos].length; | 
|---|
| 98 | for (uint16_t run_value = run_start; run_value <= run_end; | 
|---|
| 99 | ++run_value) { | 
|---|
| 100 | answer->array[answer->cardinality++] = run_value; | 
|---|
| 101 | } | 
|---|
| 102 | } | 
|---|
| 103 | assert(card == answer->cardinality); | 
|---|
| 104 | *resulttype = ARRAY_CONTAINER_TYPE_CODE; | 
|---|
| 105 | run_container_free(r); | 
|---|
| 106 | return answer; | 
|---|
| 107 | } | 
|---|
| 108 | bitset_container_t *answer = bitset_container_create(); | 
|---|
| 109 | for (int rlepos = 0; rlepos < r->n_runs; ++rlepos) { | 
|---|
| 110 | uint16_t run_start = r->runs[rlepos].value; | 
|---|
| 111 | bitset_set_lenrange(answer->array, run_start, r->runs[rlepos].length); | 
|---|
| 112 | } | 
|---|
| 113 | answer->cardinality = card; | 
|---|
| 114 | *resulttype = BITSET_CONTAINER_TYPE_CODE; | 
|---|
| 115 | run_container_free(r); | 
|---|
| 116 | return answer; | 
|---|
| 117 | } | 
|---|
| 118 |  | 
|---|
| 119 | /* Converts a run container to either an array or a bitset, IF it saves space. | 
|---|
| 120 | */ | 
|---|
| 121 | /* If a conversion occurs, the caller is responsible to free the original | 
|---|
| 122 | * container and | 
|---|
| 123 | * he becomes responsible to free the new one. */ | 
|---|
| 124 | void *convert_run_to_efficient_container(run_container_t *c, | 
|---|
| 125 | uint8_t *typecode_after) { | 
|---|
| 126 | int32_t size_as_run_container = | 
|---|
| 127 | run_container_serialized_size_in_bytes(c->n_runs); | 
|---|
| 128 |  | 
|---|
| 129 | int32_t size_as_bitset_container = | 
|---|
| 130 | bitset_container_serialized_size_in_bytes(); | 
|---|
| 131 | int32_t card = run_container_cardinality(c); | 
|---|
| 132 | int32_t size_as_array_container = | 
|---|
| 133 | array_container_serialized_size_in_bytes(card); | 
|---|
| 134 |  | 
|---|
| 135 | int32_t min_size_non_run = | 
|---|
| 136 | size_as_bitset_container < size_as_array_container | 
|---|
| 137 | ? size_as_bitset_container | 
|---|
| 138 | : size_as_array_container; | 
|---|
| 139 | if (size_as_run_container <= min_size_non_run) {  // no conversion | 
|---|
| 140 | *typecode_after = RUN_CONTAINER_TYPE_CODE; | 
|---|
| 141 | return c; | 
|---|
| 142 | } | 
|---|
| 143 | if (card <= DEFAULT_MAX_SIZE) { | 
|---|
| 144 | // to array | 
|---|
| 145 | array_container_t *answer = array_container_create_given_capacity(card); | 
|---|
| 146 | answer->cardinality = 0; | 
|---|
| 147 | for (int rlepos = 0; rlepos < c->n_runs; ++rlepos) { | 
|---|
| 148 | int run_start = c->runs[rlepos].value; | 
|---|
| 149 | int run_end = run_start + c->runs[rlepos].length; | 
|---|
| 150 |  | 
|---|
| 151 | for (int run_value = run_start; run_value <= run_end; ++run_value) { | 
|---|
| 152 | answer->array[answer->cardinality++] = (uint16_t)run_value; | 
|---|
| 153 | } | 
|---|
| 154 | } | 
|---|
| 155 | *typecode_after = ARRAY_CONTAINER_TYPE_CODE; | 
|---|
| 156 | return answer; | 
|---|
| 157 | } | 
|---|
| 158 |  | 
|---|
| 159 | // else to bitset | 
|---|
| 160 | bitset_container_t *answer = bitset_container_create(); | 
|---|
| 161 |  | 
|---|
| 162 | for (int rlepos = 0; rlepos < c->n_runs; ++rlepos) { | 
|---|
| 163 | int start = c->runs[rlepos].value; | 
|---|
| 164 | int end = start + c->runs[rlepos].length; | 
|---|
| 165 | bitset_set_range(answer->array, start, end + 1); | 
|---|
| 166 | } | 
|---|
| 167 | answer->cardinality = card; | 
|---|
| 168 | *typecode_after = BITSET_CONTAINER_TYPE_CODE; | 
|---|
| 169 | return answer; | 
|---|
| 170 | } | 
|---|
| 171 |  | 
|---|
| 172 | // like convert_run_to_efficient_container but frees the old result if needed | 
|---|
| 173 | void *convert_run_to_efficient_container_and_free(run_container_t *c, | 
|---|
| 174 | uint8_t *typecode_after) { | 
|---|
| 175 | void *answer = convert_run_to_efficient_container(c, typecode_after); | 
|---|
| 176 | if (answer != c) run_container_free(c); | 
|---|
| 177 | return answer; | 
|---|
| 178 | } | 
|---|
| 179 |  | 
|---|
| 180 | /* once converted, the original container is disposed here, rather than | 
|---|
| 181 | in roaring_array | 
|---|
| 182 | */ | 
|---|
| 183 |  | 
|---|
| 184 | // TODO: split into run-  array-  and bitset-  subfunctions for sanity; | 
|---|
| 185 | // a few function calls won't really matter. | 
|---|
| 186 |  | 
|---|
| 187 | void *convert_run_optimize(void *c, uint8_t typecode_original, | 
|---|
| 188 | uint8_t *typecode_after) { | 
|---|
| 189 | if (typecode_original == RUN_CONTAINER_TYPE_CODE) { | 
|---|
| 190 | void *newc = convert_run_to_efficient_container((run_container_t *)c, | 
|---|
| 191 | typecode_after); | 
|---|
| 192 | if (newc != c) { | 
|---|
| 193 | container_free(c, typecode_original); | 
|---|
| 194 | } | 
|---|
| 195 | return newc; | 
|---|
| 196 | } else if (typecode_original == ARRAY_CONTAINER_TYPE_CODE) { | 
|---|
| 197 | // it might need to be converted to a run container. | 
|---|
| 198 | array_container_t *c_qua_array = (array_container_t *)c; | 
|---|
| 199 | int32_t n_runs = array_container_number_of_runs(c_qua_array); | 
|---|
| 200 | int32_t size_as_run_container = | 
|---|
| 201 | run_container_serialized_size_in_bytes(n_runs); | 
|---|
| 202 | int32_t card = array_container_cardinality(c_qua_array); | 
|---|
| 203 | int32_t size_as_array_container = | 
|---|
| 204 | array_container_serialized_size_in_bytes(card); | 
|---|
| 205 |  | 
|---|
| 206 | if (size_as_run_container >= size_as_array_container) { | 
|---|
| 207 | *typecode_after = ARRAY_CONTAINER_TYPE_CODE; | 
|---|
| 208 | return c; | 
|---|
| 209 | } | 
|---|
| 210 | // else convert array to run container | 
|---|
| 211 | run_container_t *answer = run_container_create_given_capacity(n_runs); | 
|---|
| 212 | int prev = -2; | 
|---|
| 213 | int run_start = -1; | 
|---|
| 214 |  | 
|---|
| 215 | assert(card > 0); | 
|---|
| 216 | for (int i = 0; i < card; ++i) { | 
|---|
| 217 | uint16_t cur_val = c_qua_array->array[i]; | 
|---|
| 218 | if (cur_val != prev + 1) { | 
|---|
| 219 | // new run starts; flush old one, if any | 
|---|
| 220 | if (run_start != -1) add_run(answer, run_start, prev); | 
|---|
| 221 | run_start = cur_val; | 
|---|
| 222 | } | 
|---|
| 223 | prev = c_qua_array->array[i]; | 
|---|
| 224 | } | 
|---|
| 225 | assert(run_start >= 0); | 
|---|
| 226 | // now prev is the last seen value | 
|---|
| 227 | add_run(answer, run_start, prev); | 
|---|
| 228 | *typecode_after = RUN_CONTAINER_TYPE_CODE; | 
|---|
| 229 | array_container_free(c_qua_array); | 
|---|
| 230 | return answer; | 
|---|
| 231 | } else if (typecode_original == | 
|---|
| 232 | BITSET_CONTAINER_TYPE_CODE) {  // run conversions on bitset | 
|---|
| 233 | // does bitset need conversion to run? | 
|---|
| 234 | bitset_container_t *c_qua_bitset = (bitset_container_t *)c; | 
|---|
| 235 | int32_t n_runs = bitset_container_number_of_runs(c_qua_bitset); | 
|---|
| 236 | int32_t size_as_run_container = | 
|---|
| 237 | run_container_serialized_size_in_bytes(n_runs); | 
|---|
| 238 | int32_t size_as_bitset_container = | 
|---|
| 239 | bitset_container_serialized_size_in_bytes(); | 
|---|
| 240 |  | 
|---|
| 241 | if (size_as_bitset_container <= size_as_run_container) { | 
|---|
| 242 | // no conversion needed. | 
|---|
| 243 | *typecode_after = BITSET_CONTAINER_TYPE_CODE; | 
|---|
| 244 | return c; | 
|---|
| 245 | } | 
|---|
| 246 | // bitset to runcontainer (ported from Java  RunContainer( | 
|---|
| 247 | // BitmapContainer bc, int nbrRuns)) | 
|---|
| 248 | assert(n_runs > 0);  // no empty bitmaps | 
|---|
| 249 | run_container_t *answer = run_container_create_given_capacity(n_runs); | 
|---|
| 250 |  | 
|---|
| 251 | int long_ctr = 0; | 
|---|
| 252 | uint64_t cur_word = c_qua_bitset->array[0]; | 
|---|
| 253 | int run_count = 0; | 
|---|
| 254 | while (true) { | 
|---|
| 255 | while (cur_word == UINT64_C(0) && | 
|---|
| 256 | long_ctr < BITSET_CONTAINER_SIZE_IN_WORDS - 1) | 
|---|
| 257 | cur_word = c_qua_bitset->array[++long_ctr]; | 
|---|
| 258 |  | 
|---|
| 259 | if (cur_word == UINT64_C(0)) { | 
|---|
| 260 | bitset_container_free(c_qua_bitset); | 
|---|
| 261 | *typecode_after = RUN_CONTAINER_TYPE_CODE; | 
|---|
| 262 | return answer; | 
|---|
| 263 | } | 
|---|
| 264 |  | 
|---|
| 265 | int local_run_start = __builtin_ctzll(cur_word); | 
|---|
| 266 | int run_start = local_run_start + 64 * long_ctr; | 
|---|
| 267 | uint64_t cur_word_with_1s = cur_word | (cur_word - 1); | 
|---|
| 268 |  | 
|---|
| 269 | int run_end = 0; | 
|---|
| 270 | while (cur_word_with_1s == UINT64_C(0xFFFFFFFFFFFFFFFF) && | 
|---|
| 271 | long_ctr < BITSET_CONTAINER_SIZE_IN_WORDS - 1) | 
|---|
| 272 | cur_word_with_1s = c_qua_bitset->array[++long_ctr]; | 
|---|
| 273 |  | 
|---|
| 274 | if (cur_word_with_1s == UINT64_C(0xFFFFFFFFFFFFFFFF)) { | 
|---|
| 275 | run_end = 64 + long_ctr * 64;  // exclusive, I guess | 
|---|
| 276 | add_run(answer, run_start, run_end - 1); | 
|---|
| 277 | bitset_container_free(c_qua_bitset); | 
|---|
| 278 | *typecode_after = RUN_CONTAINER_TYPE_CODE; | 
|---|
| 279 | return answer; | 
|---|
| 280 | } | 
|---|
| 281 | int local_run_end = __builtin_ctzll(~cur_word_with_1s); | 
|---|
| 282 | run_end = local_run_end + long_ctr * 64; | 
|---|
| 283 | add_run(answer, run_start, run_end - 1); | 
|---|
| 284 | run_count++; | 
|---|
| 285 | cur_word = cur_word_with_1s & (cur_word_with_1s + 1); | 
|---|
| 286 | } | 
|---|
| 287 | return answer; | 
|---|
| 288 | } else { | 
|---|
| 289 | assert(false); | 
|---|
| 290 | __builtin_unreachable(); | 
|---|
| 291 | return NULL; | 
|---|
| 292 | } | 
|---|
| 293 | } | 
|---|
| 294 |  | 
|---|
| 295 | bitset_container_t *bitset_container_from_run_range(const run_container_t *run, | 
|---|
| 296 | uint32_t min, uint32_t max) { | 
|---|
| 297 | bitset_container_t *bitset = bitset_container_create(); | 
|---|
| 298 | int32_t union_cardinality = 0; | 
|---|
| 299 | for (int32_t i = 0; i < run->n_runs; ++i) { | 
|---|
| 300 | uint32_t rle_min = run->runs[i].value; | 
|---|
| 301 | uint32_t rle_max = rle_min + run->runs[i].length; | 
|---|
| 302 | bitset_set_lenrange(bitset->array, rle_min, rle_max - rle_min); | 
|---|
| 303 | union_cardinality += run->runs[i].length + 1; | 
|---|
| 304 | } | 
|---|
| 305 | union_cardinality += max - min + 1; | 
|---|
| 306 | union_cardinality -= bitset_lenrange_cardinality(bitset->array, min, max-min); | 
|---|
| 307 | bitset_set_lenrange(bitset->array, min, max - min); | 
|---|
| 308 | bitset->cardinality = union_cardinality; | 
|---|
| 309 | return bitset; | 
|---|
| 310 | } | 
|---|
| 311 |  | 
|---|