varnish-cache/bin/varnishd/hash/hash_critbit.c
0
/*-
1
 * Copyright (c) 2008-2011 Varnish Software AS
2
 * All rights reserved.
3
 *
4
 * Author: Poul-Henning Kamp <phk@phk.freebsd.dk>
5
 *
6
 * SPDX-License-Identifier: BSD-2-Clause
7
 *
8
 * Redistribution and use in source and binary forms, with or without
9
 * modification, are permitted provided that the following conditions
10
 * are met:
11
 * 1. Redistributions of source code must retain the above copyright
12
 *    notice, this list of conditions and the following disclaimer.
13
 * 2. Redistributions in binary form must reproduce the above copyright
14
 *    notice, this list of conditions and the following disclaimer in the
15
 *    documentation and/or other materials provided with the distribution.
16
 *
17
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
18
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20
 * ARE DISCLAIMED.  IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE
21
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27
 * SUCH DAMAGE.
28
 *
29
 * A Crit Bit tree based hash
30
 */
31
32
// #define PHK
33
34
#include "config.h"
35
36
#include <stdlib.h>
37
38
#include "cache/cache_varnishd.h"
39
#include "cache/cache_objhead.h"
40
41
#include "hash/hash_slinger.h"
42
#include "vmb.h"
43
#include "vtim.h"
44
45
static struct lock hcb_mtx;
46
47
/*---------------------------------------------------------------------
48
 * Table for finding out how many bits two bytes have in common,
49
 * counting from the MSB towards the LSB.
50
 * ie:
51
 *      hcb_bittbl[0x01 ^ 0x22] == 2
52
 *      hcb_bittbl[0x10 ^ 0x0b] == 3
53
 *
54
 */
55
56
static unsigned char hcb_bittbl[256];
57
58
static unsigned char
59 165120
hcb_bits(unsigned char x, unsigned char y)
60
{
61 165120
        return (hcb_bittbl[x ^ y]);
62
}
63
64
static void
65 36591
hcb_build_bittbl(void)
66
{
67
        unsigned char x;
68
        unsigned y;
69
70 36591
        y = 0;
71 329319
        for (x = 0; x < 8; x++)
72 4976376
                for (; y < (1U << x); y++)
73 4976376
                        hcb_bittbl[y] = 8 - x;
74
75
        /* Quick asserts for sanity check */
76 36591
        assert(hcb_bits(0x34, 0x34) == 8);
77 36591
        AZ(hcb_bits(0xaa, 0x55));
78 36591
        assert(hcb_bits(0x01, 0x22) == 2);
79 36591
        assert(hcb_bits(0x10, 0x0b) == 3);
80 36591
}
81
82
/*---------------------------------------------------------------------
83
 * For space reasons we overload the two pointers with two different
84
 * kinds of of pointers.  We cast them to uintptr_t's and abuse the
85
 * low two bits to tell them apart, assuming that Varnish will never
86
 * run on machines with less than 32bit alignment.
87
 *
88
 * Asserts will explode if these assumptions are not met.
89
 */
90
91
struct hcb_y {
92
        unsigned                magic;
93
#define HCB_Y_MAGIC             0x125c4bd2
94
        unsigned short          critbit;
95
        unsigned char           ptr;
96
        unsigned char           bitmask;
97
        volatile uintptr_t      leaf[2];
98
        VSTAILQ_ENTRY(hcb_y)    list;
99
};
100
101
#define HCB_BIT_NODE            (1<<0)
102
#define HCB_BIT_Y               (1<<1)
103
104
struct hcb_root {
105
        volatile uintptr_t      origo;
106
};
107
108
static struct hcb_root  hcb_root;
109
110
static VSTAILQ_HEAD(, hcb_y)    cool_y = VSTAILQ_HEAD_INITIALIZER(cool_y);
111
static VSTAILQ_HEAD(, hcb_y)    dead_y = VSTAILQ_HEAD_INITIALIZER(dead_y);
112
static VTAILQ_HEAD(, objhead)   cool_h = VTAILQ_HEAD_INITIALIZER(cool_h);
113
static VTAILQ_HEAD(, objhead)   dead_h = VTAILQ_HEAD_INITIALIZER(dead_h);
114
115
/*---------------------------------------------------------------------
116
 * Pointer accessor functions
117
 */
118
static int
119 89974
hcb_is_node(uintptr_t u)
120
{
121
122 89974
        return (u & HCB_BIT_NODE);
123
}
124
125
static int
126 188568
hcb_is_y(uintptr_t u)
127
{
128
129 188568
        return (u & HCB_BIT_Y);
130
}
131
132
static uintptr_t
133 57410
hcb_r_node(const struct objhead *n)
134
{
135
136 57410
        AZ((uintptr_t)n & (HCB_BIT_NODE | HCB_BIT_Y));
137 57410
        return (HCB_BIT_NODE | (uintptr_t)n);
138
}
139
140
static struct objhead *
141 89973
hcb_l_node(uintptr_t u)
142
{
143
144 89973
        assert(u & HCB_BIT_NODE);
145 89973
        AZ(u & HCB_BIT_Y);
146 89973
        return ((struct objhead *)(u & ~HCB_BIT_NODE));
147
}
148
149
static uintptr_t
150 18756
hcb_r_y(const struct hcb_y *y)
151
{
152
153 18756
        CHECK_OBJ_NOTNULL(y, HCB_Y_MAGIC);
154 18756
        AZ((uintptr_t)y & (HCB_BIT_NODE | HCB_BIT_Y));
155 18756
        return (HCB_BIT_Y | (uintptr_t)y);
156
}
157
158
static struct hcb_y *
159 80898
hcb_l_y(uintptr_t u)
160
{
161
162 80898
        AZ(u & HCB_BIT_NODE);
163 80898
        assert(u & HCB_BIT_Y);
164 80898
        return ((struct hcb_y *)(u & ~HCB_BIT_Y));
165
}
166
167
/*---------------------------------------------------------------------
168
 * Find the "critical" bit that separates these two digests
169
 */
170
171
static unsigned
172 18756
hcb_crit_bit(const uint8_t *digest, const struct objhead *oh2, struct hcb_y *y)
173
{
174
        unsigned char u, r;
175
176 18756
        CHECK_OBJ_NOTNULL(y, HCB_Y_MAGIC);
177 24356
        for (u = 0; u < DIGEST_LEN && digest[u] == oh2->digest[u]; u++)
178
                ;
179 18756
        assert(u < DIGEST_LEN);
180 18756
        r = hcb_bits(digest[u], oh2->digest[u]);
181 18756
        y->ptr = u;
182 18756
        y->bitmask = 0x80 >> r;
183 18756
        y->critbit = u * 8 + r;
184 18756
        return (y->critbit);
185
}
186
187
/*---------------------------------------------------------------------
188
 * Unless we have the lock, we need to be very careful about pointer
189
 * references into the tree, we cannot trust things to be the same
190
 * in two consecutive memory accesses.
191
 */
192
193
static struct objhead *
194 145939
hcb_insert(const struct worker *wrk, struct hcb_root *root,
195
    const uint8_t *digest, struct objhead **noh)
196
{
197
        volatile uintptr_t *p;
198
        uintptr_t pp;
199
        struct hcb_y *y, *y2;
200
        struct objhead *oh2;
201
        unsigned s, s2;
202
203 145939
        p = &root->origo;
204 145939
        pp = *p;
205 145939
        if (pp == 0) {
206 55964
                if (noh == NULL)
207 28017
                        return (NULL);
208 27947
                oh2 = *noh;
209 27947
                *noh = NULL;
210 27947
                memcpy(oh2->digest, digest, sizeof oh2->digest);
211 27947
                *p = hcb_r_node(oh2);
212 27947
                return (oh2);
213
        }
214
215 149679
        while (hcb_is_y(pp)) {
216 59704
                y = hcb_l_y(pp);
217 59704
                CHECK_OBJ_NOTNULL(y, HCB_Y_MAGIC);
218 59704
                assert(y->ptr < DIGEST_LEN);
219 59704
                s = (digest[y->ptr] & y->bitmask) != 0;
220 59704
                assert(s < 2);
221 59704
                p = &y->leaf[s];
222 59704
                pp = *p;
223
        }
224
225 89975
        if (pp == 0) {
226
                /* We raced hcb_delete and got a NULL pointer */
227 0
                assert(noh == NULL);
228 0
                return (NULL);
229
        }
230
231 89975
        assert(hcb_is_node(pp));
232
233
        /* We found a node, does it match ? */
234 89975
        oh2 = hcb_l_node(pp);
235 89975
        CHECK_OBJ_NOTNULL(oh2, OBJHEAD_MAGIC);
236 89975
        if (!memcmp(oh2->digest, digest, DIGEST_LEN))
237 52465
                return (oh2);
238
239 37510
        if (noh == NULL)
240 18754
                return (NULL);
241
242
        /* Insert */
243
244 18756
        TAKE_OBJ_NOTNULL(y2, &wrk->wpriv->nhashpriv, HCB_Y_MAGIC);
245 18756
        (void)hcb_crit_bit(digest, oh2, y2);
246 18756
        s2 = (digest[y2->ptr] & y2->bitmask) != 0;
247 18756
        assert(s2 < 2);
248 18756
        oh2 = *noh;
249 18756
        *noh = NULL;
250 18756
        memcpy(oh2->digest, digest, sizeof oh2->digest);
251 18756
        y2->leaf[s2] = hcb_r_node(oh2);
252 18756
        s2 = 1-s2;
253
254 18756
        p = &root->origo;
255 18756
        AN(*p);
256
257 32810
        while (hcb_is_y(*p)) {
258 17505
                y = hcb_l_y(*p);
259 17505
                CHECK_OBJ_NOTNULL(y, HCB_Y_MAGIC);
260 17505
                assert(y->critbit != y2->critbit);
261 17505
                if (y->critbit > y2->critbit)
262 3451
                        break;
263 14054
                assert(y->ptr < DIGEST_LEN);
264 14054
                s = (digest[y->ptr] & y->bitmask) != 0;
265 14054
                assert(s < 2);
266 14054
                p = &y->leaf[s];
267
        }
268 18756
        y2->leaf[s2] = *p;
269 18756
        VWMB();
270 18756
        *p = hcb_r_y(y2);
271 18756
        return (oh2);
272 145939
}
273
274
/*--------------------------------------------------------------------*/
275
276
static void
277 7018
hcb_delete(struct hcb_root *r, const struct objhead *oh)
278
{
279
        struct hcb_y *y;
280
        volatile uintptr_t *p;
281
        unsigned s;
282
283 7018
        if (r->origo == hcb_r_node(oh)) {
284 4627
                r->origo = 0;
285 4627
                return;
286
        }
287 2391
        p = &r->origo;
288 2391
        assert(hcb_is_y(*p));
289
290 2391
        y = NULL;
291 3689
        while (1) {
292 3689
                assert(hcb_is_y(*p));
293 3689
                y = hcb_l_y(*p);
294 3689
                assert(y->ptr < DIGEST_LEN);
295 3689
                s = (oh->digest[y->ptr] & y->bitmask) != 0;
296 3689
                assert(s < 2);
297 3689
                if (y->leaf[s] == hcb_r_node(oh)) {
298 2391
                        *p = y->leaf[1 - s];
299 2391
                        VSTAILQ_INSERT_TAIL(&cool_y, y, list);
300 2391
                        return;
301
                }
302 1298
                p = &y->leaf[s];
303
        }
304 7018
}
305
306
/*--------------------------------------------------------------------*/
307
308
static void * v_matchproto_(bgthread_t)
309 0
hcb_cleaner(struct worker *wrk, void *priv)
310
{
311
        struct hcb_y *y, *y2;
312
        struct objhead *oh, *oh2;
313
314 0
        (void)priv;
315 36591
        while (1) {
316 36591
                VSTAILQ_FOREACH_SAFE(y, &dead_y, list, y2) {
317 0
                        CHECK_OBJ_NOTNULL(y, HCB_Y_MAGIC);
318 0
                        VSTAILQ_REMOVE_HEAD(&dead_y, list);
319 0
                        FREE_OBJ(y);
320 0
                }
321 36591
                VTAILQ_FOREACH_SAFE(oh, &dead_h, hoh_list, oh2) {
322 0
                        CHECK_OBJ(oh, OBJHEAD_MAGIC);
323 0
                        VTAILQ_REMOVE(&dead_h, oh, hoh_list);
324 0
                        HSH_DeleteObjHead(wrk, oh);
325 0
                }
326 36591
                Lck_Lock(&hcb_mtx);
327 36591
                VSTAILQ_CONCAT(&dead_y, &cool_y);
328 36591
                VTAILQ_CONCAT(&dead_h, &cool_h, hoh_list);
329 36591
                Lck_Unlock(&hcb_mtx);
330 36591
                Pool_Sumstat(wrk);
331 36591
                VTIM_sleep(cache_param->critbit_cooloff);
332
        }
333
        NEEDLESS(return (NULL));
334
}
335
336
/*--------------------------------------------------------------------*/
337
338
static void v_matchproto_(hash_start_f)
339 36591
hcb_start(void)
340
{
341 36591
        struct objhead *oh = NULL;
342
        pthread_t tp;
343
344 36591
        (void)oh;
345 36591
        Lck_New(&hcb_mtx, lck_hcb);
346 36591
        WRK_BgThread(&tp, "hcb-cleaner", hcb_cleaner, NULL);
347 36591
        memset(&hcb_root, 0, sizeof hcb_root);
348 36591
        hcb_build_bittbl();
349 36591
}
350
351
static int v_matchproto_(hash_deref_f)
352 57714
hcb_deref(struct worker *wrk, struct objhead *oh)
353
{
354
        int r;
355
356 57714
        (void)wrk;
357 57714
        CHECK_OBJ_NOTNULL(oh, OBJHEAD_MAGIC);
358 57714
        Lck_AssertHeld(&oh->mtx);
359 57714
        assert(oh->refcnt > 0);
360 57714
        r = --oh->refcnt;
361 57714
        if (oh->refcnt == 0) {
362 7018
                Lck_Lock(&hcb_mtx);
363 7018
                hcb_delete(&hcb_root, oh);
364 7018
                VTAILQ_INSERT_TAIL(&cool_h, oh, hoh_list);
365 7018
                Lck_Unlock(&hcb_mtx);
366 7018
        }
367 57714
        Lck_Unlock(&oh->mtx);
368
#ifdef PHK
369
        fprintf(stderr, "hcb_defef %d %d <%s>\n", __LINE__, r, oh->hash);
370
#endif
371 57714
        return (r);
372
}
373
374
static struct objhead * v_matchproto_(hash_lookup_f)
375 99173
hcb_lookup(struct worker *wrk, const void *digest, struct objhead **noh)
376
{
377
        struct objhead *oh;
378
        struct hcb_y *y;
379
        unsigned u;
380
381 99173
        CHECK_OBJ_NOTNULL(wrk, WORKER_MAGIC);
382 99173
        AN(digest);
383 99173
        if (noh != NULL) {
384 99164
                CHECK_OBJ_NOTNULL(*noh, OBJHEAD_MAGIC);
385 99164
                assert((*noh)->refcnt == 1);
386 99164
        }
387
388
        /* First try in read-only mode without holding a lock */
389
390 99173
        wrk->stats->hcb_nolock++;
391 99173
        oh = hcb_insert(wrk, &hcb_root, digest, NULL);
392 99173
        if (oh != NULL) {
393 52396
                Lck_Lock(&oh->mtx);
394
                /*
395
                 * A refcount of zero indicates that the tree changed
396
                 * under us, so fall through and try with the lock held.
397
                 */
398 52396
                u = oh->refcnt;
399 52396
                if (u > 0) {
400 52396
                        oh->refcnt++;
401 52396
                        return (oh);
402
                }
403 0
                Lck_Unlock(&oh->mtx);
404 0
        }
405
406 46777
        while (1) {
407
                /* No luck, try with lock held, so we can modify tree */
408 46777
                CAST_OBJ_NOTNULL(y, wrk->wpriv->nhashpriv, HCB_Y_MAGIC);
409 46777
                Lck_Lock(&hcb_mtx);
410 46777
                VSC_C_main->hcb_lock++;
411 46777
                oh = hcb_insert(wrk, &hcb_root, digest, noh);
412 46777
                Lck_Unlock(&hcb_mtx);
413
414 46777
                if (oh == NULL)
415 0
                        return (NULL);
416
417 46777
                Lck_Lock(&oh->mtx);
418
419 46777
                CHECK_OBJ_NOTNULL(oh, OBJHEAD_MAGIC);
420 46777
                if (noh != NULL && *noh == NULL) {
421 46703
                        assert(oh->refcnt > 0);
422 46703
                        VSC_C_main->hcb_insert++;
423 46703
                        return (oh);
424
                }
425
                /*
426
                 * A refcount of zero indicates that the tree changed
427
                 * under us, so fall through and try with the lock held.
428
                 */
429 74
                u = oh->refcnt;
430 74
                if (u > 0) {
431 74
                        oh->refcnt++;
432 74
                        return (oh);
433
                }
434 0
                Lck_Unlock(&oh->mtx);
435
        }
436 99173
}
437
438
static void v_matchproto_(hash_prep_f)
439 101074
hcb_prep(struct worker *wrk)
440
{
441
        struct hcb_y *y;
442
443 101074
        if (wrk->wpriv->nhashpriv == NULL) {
444 47121
                ALLOC_OBJ(y, HCB_Y_MAGIC);
445 47121
                AN(y);
446 47121
                wrk->wpriv->nhashpriv = y;
447 47121
        }
448 101074
}
449
450
const struct hash_slinger hcb_slinger = {
451
        .magic  =       SLINGER_MAGIC,
452
        .name   =       "critbit",
453
        .start  =       hcb_start,
454
        .lookup =       hcb_lookup,
455
        .prep =         hcb_prep,
456
        .deref  =       hcb_deref,
457
};