varnish-cache/bin/varnishd/hash/hash_critbit.c
0
/*-
1
 * Copyright (c) 2008-2011 Varnish Software AS
2
 * All rights reserved.
3
 *
4
 * Author: Poul-Henning Kamp <phk@phk.freebsd.dk>
5
 *
6
 * SPDX-License-Identifier: BSD-2-Clause
7
 *
8
 * Redistribution and use in source and binary forms, with or without
9
 * modification, are permitted provided that the following conditions
10
 * are met:
11
 * 1. Redistributions of source code must retain the above copyright
12
 *    notice, this list of conditions and the following disclaimer.
13
 * 2. Redistributions in binary form must reproduce the above copyright
14
 *    notice, this list of conditions and the following disclaimer in the
15
 *    documentation and/or other materials provided with the distribution.
16
 *
17
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
18
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20
 * ARE DISCLAIMED.  IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE
21
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27
 * SUCH DAMAGE.
28
 *
29
 * A Crit Bit tree based hash
30
 */
31
32
// #define PHK
33
34
#include "config.h"
35
36
#include <stdlib.h>
37
38
#include "cache/cache_varnishd.h"
39
#include "cache/cache_objhead.h"
40
41
#include "hash/hash_slinger.h"
42
#include "vmb.h"
43
#include "vtim.h"
44
45
static struct lock hcb_mtx;
46
47
/*---------------------------------------------------------------------
48
 * Table for finding out how many bits two bytes have in common,
49
 * counting from the MSB towards the LSB.
50
 * ie:
51
 *      hcb_bittbl[0x01 ^ 0x22] == 2
52
 *      hcb_bittbl[0x10 ^ 0x0b] == 3
53
 *
54
 */
55
56
static unsigned char hcb_bittbl[256];
57
58
static unsigned char
59 100122
hcb_bits(unsigned char x, unsigned char y)
60
{
61 100122
        return (hcb_bittbl[x ^ y]);
62
}
63
64
static void
65 22144
hcb_build_bittbl(void)
66
{
67
        unsigned char x;
68
        unsigned y;
69
70 22144
        y = 0;
71 199296
        for (x = 0; x < 8; x++)
72 3011584
                for (; y < (1U << x); y++)
73 3011584
                        hcb_bittbl[y] = 8 - x;
74
75
        /* Quick asserts for sanity check */
76 22144
        assert(hcb_bits(0x34, 0x34) == 8);
77 22144
        AZ(hcb_bits(0xaa, 0x55));
78 22144
        assert(hcb_bits(0x01, 0x22) == 2);
79 22144
        assert(hcb_bits(0x10, 0x0b) == 3);
80 22144
}
81
82
/*---------------------------------------------------------------------
83
 * For space reasons we overload the two pointers with two different
84
 * kinds of of pointers.  We cast them to uintptr_t's and abuse the
85
 * low two bits to tell them apart, assuming that Varnish will never
86
 * run on machines with less than 32bit alignment.
87
 *
88
 * Asserts will explode if these assumptions are not met.
89
 */
90
91
struct hcb_y {
92
        unsigned                magic;
93
#define HCB_Y_MAGIC             0x125c4bd2
94
        unsigned short          critbit;
95
        unsigned char           ptr;
96
        unsigned char           bitmask;
97
        volatile uintptr_t      leaf[2];
98
        VSTAILQ_ENTRY(hcb_y)    list;
99
};
100
101
#define HCB_BIT_NODE            (1<<0)
102
#define HCB_BIT_Y               (1<<1)
103
104
struct hcb_root {
105
        volatile uintptr_t      origo;
106
};
107
108
static struct hcb_root  hcb_root;
109
110
static VSTAILQ_HEAD(, hcb_y)    cool_y = VSTAILQ_HEAD_INITIALIZER(cool_y);
111
static VSTAILQ_HEAD(, hcb_y)    dead_y = VSTAILQ_HEAD_INITIALIZER(dead_y);
112
static VTAILQ_HEAD(, objhead)   cool_h = VTAILQ_HEAD_INITIALIZER(cool_h);
113
static VTAILQ_HEAD(, objhead)   dead_h = VTAILQ_HEAD_INITIALIZER(dead_h);
114
115
/*---------------------------------------------------------------------
116
 * Pointer accessor functions
117
 */
118
static int
119 54645
hcb_is_node(uintptr_t u)
120
{
121
122 54645
        return (u & HCB_BIT_NODE);
123
}
124
125
static int
126 115453
hcb_is_y(uintptr_t u)
127
{
128
129 115453
        return (u & HCB_BIT_Y);
130
}
131
132
static uintptr_t
133 35289
hcb_r_node(const struct objhead *n)
134
{
135
136 35289
        AZ((uintptr_t)n & (HCB_BIT_NODE | HCB_BIT_Y));
137 35289
        return (HCB_BIT_NODE | (uintptr_t)n);
138
}
139
140
static struct objhead *
141 54648
hcb_l_node(uintptr_t u)
142
{
143
144 54648
        assert(u & HCB_BIT_NODE);
145 54648
        AZ(u & HCB_BIT_Y);
146 54648
        return ((struct objhead *)(u & ~HCB_BIT_NODE));
147
}
148
149
static uintptr_t
150 11546
hcb_r_y(const struct hcb_y *y)
151
{
152
153 11546
        CHECK_OBJ_NOTNULL(y, HCB_Y_MAGIC);
154 11546
        AZ((uintptr_t)y & (HCB_BIT_NODE | HCB_BIT_Y));
155 11546
        return (HCB_BIT_Y | (uintptr_t)y);
156
}
157
158
static struct hcb_y *
159 49949
hcb_l_y(uintptr_t u)
160
{
161
162 49949
        AZ(u & HCB_BIT_NODE);
163 49949
        assert(u & HCB_BIT_Y);
164 49949
        return ((struct hcb_y *)(u & ~HCB_BIT_Y));
165
}
166
167
/*---------------------------------------------------------------------
168
 * Find the "critical" bit that separates these two digests
169
 */
170
171
static unsigned
172 11546
hcb_crit_bit(const uint8_t *digest, const struct objhead *oh2, struct hcb_y *y)
173
{
174
        unsigned char u, r;
175
176 11546
        CHECK_OBJ_NOTNULL(y, HCB_Y_MAGIC);
177 15046
        for (u = 0; u < DIGEST_LEN && digest[u] == oh2->digest[u]; u++)
178
                ;
179 11546
        assert(u < DIGEST_LEN);
180 11546
        r = hcb_bits(digest[u], oh2->digest[u]);
181 11546
        y->ptr = u;
182 11546
        y->bitmask = 0x80 >> r;
183 11546
        y->critbit = u * 8 + r;
184 11546
        return (y->critbit);
185
}
186
187
/*---------------------------------------------------------------------
188
 * Unless we have the lock, we need to be very careful about pointer
189
 * references into the tree, we cannot trust things to be the same
190
 * in two consecutive memory accesses.
191
 */
192
193
static struct objhead *
194 89129
hcb_insert(const struct worker *wrk, struct hcb_root *root,
195
    const uint8_t *digest, struct objhead **noh)
196
{
197
        volatile uintptr_t *p;
198
        uintptr_t pp;
199
        struct hcb_y *y, *y2;
200
        struct objhead *oh2;
201
        unsigned s, s2;
202
203 89129
        p = &root->origo;
204 89129
        pp = *p;
205 89129
        if (pp == 0) {
206 34479
                if (noh == NULL)
207 17256
                        return (NULL);
208 17223
                oh2 = *noh;
209 17223
                *noh = NULL;
210 17223
                memcpy(oh2->digest, digest, sizeof oh2->digest);
211 17223
                *p = hcb_r_node(oh2);
212 17223
                return (oh2);
213
        }
214
215 91582
        while (hcb_is_y(pp)) {
216 36932
                y = hcb_l_y(pp);
217 36932
                CHECK_OBJ_NOTNULL(y, HCB_Y_MAGIC);
218 36932
                assert(y->ptr < DIGEST_LEN);
219 36932
                s = (digest[y->ptr] & y->bitmask) != 0;
220 36932
                assert(s < 2);
221 36932
                p = &y->leaf[s];
222 36932
                pp = *p;
223
        }
224
225 54650
        if (pp == 0) {
226
                /* We raced hcb_delete and got a NULL pointer */
227 0
                assert(noh == NULL);
228 0
                return (NULL);
229
        }
230
231 54650
        assert(hcb_is_node(pp));
232
233
        /* We found a node, does it match ? */
234 54650
        oh2 = hcb_l_node(pp);
235 54650
        CHECK_OBJ_NOTNULL(oh2, OBJHEAD_MAGIC);
236 54650
        if (!memcmp(oh2->digest, digest, DIGEST_LEN))
237 31565
                return (oh2);
238
239 23085
        if (noh == NULL)
240 11539
                return (NULL);
241
242
        /* Insert */
243
244 11546
        TAKE_OBJ_NOTNULL(y2, &wrk->wpriv->nhashpriv, HCB_Y_MAGIC);
245 11546
        (void)hcb_crit_bit(digest, oh2, y2);
246 11546
        s2 = (digest[y2->ptr] & y2->bitmask) != 0;
247 11546
        assert(s2 < 2);
248 11546
        oh2 = *noh;
249 11546
        *noh = NULL;
250 11546
        memcpy(oh2->digest, digest, sizeof oh2->digest);
251 11546
        y2->leaf[s2] = hcb_r_node(oh2);
252 11546
        s2 = 1-s2;
253
254 11546
        p = &root->origo;
255 11546
        AN(*p);
256
257 20229
        while (hcb_is_y(*p)) {
258 10813
                y = hcb_l_y(*p);
259 10813
                CHECK_OBJ_NOTNULL(y, HCB_Y_MAGIC);
260 10813
                assert(y->critbit != y2->critbit);
261 10813
                if (y->critbit > y2->critbit)
262 2130
                        break;
263 8683
                assert(y->ptr < DIGEST_LEN);
264 8683
                s = (digest[y->ptr] & y->bitmask) != 0;
265 8683
                assert(s < 2);
266 8683
                p = &y->leaf[s];
267
        }
268 11546
        y2->leaf[s2] = *p;
269 11546
        VWMB();
270 11546
        *p = hcb_r_y(y2);
271 11546
        return (oh2);
272 89129
}
273
274
/*--------------------------------------------------------------------*/
275
276
static void
277 4317
hcb_delete(struct hcb_root *r, const struct objhead *oh)
278
{
279
        struct hcb_y *y;
280
        volatile uintptr_t *p;
281
        unsigned s;
282
283 4317
        if (r->origo == hcb_r_node(oh)) {
284 2873
                r->origo = 0;
285 2873
                return;
286
        }
287 1444
        p = &r->origo;
288 1444
        assert(hcb_is_y(*p));
289
290 1444
        y = NULL;
291 2203
        while (1) {
292 2203
                assert(hcb_is_y(*p));
293 2203
                y = hcb_l_y(*p);
294 2203
                assert(y->ptr < DIGEST_LEN);
295 2203
                s = (oh->digest[y->ptr] & y->bitmask) != 0;
296 2203
                assert(s < 2);
297 2203
                if (y->leaf[s] == hcb_r_node(oh)) {
298 1444
                        *p = y->leaf[1 - s];
299 1444
                        VSTAILQ_INSERT_TAIL(&cool_y, y, list);
300 1444
                        return;
301
                }
302 759
                p = &y->leaf[s];
303
        }
304 4317
}
305
306
/*--------------------------------------------------------------------*/
307
308
static void * v_matchproto_(bgthread_t)
309 0
hcb_cleaner(struct worker *wrk, void *priv)
310
{
311
        struct hcb_y *y, *y2;
312
        struct objhead *oh, *oh2;
313
314 0
        (void)priv;
315 22144
        while (1) {
316 22144
                VSTAILQ_FOREACH_SAFE(y, &dead_y, list, y2) {
317 0
                        CHECK_OBJ_NOTNULL(y, HCB_Y_MAGIC);
318 0
                        VSTAILQ_REMOVE_HEAD(&dead_y, list);
319 0
                        FREE_OBJ(y);
320 0
                }
321 22144
                VTAILQ_FOREACH_SAFE(oh, &dead_h, hoh_list, oh2) {
322 0
                        CHECK_OBJ(oh, OBJHEAD_MAGIC);
323 0
                        VTAILQ_REMOVE(&dead_h, oh, hoh_list);
324 0
                        HSH_DeleteObjHead(wrk, oh);
325 0
                }
326 22144
                Lck_Lock(&hcb_mtx);
327 22144
                VSTAILQ_CONCAT(&dead_y, &cool_y);
328 22144
                VTAILQ_CONCAT(&dead_h, &cool_h, hoh_list);
329 22144
                Lck_Unlock(&hcb_mtx);
330 22144
                Pool_Sumstat(wrk);
331 22144
                VTIM_sleep(cache_param->critbit_cooloff);
332
        }
333
        NEEDLESS(return (NULL));
334
}
335
336
/*--------------------------------------------------------------------*/
337
338
static void v_matchproto_(hash_start_f)
339 22144
hcb_start(void)
340
{
341 22144
        struct objhead *oh = NULL;
342
        pthread_t tp;
343
344 22144
        (void)oh;
345 22144
        Lck_New(&hcb_mtx, lck_hcb);
346 22144
        WRK_BgThread(&tp, "hcb-cleaner", hcb_cleaner, NULL);
347 22144
        memset(&hcb_root, 0, sizeof hcb_root);
348 22144
        hcb_build_bittbl();
349 22144
}
350
351
static int v_matchproto_(hash_deref_f)
352 34771
hcb_deref(struct worker *wrk, struct objhead *oh)
353
{
354
        int r;
355
356 34771
        (void)wrk;
357 34771
        CHECK_OBJ_NOTNULL(oh, OBJHEAD_MAGIC);
358 34771
        Lck_AssertHeld(&oh->mtx);
359 34771
        assert(oh->refcnt > 0);
360 34771
        r = --oh->refcnt;
361 34771
        if (oh->refcnt == 0) {
362 4317
                Lck_Lock(&hcb_mtx);
363 4317
                hcb_delete(&hcb_root, oh);
364 4317
                VTAILQ_INSERT_TAIL(&cool_h, oh, hoh_list);
365 4317
                Lck_Unlock(&hcb_mtx);
366 4317
        }
367 34771
        Lck_Unlock(&oh->mtx);
368
#ifdef PHK
369
        fprintf(stderr, "hcb_defef %d %d <%s>\n", __LINE__, r, oh->hash);
370
#endif
371 34771
        return (r);
372
}
373
374
static struct objhead * v_matchproto_(hash_lookup_f)
375 60333
hcb_lookup(struct worker *wrk, const void *digest, struct objhead **noh)
376
{
377
        struct objhead *oh;
378
        struct hcb_y *y;
379
        unsigned u;
380
381 60333
        CHECK_OBJ_NOTNULL(wrk, WORKER_MAGIC);
382 60333
        AN(digest);
383 60333
        if (noh != NULL) {
384 60329
                CHECK_OBJ_NOTNULL(*noh, OBJHEAD_MAGIC);
385 60329
                assert((*noh)->refcnt == 1);
386 60329
        }
387
388
        /* First try in read-only mode without holding a lock */
389
390 60333
        wrk->stats->hcb_nolock++;
391 60333
        oh = hcb_insert(wrk, &hcb_root, digest, NULL);
392 60333
        if (oh != NULL) {
393 31533
                Lck_Lock(&oh->mtx);
394
                /*
395
                 * A refcount of zero indicates that the tree changed
396
                 * under us, so fall through and try with the lock held.
397
                 */
398 31533
                u = oh->refcnt;
399 31533
                if (u > 0) {
400 31532
                        oh->refcnt++;
401 31532
                        return (oh);
402
                }
403 1
                Lck_Unlock(&oh->mtx);
404 1
        }
405
406 28801
        while (1) {
407
                /* No luck, try with lock held, so we can modify tree */
408 28801
                CAST_OBJ_NOTNULL(y, wrk->wpriv->nhashpriv, HCB_Y_MAGIC);
409 28801
                Lck_Lock(&hcb_mtx);
410 28801
                VSC_C_main->hcb_lock++;
411 28801
                oh = hcb_insert(wrk, &hcb_root, digest, noh);
412 28801
                Lck_Unlock(&hcb_mtx);
413
414 28801
                if (oh == NULL)
415 0
                        return (NULL);
416
417 28801
                Lck_Lock(&oh->mtx);
418
419 28801
                CHECK_OBJ_NOTNULL(oh, OBJHEAD_MAGIC);
420 28801
                if (noh != NULL && *noh == NULL) {
421 28769
                        assert(oh->refcnt > 0);
422 28769
                        VSC_C_main->hcb_insert++;
423 28769
                        return (oh);
424
                }
425
                /*
426
                 * A refcount of zero indicates that the tree changed
427
                 * under us, so fall through and try with the lock held.
428
                 */
429 32
                u = oh->refcnt;
430 32
                if (u > 0) {
431 32
                        oh->refcnt++;
432 32
                        return (oh);
433
                }
434 0
                Lck_Unlock(&oh->mtx);
435
        }
436 60333
}
437
438
static void v_matchproto_(hash_prep_f)
439 61491
hcb_prep(struct worker *wrk)
440
{
441
        struct hcb_y *y;
442
443 61491
        if (wrk->wpriv->nhashpriv == NULL) {
444 28953
                ALLOC_OBJ(y, HCB_Y_MAGIC);
445 28953
                AN(y);
446 28953
                wrk->wpriv->nhashpriv = y;
447 28953
        }
448 61491
}
449
450
const struct hash_slinger hcb_slinger = {
451
        .magic  =       SLINGER_MAGIC,
452
        .name   =       "critbit",
453
        .start  =       hcb_start,
454
        .lookup =       hcb_lookup,
455
        .prep =         hcb_prep,
456
        .deref  =       hcb_deref,
457
};