varnish-cache/lib/libvarnishapi/vsl_dispatch.c
0
/*-
1
 * Copyright (c) 2006 Verdens Gang AS
2
 * Copyright (c) 2006-2015 Varnish Software AS
3
 * All rights reserved.
4
 *
5
 * Author: Martin Blix Grydeland <martin@varnish-software.com>
6
 *
7
 * SPDX-License-Identifier: BSD-2-Clause
8
 *
9
 * Redistribution and use in source and binary forms, with or without
10
 * modification, are permitted provided that the following conditions
11
 * are met:
12
 * 1. Redistributions of source code must retain the above copyright
13
 *    notice, this list of conditions and the following disclaimer.
14
 * 2. Redistributions in binary form must reproduce the above copyright
15
 *    notice, this list of conditions and the following disclaimer in the
16
 *    documentation and/or other materials provided with the distribution.
17
 *
18
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
19
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21
 * ARE DISCLAIMED.  IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE
22
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
23
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
24
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
25
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
26
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
27
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
28
 * SUCH DAMAGE.
29
 *
30
 */
31
32
#include "config.h"
33
34
#include <stdarg.h>
35
#include <stdint.h>
36
#include <stdio.h>
37
#include <stdlib.h>
38
#include <string.h>
39
40
#include "vdef.h"
41
#include "vas.h"
42
#include "miniobj.h"
43
44
#include "vqueue.h"
45
#include "vre.h"
46
#include "vtim.h"
47
#include "vtree.h"
48
49
#include "vapi/vsl.h"
50
51
#include "vsl_api.h"
52
53
/* Upper bound on the number of retired vtx structures kept for reuse */
#define VTX_CACHE               10
/* Initial capacity of a buf chunk, counted in uint32_t words */
#define VTX_BUFSIZE_MIN         64
/* Number of shm chunks embedded in every vtx */
#define VTX_SHMCHUNKS           3
56
57
/*
 * Textual transaction type names, indexed by enum VSL_transaction_e.
 * vtx_parse_link() compares the first word of a record against these.
 */
static const char * const vsl_t_names[VSL_t__MAX] = {
        [VSL_t_unknown] = "unknown",
        [VSL_t_sess] = "sess",
        [VSL_t_req] = "req",
        [VSL_t_bereq] = "bereq",
        [VSL_t_raw] = "raw",
};
64
65
/*
 * Textual transaction reason names, indexed by enum VSL_reason_e.
 * vtx_parse_link() compares the third word of a record against these.
 */
static const char * const vsl_r_names[VSL_r__MAX] = {
        [VSL_r_unknown] = "unknown",
        [VSL_r_http_1] = "HTTP/1",
        [VSL_r_rxreq] = "rxreq",
        [VSL_r_esi] = "esi",
        [VSL_r_restart] = "restart",
        [VSL_r_pass] = "pass",
        [VSL_r_fetch] = "fetch",
        [VSL_r_bgfetch] = "bgfetch",
        [VSL_r_pipe] = "pipe",
};
76
77
/* struct vtx is defined further down; declare it and its tail queue head */
struct vtx;
VTAILQ_HEAD(vtxhead, vtx);
79
80
struct vslc_raw {
81
        unsigned                magic;
82
#define VSLC_RAW_MAGIC          0x247EBD44
83
84
        struct VSL_cursor       cursor;
85
86
        const uint32_t          *ptr;
87
};
88
89
struct synth {
90
        unsigned                magic;
91
#define SYNTH_MAGIC             0xC654479F
92
93
        VTAILQ_ENTRY(synth)     list;
94
        size_t                  offset;
95
        uint32_t                data[VSL_OVERHEAD + VSL_WORDS(64)];
96
};
97
VTAILQ_HEAD(synthhead, synth);
98
99
/* Storage flavour of a struct chunk */
enum chunk_t {
        chunk_t__unassigned,    /* zero value, no storage selected */
        chunk_t_shm,            /* chunk uses the shm member of its union */
        chunk_t_buf,            /* chunk uses the buf member of its union */
};
104
105
struct chunk {
106
        unsigned                                magic;
107
#define CHUNK_MAGIC                             0x48DC0194
108
        enum chunk_t                            type;
109
        union {
110
                struct {
111
                        struct VSLC_ptr         start;
112
                        VTAILQ_ENTRY(chunk)     shmref;
113
                } shm;
114
                struct {
115
                        uint32_t                *data;
116
                        size_t                  space;
117
                } buf;
118
        };
119
        size_t                                  len;
120
        struct vtx                              *vtx;
121
        VTAILQ_ENTRY(chunk)                     list;
122
};
123
VTAILQ_HEAD(chunkhead, chunk);
124
125
struct vslc_vtx {
126
        unsigned                magic;
127
#define VSLC_VTX_MAGIC          0x74C6523F
128
129
        struct VSL_cursor       cursor;
130
131
        struct vtx              *vtx;
132
        struct synth            *synth;
133
        struct chunk            *chunk;
134
        size_t                  chunkstart;
135
        size_t                  offset;
136
};
137
138
struct vtx_key {
139
        uint64_t                vxid;
140
        VRBT_ENTRY(vtx_key)     entry;
141
};
142
VRBT_HEAD(vtx_tree, vtx_key);
143
144
struct vtx {
145
        struct vtx_key          key;
146
        unsigned                magic;
147
#define VTX_MAGIC               0xACC21D09
148
        VTAILQ_ENTRY(vtx)       list_child;
149
        VTAILQ_ENTRY(vtx)       list_vtx;
150
151
        double                  t_start;
152
        unsigned                flags;
153
#define VTX_F_BEGIN             0x1 /* Begin record processed */
154
#define VTX_F_END               0x2 /* End record processed */
155
#define VTX_F_COMPLETE          0x4 /* Marked complete. No new children
156
                                       should be appended */
157
#define VTX_F_READY             0x8 /* This vtx and all it's children are
158
                                       complete */
159
160
        enum VSL_transaction_e  type;
161
        enum VSL_reason_e       reason;
162
163
        struct vtx              *parent;
164
        struct vtxhead          child;
165
        unsigned                n_child;
166
        unsigned                n_childready;
167
        unsigned                n_descend;
168
169
        struct synthhead        synth;
170
171
        struct chunk            shmchunks[VTX_SHMCHUNKS];
172
        struct chunkhead        shmchunks_free;
173
174
        struct chunkhead        chunks;
175
        size_t                  len;
176
177
        struct vslc_vtx         c;
178
};
179
180
struct VSLQ {
181
        unsigned                magic;
182
#define VSLQ_MAGIC              0x23A8BE97
183
184
        struct VSL_data         *vsl;
185
        struct VSL_cursor       *c;
186
        struct vslq_query       *query;
187
188
        enum VSL_grouping_e     grouping;
189
190
        /* Structured mode */
191
        struct vtx_tree         tree;
192
        struct vtxhead          ready;
193
        struct vtxhead          incomplete;
194
        int                     n_outstanding;
195
        struct chunkhead        shmrefs;
196
        struct vtxhead          cache;
197
        unsigned                n_cache;
198
199
        /* Rate limiting */
200
        double                  credits;
201
        vtim_mono               last_use;
202
203
        /* Raw mode */
204
        struct {
205
                struct vslc_raw         c;
206
                struct VSL_transaction  trans;
207
                struct VSL_transaction  *ptrans[2];
208
                struct VSLC_ptr         start;
209
                ssize_t                 len;
210
                ssize_t                 offset;
211
        } raw;
212
};
213
214
/* Helpers defined later in this file but used before their definition */
static void vtx_synth_rec(struct vtx *vtx, unsigned tag, const char *fmt, ...);

/*lint -esym(534, vtx_diag) */
static int vtx_diag(struct vtx *vtx, const char *msg);

/*lint -esym(534, vtx_diag_tag) */
static int vtx_diag_tag(struct vtx *vtx, const uint32_t *ptr,
    const char *reason);
220
221
static inline int
222 504506
vtx_keycmp(const struct vtx_key *a, const struct vtx_key *b)
223
{
224 504506
        if (a->vxid < b->vxid)
225 14157
                return (-1);
226 490349
        if (a->vxid > b->vxid)
227 198444
                return (1);
228 291905
        return (0);
229 504506
}
230
231 33822
/*
 * Instantiate the file-local red-black tree operations for vtx_tree;
 * insertion and lookup order the keys with vtx_keycmp().
 */
VRBT_GENERATE_REMOVE_COLOR(vtx_tree, vtx_key, entry, static)
VRBT_GENERATE_REMOVE(vtx_tree, vtx_key, entry, static)
VRBT_GENERATE_INSERT_COLOR(vtx_tree, vtx_key, entry, static)
VRBT_GENERATE_INSERT_FINISH(vtx_tree, vtx_key, entry, static)
VRBT_GENERATE_INSERT(vtx_tree, vtx_key, entry, vtx_keycmp, static)
VRBT_GENERATE_FIND(vtx_tree, vtx_key, entry, vtx_keycmp, static)
237
238
static enum vsl_status v_matchproto_(vslc_next_f)
239 908025
vslc_raw_next(const struct VSL_cursor *cursor)
240
{
241
        struct vslc_raw *c;
242
243 908025
        CAST_OBJ_NOTNULL(c, cursor->priv_data, VSLC_RAW_MAGIC);
244 908025
        assert(&c->cursor == cursor);
245
246 908025
        AN(c->ptr);
247 908025
        if (c->cursor.rec.ptr == NULL) {
248 456731
                c->cursor.rec.ptr = c->ptr;
249 456731
                return (vsl_more);
250
        } else {
251 451294
                c->cursor.rec.ptr = NULL;
252 451294
                return (vsl_end);
253
        }
254 908025
}
255
256
static enum vsl_status v_matchproto_(vslc_reset_f)
257 132096
vslc_raw_reset(const struct VSL_cursor *cursor)
258
{
259
        struct vslc_raw *c;
260
261 132096
        CAST_OBJ_NOTNULL(c, cursor->priv_data, VSLC_RAW_MAGIC);
262 132096
        assert(&c->cursor == cursor);
263
264 132096
        AN(c->ptr);
265 132096
        c->cursor.rec.ptr = NULL;
266
267 132096
        return (vsl_end);
268
}
269
270
static const struct vslc_tbl vslc_raw_tbl = {
271
        .magic  = VSLC_TBL_MAGIC,
272
        .delete = NULL,
273
        .next   = vslc_raw_next,
274
        .reset  = vslc_raw_reset,
275
        .check  = NULL,
276
};
277
278
static enum vsl_status v_matchproto_(vslc_next_f)
279 3445286
vslc_vtx_next(const struct VSL_cursor *cursor)
280
{
281
        struct vslc_vtx *c;
282
        const uint32_t *ptr;
283
        unsigned overrun;
284
285 3445286
        CAST_OBJ_NOTNULL(c, cursor->priv_data, VSLC_VTX_MAGIC);
286 3445286
        assert(&c->cursor == cursor);
287 3445286
        CHECK_OBJ_NOTNULL(c->vtx, VTX_MAGIC);
288
289 3445286
        do {
290 3704584
                CHECK_OBJ_ORNULL(c->synth, SYNTH_MAGIC);
291 3704584
                if (c->synth != NULL && c->synth->offset == c->offset) {
292
                        /* We're at the offset of the next synth record,
293
                           point to it and advance the pointer */
294 11976
                        c->cursor.rec.ptr = c->synth->data;
295 11976
                        c->synth = VTAILQ_NEXT(c->synth, list);
296 11976
                } else {
297 3692608
                        overrun = c->offset > c->vtx->len;
298 3692608
                        AZ(overrun);
299 3692608
                        if (c->offset == c->vtx->len)
300 329117
                                return (vsl_end);
301
302
                        /* Advance chunk pointer */
303 3363491
                        if (c->chunk == NULL) {
304 99346
                                c->chunk = VTAILQ_FIRST(&c->vtx->chunks);
305 99346
                                c->chunkstart = 0;
306 99346
                        }
307 3363491
                        CHECK_OBJ_NOTNULL(c->chunk, CHUNK_MAGIC);
308 3452948
                        while (c->offset >= c->chunkstart + c->chunk->len) {
309 89457
                                c->chunkstart += c->chunk->len;
310 89457
                                c->chunk = VTAILQ_NEXT(c->chunk, list);
311 89457
                                CHECK_OBJ_NOTNULL(c->chunk, CHUNK_MAGIC);
312
                        }
313
314
                        /* Point to the next stored record */
315 3363491
                        if (c->chunk->type == chunk_t_shm)
316 2775282
                                ptr = c->chunk->shm.start.ptr;
317
                        else {
318 588209
                                assert(c->chunk->type == chunk_t_buf);
319 588209
                                ptr = c->chunk->buf.data;
320
                        }
321 3363491
                        c->cursor.rec.ptr = ptr + c->offset - c->chunkstart;
322 6726982
                        c->offset += VSL_NEXT(c->cursor.rec.ptr) -
323 3363491
                            c->cursor.rec.ptr;
324
                }
325 3375467
        } while (VSL_TAG(c->cursor.rec.ptr) == SLT__Batch);
326
327 3116169
        return (vsl_more);
328 3445286
}
329
330
static enum vsl_status v_matchproto_(vslc_reset_f)
331 139689
vslc_vtx_reset(const struct VSL_cursor *cursor)
332
{
333
        struct vslc_vtx *c;
334
335 139689
        CAST_OBJ_NOTNULL(c, cursor->priv_data, VSLC_VTX_MAGIC);
336 139689
        assert(&c->cursor == cursor);
337 139689
        CHECK_OBJ_NOTNULL(c->vtx, VTX_MAGIC);
338 139689
        c->synth = VTAILQ_FIRST(&c->vtx->synth);
339 139689
        c->chunk = NULL;
340 139689
        c->chunkstart = 0;
341 139689
        c->offset = 0;
342 139689
        c->cursor.rec.ptr = NULL;
343
344 139689
        return (vsl_end);
345
}
346
347
static const struct vslc_tbl vslc_vtx_tbl = {
348
        .magic  = VSLC_TBL_MAGIC,
349
        .delete = NULL,
350
        .next   = vslc_vtx_next,
351
        .reset  = vslc_vtx_reset,
352
        .check  = NULL,
353
};
354
355
/* Create a buf chunk */
356
static struct chunk *
357 17172
chunk_newbuf(struct vtx *vtx, const uint32_t *ptr, size_t len)
358
{
359
        struct chunk *chunk;
360
361 17172
        ALLOC_OBJ(chunk, CHUNK_MAGIC);
362 17170
        XXXAN(chunk);
363 17170
        chunk->type = chunk_t_buf;
364 17170
        chunk->vtx = vtx;
365 17170
        chunk->buf.space = VTX_BUFSIZE_MIN;
366 17170
        while (chunk->buf.space < len)
367 0
                chunk->buf.space *= 2;
368 17170
        chunk->buf.data = malloc(sizeof (uint32_t) * chunk->buf.space);
369 17170
        AN(chunk->buf.data);
370 17170
        memcpy(chunk->buf.data, ptr, sizeof (uint32_t) * len);
371 17170
        chunk->len = len;
372 17170
        return (chunk);
373
}
374
375
/* Free a buf chunk */
376
static void
377 17167
chunk_freebuf(struct chunk **pchunk)
378
{
379
        struct chunk *chunk;
380
381 17167
        TAKE_OBJ_NOTNULL(chunk, pchunk, CHUNK_MAGIC);
382 17167
        assert(chunk->type == chunk_t_buf);
383 17167
        free(chunk->buf.data);
384 17167
        FREE_OBJ(chunk);
385 17167
}
386
387
/* Append a set of records to a chunk */
388
static void
389 230141
chunk_appendbuf(struct chunk *chunk, const uint32_t *ptr, size_t len)
390
{
391
392 230141
        CHECK_OBJ_NOTNULL(chunk, CHUNK_MAGIC);
393 230141
        assert(chunk->type == chunk_t_buf);
394 230141
        if (chunk->buf.space < chunk->len + len) {
395 72604
                while (chunk->buf.space < chunk->len + len)
396 36302
                        chunk->buf.space *= 2;
397 72604
                chunk->buf.data = realloc(chunk->buf.data,
398 36302
                    sizeof (uint32_t) * chunk->buf.space);
399 36302
        }
400 230141
        memcpy(chunk->buf.data + chunk->len, ptr, sizeof (uint32_t) * len);
401 230141
        chunk->len += len;
402 230141
}
403
404
/* Transform a shm chunk to a buf chunk */
405
static void
406 0
chunk_shm_to_buf(struct VSLQ *vslq, struct chunk *chunk)
407
{
408
        struct vtx *vtx;
409
        struct chunk *buf;
410
411 0
        CHECK_OBJ_NOTNULL(chunk, CHUNK_MAGIC);
412 0
        assert(chunk->type == chunk_t_shm);
413 0
        vtx = chunk->vtx;
414 0
        CHECK_OBJ_NOTNULL(vtx, VTX_MAGIC);
415
416 0
        buf = VTAILQ_PREV(chunk, chunkhead, list);
417 0
        if (buf != NULL && buf->type == chunk_t_buf)
418
                /* Previous is a buf chunk, append to it */
419 0
                chunk_appendbuf(buf, chunk->shm.start.ptr, chunk->len);
420
        else {
421
                /* Create a new buf chunk and insert it before this */
422 0
                buf = chunk_newbuf(vtx, chunk->shm.start.ptr, chunk->len);
423 0
                AN(buf);
424 0
                VTAILQ_INSERT_BEFORE(chunk, buf, list);
425
        }
426
427
        /* Reset cursor chunk pointer, vslc_vtx_next will set it correctly */
428 0
        vtx->c.chunk = NULL;
429
430
        /* Remove from the shmref list and vtx, and put chunk back
431
           on the free list */
432 0
        VTAILQ_REMOVE(&vslq->shmrefs, chunk, shm.shmref);
433 0
        VTAILQ_REMOVE(&vtx->chunks, chunk, list);
434 0
        VTAILQ_INSERT_HEAD(&vtx->shmchunks_free, chunk, list);
435 0
}
436
437
/* Append a set of records to a vtx structure */
438
static enum vsl_status
439 334112
vtx_append(struct VSLQ *vslq, struct vtx *vtx, const struct VSLC_ptr *start,
440
    size_t len)
441
{
442
        struct chunk *chunk;
443
        enum vsl_check i;
444
445 334112
        AN(vtx);
446 334112
        AN(len);
447 334112
        AN(start);
448
449 334112
        i = VSL_Check(vslq->c, start);
450 334112
        if (i == vsl_check_e_inval)
451 0
                return (vsl_e_overrun);
452
453 334112
        if (i == vsl_check_valid && !VTAILQ_EMPTY(&vtx->shmchunks_free)) {
454
                /* Shmref it */
455 86796
                chunk = VTAILQ_FIRST(&vtx->shmchunks_free);
456 86796
                CHECK_OBJ_NOTNULL(chunk, CHUNK_MAGIC);
457 86796
                assert(chunk->type == chunk_t_shm);
458 86796
                assert(chunk->vtx == vtx);
459 86796
                VTAILQ_REMOVE(&vtx->shmchunks_free, chunk, list);
460 86796
                chunk->shm.start = *start;
461 86796
                chunk->len = len;
462 86796
                VTAILQ_INSERT_TAIL(&vtx->chunks, chunk, list);
463
464
                /* Append to shmref list */
465 86796
                VTAILQ_INSERT_TAIL(&vslq->shmrefs, chunk, shm.shmref);
466 86796
        } else {
467
                /* Buffer it */
468 247316
                chunk = VTAILQ_LAST(&vtx->chunks, chunkhead);
469 247316
                CHECK_OBJ_ORNULL(chunk, CHUNK_MAGIC);
470 247300
                if (chunk != NULL && chunk->type == chunk_t_buf) {
471
                        /* Tail is a buf chunk, append to that */
472 230133
                        chunk_appendbuf(chunk, start->ptr, len);
473 230133
                } else {
474
                        /* Append new buf chunk */
475 17167
                        chunk = chunk_newbuf(vtx, start->ptr, len);
476 17167
                        AN(chunk);
477 17167
                        VTAILQ_INSERT_TAIL(&vtx->chunks, chunk, list);
478
                }
479
        }
480 334096
        vtx->len += len;
481 334096
        return (vsl_more);
482 334096
}
483
484
/* Allocate a new vtx structure */
485
static struct vtx *
486 50722
vtx_new(struct VSLQ *vslq)
487
{
488
        struct vtx *vtx;
489
        int i;
490
491 50722
        AN(vslq);
492 50722
        if (vslq->n_cache) {
493 27457
                AZ(VTAILQ_EMPTY(&vslq->cache));
494 27457
                vtx = VTAILQ_FIRST(&vslq->cache);
495 27457
                VTAILQ_REMOVE(&vslq->cache, vtx, list_child);
496 27457
                vslq->n_cache--;
497 27457
        } else {
498 23265
                ALLOC_OBJ(vtx, VTX_MAGIC);
499 23257
                AN(vtx);
500
501 23257
                VTAILQ_INIT(&vtx->child);
502 23257
                VTAILQ_INIT(&vtx->shmchunks_free);
503 93016
                for (i = 0; i < VTX_SHMCHUNKS; i++) {
504 69759
                        vtx->shmchunks[i].magic = CHUNK_MAGIC;
505 69759
                        vtx->shmchunks[i].type = chunk_t_shm;
506 69759
                        vtx->shmchunks[i].vtx = vtx;
507 69759
                        VTAILQ_INSERT_TAIL(&vtx->shmchunks_free,
508
                            &vtx->shmchunks[i], list);
509 69759
                }
510 23257
                VTAILQ_INIT(&vtx->chunks);
511 23257
                VTAILQ_INIT(&vtx->synth);
512 23257
                vtx->c.magic = VSLC_VTX_MAGIC;
513 23257
                vtx->c.vtx = vtx;
514 23257
                vtx->c.cursor.priv_tbl = &vslc_vtx_tbl;
515 23257
                vtx->c.cursor.priv_data = &vtx->c;
516
        }
517
518 50714
        CHECK_OBJ_NOTNULL(vtx, VTX_MAGIC);
519 50714
        vtx->key.vxid = 0;
520 50714
        vtx->t_start = VTIM_mono();
521 50714
        vtx->flags = 0;
522 50714
        vtx->type = VSL_t_unknown;
523 50714
        vtx->reason = VSL_r_unknown;
524 50714
        vtx->parent = NULL;
525 50714
        vtx->n_child = 0;
526 50714
        vtx->n_childready = 0;
527 50714
        vtx->n_descend = 0;
528 50714
        vtx->len = 0;
529 50714
        AN(vslc_vtx_reset(&vtx->c.cursor) == vsl_end);
530
531 50714
        return (vtx);
532
}
533
534
/* Disuse a vtx and all it's children, freeing any resources held. Free or
535
   cache the vtx for later use */
536
static void
537 50709
vtx_retire(struct VSLQ *vslq, struct vtx **pvtx)
538
{
539
        struct vtx *vtx;
540
        struct vtx *child;
541
        struct synth *synth;
542
        struct chunk *chunk;
543
544 50709
        AN(vslq);
545 50709
        TAKE_OBJ_NOTNULL(vtx, pvtx, VTX_MAGIC);
546
547 50709
        AN(vtx->flags & VTX_F_COMPLETE);
548 50709
        AN(vtx->flags & VTX_F_READY);
549 50709
        AZ(vtx->parent);
550
551 56118
        while (!VTAILQ_EMPTY(&vtx->child)) {
552 5409
                child = VTAILQ_FIRST(&vtx->child);
553 5409
                assert(child->parent == vtx);
554 5409
                AN(vtx->n_child);
555 5409
                assert(vtx->n_descend >= child->n_descend + 1);
556 5409
                VTAILQ_REMOVE(&vtx->child, child, list_child);
557 5409
                child->parent = NULL;
558 5409
                vtx->n_child--;
559 5409
                vtx->n_descend -= child->n_descend + 1;
560 5409
                vtx_retire(vslq, &child);
561 5409
                AZ(child);
562
        }
563 50709
        AZ(vtx->n_child);
564 50709
        AZ(vtx->n_descend);
565 50709
        vtx->n_childready = 0;
566
        // remove rval is no way to check if element was present
567 50709
        (void)VRBT_REMOVE(vtx_tree, &vslq->tree, &vtx->key);
568 50709
        vtx->key.vxid = 0;
569 50709
        vtx->flags = 0;
570
571 62525
        while (!VTAILQ_EMPTY(&vtx->synth)) {
572 11816
                synth = VTAILQ_FIRST(&vtx->synth);
573 11816
                CHECK_OBJ_NOTNULL(synth, SYNTH_MAGIC);
574 11816
                VTAILQ_REMOVE(&vtx->synth, synth, list);
575 11816
                FREE_OBJ(synth);
576
        }
577
578 154670
        while (!VTAILQ_EMPTY(&vtx->chunks)) {
579 103961
                chunk = VTAILQ_FIRST(&vtx->chunks);
580 103961
                CHECK_OBJ_NOTNULL(chunk, CHUNK_MAGIC);
581 103961
                VTAILQ_REMOVE(&vtx->chunks, chunk, list);
582 103961
                if (chunk->type == chunk_t_shm) {
583 86795
                        VTAILQ_REMOVE(&vslq->shmrefs, chunk, shm.shmref);
584 86795
                        VTAILQ_INSERT_HEAD(&vtx->shmchunks_free, chunk, list);
585 86795
                } else {
586 17166
                        assert(chunk->type == chunk_t_buf);
587 17166
                        chunk_freebuf(&chunk);
588 17166
                        AZ(chunk);
589
                }
590
        }
591 50709
        vtx->len = 0;
592 50709
        AN(vslq->n_outstanding);
593 50709
        vslq->n_outstanding--;
594
595 50709
        if (vslq->n_cache < VTX_CACHE) {
596 49874
                VTAILQ_INSERT_HEAD(&vslq->cache, vtx, list_child);
597 49874
                vslq->n_cache++;
598 49874
        } else
599 835
                FREE_OBJ(vtx);
600
601 50709
}
602
603
/* Lookup a vtx by vxid from the managed list */
604
static struct vtx *
605 367463
vtx_lookup(const struct VSLQ *vslq, uint64_t vxid)
606
{
607
        struct vtx_key lkey, *key;
608
        struct vtx *vtx;
609
610 367463
        AN(vslq);
611 367463
        lkey.vxid = vxid;
612 367463
        key = VRBT_FIND(vtx_tree, &vslq->tree, &lkey);
613 367463
        if (key == NULL)
614 75547
                return (NULL);
615 291916
        CAST_OBJ_NOTNULL(vtx, (void *)key, VTX_MAGIC);
616 291916
        return (vtx);
617 367463
}
618
619
/* Insert a new vtx into the managed list */
620
static struct vtx *
621 50706
vtx_add(struct VSLQ *vslq, uint64_t vxid)
622
{
623
        struct vtx *vtx;
624
625 50706
        AN(vslq);
626 50706
        vtx = vtx_new(vslq);
627 50706
        AN(vtx);
628 50706
        vtx->key.vxid = vxid;
629 50706
        AZ(VRBT_INSERT(vtx_tree, &vslq->tree, &vtx->key));
630 50706
        VTAILQ_INSERT_TAIL(&vslq->incomplete, vtx, list_vtx);
631 50706
        vslq->n_outstanding++;
632 50706
        return (vtx);
633
}
634
635
/* Mark a vtx complete, update child counters and if possible push it or
636
   it's top parent to the ready state */
637
static void
638 50712
vtx_mark_complete(struct VSLQ *vslq, struct vtx *vtx)
639
{
640
641 50712
        AN(vslq);
642 50712
        AN(vtx->flags & VTX_F_END);
643 50712
        AZ(vtx->flags & VTX_F_COMPLETE);
644
645 50712
        if (vtx->type == VSL_t_unknown)
646 0
                vtx_diag(vtx, "vtx of unknown type marked complete");
647
648 50712
        vtx->flags |= VTX_F_COMPLETE;
649 50712
        VTAILQ_REMOVE(&vslq->incomplete, vtx, list_vtx);
650
651 56119
        while (1) {
652 56119
                AZ(vtx->flags & VTX_F_READY);
653 56119
                if (vtx->flags & VTX_F_COMPLETE &&
654 50943
                    vtx->n_child == vtx->n_childready)
655 50704
                        vtx->flags |= VTX_F_READY;
656
                else
657 5415
                        return;
658 50704
                if (vtx->parent == NULL) {
659
                        /* Top level vtx ready */
660 45297
                        VTAILQ_INSERT_TAIL(&vslq->ready, vtx, list_vtx);
661 45297
                        return;
662
                }
663 5407
                vtx = vtx->parent;
664 5407
                vtx->n_childready++;
665 5407
                assert(vtx->n_child >= vtx->n_childready);
666
        }
667 50712
}
668
669
/* Add a child to a parent, and update child counters */
670
static void
671 5402
vtx_set_parent(struct vtx *parent, struct vtx *child)
672
{
673
674 5402
        CHECK_OBJ_NOTNULL(parent, VTX_MAGIC);
675 5402
        CHECK_OBJ_NOTNULL(child, VTX_MAGIC);
676 5402
        assert(parent != child);
677 5402
        AZ(parent->flags & VTX_F_COMPLETE);
678 5402
        AZ(child->flags & VTX_F_COMPLETE);
679 5402
        AZ(child->parent);
680 5402
        child->parent = parent;
681 5402
        VTAILQ_INSERT_TAIL(&parent->child, child, list_child);
682 5402
        parent->n_child++;
683 5402
        do
684 6441
                parent->n_descend += 1 + child->n_descend;
685 6441
        while ((parent = parent->parent) != NULL);
686 5402
}
687
688
/* Parse a begin or link record. Returns the number of elements that was
689
   successfully parsed. */
690
static int
691 135935
vtx_parse_link(const char *str, enum VSL_transaction_e *ptype,
692
    uint64_t *pvxid, enum VSL_reason_e *preason, uint64_t *psub)
693
{
694
        char type[16], reason[16];
695
        uintmax_t vxid, sub;
696
        int i;
697
        enum VSL_transaction_e et;
698
        enum VSL_reason_e er;
699
700 135935
        AN(str);
701 135935
        AN(ptype);
702 135935
        AN(pvxid);
703 135935
        AN(preason);
704
705 135935
        i = sscanf(str, "%15s %ju %15s %ju", type, &vxid, reason, &sub);
706 135935
        if (i < 1)
707 0
                return (0);
708
709
        /* transaction type */
710 418778
        for (et = VSL_t_unknown; et < VSL_t__MAX; et++)
711 418755
                if (!strcmp(type, vsl_t_names[et]))
712 135912
                        break;
713 135935
        if (et >= VSL_t__MAX)
714 0
                et = VSL_t_unknown;
715 135901
        *ptype = et;
716 135901
        if (i == 1)
717 0
                return (1);
718
719
        /* vxid */
720 135901
        assert((vxid & ~VSL_IDENTMASK) == 0);
721 135901
        *pvxid = vxid;
722 135901
        if (i == 2)
723 0
                return (2);
724
725
        /* transaction reason */
726 564835
        for (er = VSL_r_unknown; er < VSL_r__MAX; er++)
727 561957
                if (!strcmp(reason, vsl_r_names[er]))
728 133023
                        break;
729 135901
        if (er >= VSL_r__MAX)
730 2882
                er = VSL_r_unknown;
731 135901
        *preason = er;
732 135901
        if (i == 3)
733 129821
                return (3);
734
735
        /* request sub-level */
736 6080
        if (psub != NULL)
737 2200
                *psub = sub;
738 6080
        return (4);
739 135901
}
740
741
/* Parse and process a begin record */
742
static int
743 50709
vtx_scan_begin(struct VSLQ *vslq, struct vtx *vtx, const uint32_t *ptr)
744
{
745
        int i;
746
        enum VSL_transaction_e type;
747
        enum VSL_reason_e reason;
748
        uint64_t p_vxid;
749
        struct vtx *p_vtx;
750
751 50709
        assert(VSL_TAG(ptr) == SLT_Begin);
752
753 50709
        AZ(vtx->flags & VTX_F_READY);
754
755 50709
        i = vtx_parse_link(VSL_CDATA(ptr), &type, &p_vxid, &reason, NULL);
756 50709
        if (i < 3)
757 0
                return (vtx_diag_tag(vtx, ptr, "parse error"));
758 50709
        if (type == VSL_t_unknown)
759 0
                (void)vtx_diag_tag(vtx, ptr, "unknown vxid type");
760
761
        /* Check/set vtx type */
762 50709
        if (vtx->type != VSL_t_unknown && vtx->type != type)
763
                /* Type not matching the one previously set by a link
764
                   record */
765 0
                (void)vtx_diag_tag(vtx, ptr, "type mismatch");
766 50709
        vtx->type = type;
767 50709
        vtx->reason = reason;
768
769 50709
        if (p_vxid == 0)
770
                /* Zero means no parent */
771 14657
                return (0);
772 36052
        if (p_vxid == vtx->key.vxid)
773 0
                return (vtx_diag_tag(vtx, ptr, "link to self"));
774
775 36052
        if (vslq->grouping == VSL_g_vxid)
776 29531
                return (0);     /* No links */
777 6521
        if (vslq->grouping == VSL_g_request && vtx->type == VSL_t_req &&
778 1960
            vtx->reason == VSL_r_rxreq)
779 1120
                return (0);     /* No links */
780
781 5401
        if (vtx->parent != NULL) {
782 2481
                if (vtx->parent->key.vxid != p_vxid) {
783
                        /* This vtx already belongs to a different
784
                           parent */
785 0
                        return (vtx_diag_tag(vtx, ptr, "link mismatch"));
786
                } else
787
                        /* Link already exists */
788 2481
                        return (0);
789
        }
790
791 2920
        p_vtx = vtx_lookup(vslq, p_vxid);
792 2920
        if (p_vtx == NULL) {
793
                /* Not seen parent yet. Create it. */
794 1240
                p_vtx = vtx_add(vslq, p_vxid);
795 1240
                AN(p_vtx);
796 1240
        } else {
797 1680
                CHECK_OBJ_NOTNULL(p_vtx, VTX_MAGIC);
798 1680
                if (p_vtx->flags & VTX_F_COMPLETE)
799 0
                        return (vtx_diag_tag(vtx, ptr, "link too late"));
800
        }
801
802
        /* Create link */
803 2920
        vtx_set_parent(p_vtx, vtx);
804
805 2920
        return (0);
806 50709
}
807
808
/* Parse and process a link record */
809
static int
810 37384
vtx_scan_link(struct VSLQ *vslq, struct vtx *vtx, const uint32_t *ptr)
811
{
812
        int i;
813
        enum VSL_transaction_e c_type;
814
        enum VSL_reason_e c_reason;
815
        uint64_t c_vxid;
816
        struct vtx *c_vtx;
817
818 37384
        assert(VSL_TAG(ptr) == SLT_Link);
819
820 37384
        AZ(vtx->flags & VTX_F_READY);
821
822 37384
        i = vtx_parse_link(VSL_CDATA(ptr), &c_type, &c_vxid, &c_reason, NULL);
823 37384
        if (i < 3)
824 0
                return (vtx_diag_tag(vtx, ptr, "parse error"));
825 37384
        if (c_type == VSL_t_unknown)
826 0
                (void)vtx_diag_tag(vtx, ptr, "unknown vxid type");
827
828 37384
        if (vslq->grouping == VSL_g_vxid)
829 31979
                return (0);     /* No links */
830 5405
        if (vslq->grouping == VSL_g_request && vtx->type == VSL_t_sess)
831 0
                return (0);     /* No links */
832
833 5405
        if (c_vxid == 0)
834 0
                return (vtx_diag_tag(vtx, ptr, "illegal link vxid"));
835 5405
        if (c_vxid == vtx->key.vxid)
836 0
                return (vtx_diag_tag(vtx, ptr, "link to self"));
837
838
        /* Lookup and check child vtx */
839 5405
        c_vtx = vtx_lookup(vslq, c_vxid);
840 5405
        if (c_vtx == NULL) {
841
                /* Child not seen before. Insert it and create link */
842 2485
                c_vtx = vtx_add(vslq, c_vxid);
843 2485
                AN(c_vtx);
844 2485
                AZ(c_vtx->parent);
845 2485
                c_vtx->type = c_type;
846 2485
                c_vtx->reason = c_reason;
847 2485
                vtx_set_parent(vtx, c_vtx);
848 2485
                return (0);
849
        }
850
851 2920
        CHECK_OBJ_NOTNULL(c_vtx, VTX_MAGIC);
852 2920
        if (c_vtx->parent == vtx)
853
                /* Link already exists */
854 2920
                return (0);
855 0
        if (c_vtx->parent != NULL && c_vtx->parent != vtx)
856 0
                return (vtx_diag_tag(vtx, ptr, "duplicate link"));
857 0
        if (c_vtx->flags & VTX_F_COMPLETE)
858 0
                return (vtx_diag_tag(vtx, ptr, "link too late"));
859 0
        if (c_vtx->type != VSL_t_unknown && c_vtx->type != c_type)
860 0
                (void)vtx_diag_tag(vtx, ptr, "type mismatch");
861
862 0
        c_vtx->type = c_type;
863 0
        c_vtx->reason = c_reason;
864 0
        vtx_set_parent(vtx, c_vtx);
865 0
        return (0);
866 37384
}
867
868
/* Scan the records of a vtx, performing processing actions on specific
869
   records */
870
static void
871 345463
vtx_scan(struct VSLQ *vslq, struct vtx *vtx)
872
{
873
        const uint32_t *ptr;
874
        enum VSL_tag_e tag;
875
876 3878261
        while (!(vtx->flags & VTX_F_COMPLETE) &&
877 1912478
            vslc_vtx_next(&vtx->c.cursor) == 1) {
878 1620320
                ptr = vtx->c.cursor.rec.ptr;
879 1620320
                if (VSL_ID(ptr) != vtx->key.vxid) {
880 0
                        (void)vtx_diag_tag(vtx, ptr, "vxid mismatch");
881 0
                        continue;
882
                }
883
884 1620320
                tag = VSL_TAG(ptr);
885 1620320
                assert(tag != SLT__Batch);
886
887 1620320
                switch (tag) {
888
                case SLT_Begin:
889 50709
                        if (vtx->flags & VTX_F_BEGIN)
890 0
                                (void)vtx_diag_tag(vtx, ptr, "duplicate begin");
891
                        else {
892 50709
                                (void)vtx_scan_begin(vslq, vtx, ptr);
893 50709
                                vtx->flags |= VTX_F_BEGIN;
894
                        }
895 50709
                        break;
896
897
                case SLT_Link:
898 37367
                        (void)vtx_scan_link(vslq, vtx, ptr);
899 37367
                        break;
900
901
                case SLT_End:
902 50711
                        AZ(vtx->flags & VTX_F_END);
903 50711
                        vtx->flags |= VTX_F_END;
904 50711
                        vtx_mark_complete(vslq, vtx);
905 50711
                        break;
906
907
                default:
908 1481533
                        break;
909
                }
910
        }
911 345463
}
912
913
/* Force a vtx into complete status by synthing the necessary outstanding
914
   records */
915
static void
916 5907
vtx_force(struct VSLQ *vslq, struct vtx *vtx, const char *reason)
917
{
918
919 5907
        AZ(vtx->flags & VTX_F_COMPLETE);
920 5907
        AZ(vtx->flags & VTX_F_READY);
921 5907
        vtx_scan(vslq, vtx);
922 5907
        if (!(vtx->flags & VTX_F_BEGIN))
923 4
                vtx_synth_rec(vtx, SLT_Begin, "%s %u synth",
924 2
                    vsl_t_names[vtx->type], 0);
925 5907
        vtx_diag(vtx, reason);
926 5907
        if (!(vtx->flags & VTX_F_END))
927 5907
                vtx_synth_rec(vtx, SLT_End, "synth");
928 5907
        vtx_scan(vslq, vtx);
929 5907
        AN(vtx->flags & VTX_F_COMPLETE);
930 5907
}
931
932
static int
933 440
vslq_ratelimit(struct VSLQ *vslq)
934
{
935
        vtim_mono now;
936
        vtim_dur delta;
937
938 440
        CHECK_OBJ_NOTNULL(vslq, VSLQ_MAGIC);
939 440
        CHECK_OBJ_NOTNULL(vslq->vsl, VSL_MAGIC);
940
941 440
        now = VTIM_mono();
942 440
        delta = now - vslq->last_use;
943 440
        vslq->credits += (delta / vslq->vsl->R_opt_p) * vslq->vsl->R_opt_l;
944 440
        vslq->credits = vmin_t(double, vslq->credits, vslq->vsl->R_opt_l);
945 440
        vslq->last_use = now;
946
947 440
        if (vslq->credits < 1.0)
948 0
                return (0);
949
950 440
        vslq->credits -= 1.0;
951 440
        return (1);
952 440
}
953
954
/* Build transaction array, do the query and callback. Returns 0 or the
955
   return value from func */
956
static int
957 39480
vslq_callback(struct VSLQ *vslq, struct vtx *vtx, VSLQ_dispatch_f *func,
958
    void *priv)
959
{
960 39480
        unsigned n = vtx->n_descend + 1;
961 39480
        struct vtx *vtxs[n];
962 39480
        struct VSL_transaction trans[n];
963 39480
        struct VSL_transaction *ptrans[n + 1];
964
        unsigned i, j;
965
966 39480
        AN(vslq);
967 39480
        CHECK_OBJ_NOTNULL(vtx, VTX_MAGIC);
968 39480
        AN(vtx->flags & VTX_F_READY);
969 39480
        AN(func);
970
971 39480
        if (vslq->grouping == VSL_g_session &&
972 870
            vtx->type != VSL_t_sess)
973 0
                return (0);
974 39480
        if (vslq->grouping == VSL_g_request &&
975 1120
            vtx->type != VSL_t_req)
976 0
                return (0);
977
978
        /* Build transaction array */
979 39480
        AN(vslc_vtx_reset(&vtx->c.cursor) == vsl_end);
980 39480
        vtxs[0] = vtx;
981 39480
        trans[0].level = 1;
982 39480
        trans[0].vxid = vtx->key.vxid;
983 39480
        trans[0].vxid_parent = 0;
984 39480
        trans[0].type = vtx->type;
985 39480
        trans[0].reason = vtx->reason;
986 39480
        trans[0].c = &vtx->c.cursor;
987 39480
        i = 1;
988 39480
        j = 0;
989 83740
        while (j < i) {
990 49031
                VTAILQ_FOREACH(vtx, &vtxs[j]->child, list_child) {
991 4771
                        assert(i < n);
992 4771
                        AN(vslc_vtx_reset(&vtx->c.cursor) == vsl_end);
993 4771
                        vtxs[i] = vtx;
994 4771
                        if (vtx->reason == VSL_r_restart)
995
                                /* Restarts stay at the same level as parent */
996 80
                                trans[i].level = trans[j].level;
997
                        else
998 4691
                                trans[i].level = trans[j].level + 1;
999 4771
                        trans[i].vxid = vtx->key.vxid;
1000 4771
                        trans[i].vxid_parent = trans[j].vxid;
1001 4771
                        trans[i].type = vtx->type;
1002 4771
                        trans[i].reason = vtx->reason;
1003 4771
                        trans[i].c = &vtx->c.cursor;
1004 4771
                        i++;
1005 4771
                }
1006 44260
                j++;
1007
        }
1008 39480
        assert(i == n);
1009
1010
        /* Build pointer array */
1011 83739
        for (i = 0; i < n; i++)
1012 44259
                ptrans[i] = &trans[i];
1013 39480
        ptrans[i] = NULL;
1014
1015
        /* Query test goes here */
1016 39480
        if (vslq->query != NULL && !vslq_runquery(vslq->query, ptrans))
1017 14080
                return (0);
1018
1019 25400
        if (vslq->vsl->R_opt_l != 0 && !vslq_ratelimit(vslq))
1020 0
                return (0);
1021
1022
        /* Callback */
1023 25400
        return ((func)(vslq->vsl, ptrans, priv));
1024 39480
}
1025
1026
/* Create a synthetic log record. The record will be inserted at the
1027
   current cursor offset */
1028
static void
1029 11816
vtx_synth_rec(struct vtx *vtx, unsigned tag, const char *fmt, ...)
1030
{
1031
        struct synth *synth, *it;
1032
        va_list ap;
1033
        char *buf;
1034
        int l, buflen;
1035
        uint64_t vxid;
1036
1037 11816
        ALLOC_OBJ(synth, SYNTH_MAGIC);
1038 11816
        AN(synth);
1039
1040 11816
        buf = VSL_DATA(synth->data);
1041 11816
        buflen = sizeof(synth->data) - VSL_BYTES(VSL_OVERHEAD);
1042 11816
        va_start(ap, fmt);
1043 11816
        l = vsnprintf(buf, buflen, fmt, ap);
1044 11816
        assert(l >= 0);
1045 11816
        va_end(ap);
1046 11816
        if (l > buflen - 1)
1047 0
                l = buflen - 1;
1048 11816
        buf[l++] = '\0';        /* NUL-terminated */
1049 11816
        vxid = vtx->key.vxid;
1050 11816
        switch (vtx->type) {
1051
        case VSL_t_req:
1052 646
                vxid |= VSL_CLIENTMARKER;
1053 646
                break;
1054
        case VSL_t_bereq:
1055 80
                vxid |= VSL_BACKENDMARKER;
1056 80
                break;
1057
        default:
1058 11090
                break;
1059
        }
1060 11816
        synth->data[2] = vxid >> 32;
1061 11816
        synth->data[1] = vxid;
1062 23632
        synth->data[0] = (((tag & VSL_IDMASK) << VSL_IDSHIFT) |
1063 11816
            (VSL_VERSION_3 << VSL_VERSHIFT) | l);
1064 11816
        synth->offset = vtx->c.offset;
1065
1066 11816
        VTAILQ_FOREACH_REVERSE(it, &vtx->synth, synthhead, list) {
1067
                /* Make sure the synth list is sorted on offset */
1068 5909
                CHECK_OBJ_NOTNULL(it, SYNTH_MAGIC);
1069 5909
                if (synth->offset >= it->offset)
1070 5909
                        break;
1071 0
        }
1072 11816
        if (it != NULL)
1073 5909
                VTAILQ_INSERT_AFTER(&vtx->synth, it, synth, list);
1074
        else
1075 5907
                VTAILQ_INSERT_HEAD(&vtx->synth, synth, list);
1076
1077
        /* Update cursor */
1078 11816
        CHECK_OBJ_ORNULL(vtx->c.synth, SYNTH_MAGIC);
1079 11816
        if (vtx->c.synth == NULL || vtx->c.synth->offset > synth->offset)
1080 5907
                vtx->c.synth = synth;
1081 11816
}
1082
1083
/* Add a diagnostic SLT_VSL synth record to the vtx. */
1084
static int
1085 5907
vtx_diag(struct vtx *vtx, const char *msg)
1086
{
1087
1088 5907
        vtx_synth_rec(vtx, SLT_VSL, msg);
1089 5907
        return (-1);
1090
}
1091
1092
/* Add a SLT_VSL diag synth record to the vtx. Takes an offending record
1093
   that will be included in the log record */
1094
static int
1095 0
vtx_diag_tag(struct vtx *vtx, const uint32_t *ptr, const char *reason)
1096
{
1097
1098 0
        vtx_synth_rec(vtx, SLT_VSL, "%s (%ju:%s \"%.*s\")", reason, VSL_ID(ptr),
1099 0
            VSL_tags[VSL_TAG(ptr)], (int)VSL_LEN(ptr), VSL_CDATA(ptr));
1100 0
        return (-1);
1101
}
1102
1103
struct VSLQ *
1104 15360
VSLQ_New(struct VSL_data *vsl, struct VSL_cursor **cp,
1105
    enum VSL_grouping_e grouping, const char *querystring)
1106
{
1107
        struct vslq_query *query;
1108
        struct VSLQ *vslq;
1109
1110 15360
        CHECK_OBJ_NOTNULL(vsl, VSL_MAGIC);
1111 15360
        if (grouping >= VSL_g__MAX) {
1112 0
                (void)vsl_diag(vsl, "Illegal query grouping");
1113 0
                return (NULL);
1114
        }
1115 15360
        if (querystring != NULL) {
1116 7000
                query = vslq_newquery(vsl, grouping, querystring);
1117 7000
                if (query == NULL)
1118 1280
                        return (NULL);
1119 5720
        } else
1120 8360
                query = NULL;
1121
1122 14080
        ALLOC_OBJ(vslq, VSLQ_MAGIC);
1123 14080
        AN(vslq);
1124 14080
        vslq->vsl = vsl;
1125 14080
        if (cp != NULL) {
1126 10680
                vslq->c = *cp;
1127 10680
                *cp = NULL;
1128 10680
        }
1129 14080
        vslq->grouping = grouping;
1130 14080
        vslq->query = query;
1131 14080
        if (vslq->vsl->R_opt_l != 0) {
1132 80
                vslq->last_use = VTIM_mono();
1133 80
                vslq->credits = 1;
1134 80
        }
1135
1136
        /* Setup normal mode */
1137 14080
        VRBT_INIT(&vslq->tree);
1138 14080
        VTAILQ_INIT(&vslq->ready);
1139 14080
        VTAILQ_INIT(&vslq->incomplete);
1140 14080
        VTAILQ_INIT(&vslq->shmrefs);
1141 14080
        VTAILQ_INIT(&vslq->cache);
1142
1143
        /* Setup raw mode */
1144 14080
        vslq->raw.c.magic = VSLC_RAW_MAGIC;
1145 14080
        vslq->raw.c.cursor.priv_tbl = &vslc_raw_tbl;
1146 14080
        vslq->raw.c.cursor.priv_data = &vslq->raw.c;
1147 14080
        vslq->raw.trans.level = 0;
1148 14080
        vslq->raw.trans.type = VSL_t_raw;
1149 14080
        vslq->raw.trans.reason = VSL_r_unknown;
1150 14080
        vslq->raw.trans.c = &vslq->raw.c.cursor;
1151 14080
        vslq->raw.ptrans[0] = &vslq->raw.trans;
1152 14080
        vslq->raw.ptrans[1] = NULL;
1153
1154 14080
        return (vslq);
1155 15360
}
1156
1157
void
1158 13840
VSLQ_Delete(struct VSLQ **pvslq)
1159
{
1160
        struct VSLQ *vslq;
1161
        struct vtx *vtx;
1162
1163 13840
        TAKE_OBJ_NOTNULL(vslq, pvslq, VSLQ_MAGIC);
1164
1165 13840
        (void)VSLQ_Flush(vslq, NULL, NULL);
1166 13840
        AZ(vslq->n_outstanding);
1167
1168 13840
        if (vslq->c != NULL) {
1169 13840
                VSL_DeleteCursor(vslq->c);
1170 13840
                vslq->c = NULL;
1171 13840
        }
1172
1173 13840
        if (vslq->query != NULL)
1174 5720
                vslq_deletequery(&vslq->query);
1175 13840
        AZ(vslq->query);
1176
1177 36268
        while (!VTAILQ_EMPTY(&vslq->cache)) {
1178 22428
                AN(vslq->n_cache);
1179 22428
                vtx = VTAILQ_FIRST(&vslq->cache);
1180 22428
                CHECK_OBJ_NOTNULL(vtx, VTX_MAGIC);
1181 22428
                VTAILQ_REMOVE(&vslq->cache, vtx, list_child);
1182 22428
                vslq->n_cache--;
1183 22428
                FREE_OBJ(vtx);
1184
        }
1185
1186 13840
        FREE_OBJ(vslq);
1187 13840
}
1188
1189
void
1190 3160
VSLQ_SetCursor(struct VSLQ *vslq, struct VSL_cursor **cp)
1191
{
1192
1193 3160
        CHECK_OBJ_NOTNULL(vslq, VSLQ_MAGIC);
1194
1195 3160
        if (vslq->c != NULL) {
1196 0
                (void)VSLQ_Flush(vslq, NULL, NULL);
1197 0
                AZ(vslq->n_outstanding);
1198 0
                VSL_DeleteCursor(vslq->c);
1199 0
                vslq->c = NULL;
1200 0
        }
1201
1202 3160
        if (cp != NULL) {
1203 3160
                AN(*cp);
1204 3160
                vslq->c = *cp;
1205 3160
                *cp = NULL;
1206 3160
        }
1207 3160
}
1208
1209
/* Regard each log line as a single transaction, feed it through the query
1210
   and do the callback */
1211
static int
1212 709059
vslq_raw(struct VSLQ *vslq, VSLQ_dispatch_f *func, void *priv)
1213
{
1214 709059
        enum vsl_status r = vsl_more;
1215
        int i;
1216
1217 709059
        assert(vslq->grouping == VSL_g_raw);
1218
1219 709059
        assert(vslq->raw.offset <= vslq->raw.len);
1220 709059
        do {
1221 777686
                if (vslq->raw.offset == vslq->raw.len) {
1222 417505
                        r = VSL_Next(vslq->c);
1223 417505
                        if (r != vsl_more)
1224 226820
                                return (r);
1225 190685
                        AN(vslq->c->rec.ptr);
1226 190685
                        vslq->raw.start = vslq->c->rec;
1227 190685
                        if (VSL_TAG(vslq->c->rec.ptr) == SLT__Batch)
1228 137272
                                vslq->raw.len = VSL_END(vslq->c->rec.ptr,
1229 68636
                                    VSL_BATCHLEN(vslq->c->rec.ptr)) -
1230 68636
                                    vslq->c->rec.ptr;
1231
                        else
1232 244098
                                vslq->raw.len = VSL_NEXT(vslq->raw.start.ptr) -
1233 122049
                                    vslq->raw.start.ptr;
1234 190685
                        assert(vslq->raw.len > 0);
1235 190685
                        vslq->raw.offset = 0;
1236 190685
                }
1237
1238 550866
                vslq->raw.c.ptr = vslq->raw.start.ptr + vslq->raw.offset;
1239 550866
                vslq->raw.c.cursor.rec.ptr = NULL;
1240 550866
                vslq->raw.trans.vxid = VSL_ID(vslq->raw.c.ptr);
1241 550866
                vslq->raw.offset += VSL_NEXT(vslq->raw.c.ptr) - vslq->raw.c.ptr;
1242 550866
        } while (VSL_TAG(vslq->raw.c.ptr) == SLT__Batch);
1243
1244 482239
        assert (r == vsl_more);
1245
1246 482239
        if (func == NULL)
1247 0
                return (r);
1248
1249 482239
        if (vslq->query != NULL &&
1250 81240
            !vslq_runquery(vslq->query, vslq->raw.ptrans))
1251 76360
                return (r);
1252
1253 405879
        if (vslq->vsl->R_opt_l != 0 && !vslq_ratelimit(vslq))
1254 0
                return (r);
1255
1256 405879
        i = (func)(vslq->vsl, vslq->raw.ptrans, priv);
1257 405879
        if (i)
1258 3720
                return (i);
1259
1260 402159
        return (r);
1261 709059
}
1262
1263
/* Check the beginning of the shmref list, and buffer refs that are at
1264
 * warning level.
1265
 */
1266
static enum vsl_status
1267 460388
vslq_shmref_check(struct VSLQ *vslq)
1268
{
1269
        struct chunk *chunk;
1270
        enum vsl_check i;
1271
1272 460388
        while ((chunk = VTAILQ_FIRST(&vslq->shmrefs)) != NULL) {
1273 339614
                CHECK_OBJ_NOTNULL(chunk, CHUNK_MAGIC);
1274 339614
                assert(chunk->type == chunk_t_shm);
1275 339614
                i = VSL_Check(vslq->c, &chunk->shm.start);
1276 339614
                switch (i) {
1277
                case vsl_check_valid:
1278
                        /* First on list is OK, refs behind it must also
1279
                           be OK */
1280 339614
                        return (vsl_more);
1281
                case vsl_check_warn:
1282
                        /* Buffer this chunk */
1283 0
                        chunk_shm_to_buf(vslq, chunk);
1284 0
                        break;
1285
                default:
1286
                        /* Too late to buffer */
1287 0
                        return (vsl_e_overrun);
1288
                }
1289
        }
1290
1291 120774
        return (vsl_more);
1292 460388
}
1293
1294
static unsigned
1295 56292
vslq_candidate(struct VSLQ *vslq, const uint32_t *ptr)
1296
{
1297
        enum VSL_transaction_e type;
1298
        enum VSL_reason_e reason;
1299
        struct VSL_data *vsl;
1300
        enum VSL_tag_e tag;
1301
        uint64_t p_vxid, sub;
1302
        int i;
1303
1304 56292
        CHECK_OBJ_NOTNULL(vslq, VSLQ_MAGIC);
1305 56292
        AN(ptr);
1306
1307 56292
        assert(vslq->grouping != VSL_g_raw);
1308 56292
        if (vslq->grouping == VSL_g_session)
1309 4276
                return (1); /* All are needed */
1310
1311 52016
        vsl = vslq->vsl;
1312 52016
        CHECK_OBJ_NOTNULL(vsl, VSL_MAGIC);
1313 52016
        if (vslq->grouping == VSL_g_vxid) {
1314 47862
                if (!vsl->c_opt && !vsl->b_opt)
1315 35222
                        AZ(vsl->E_opt);
1316 12640
                else if (!vsl->b_opt && !VSL_CLIENT(ptr))
1317 2840
                        return (0);
1318 9800
                else if (!vsl->c_opt && !VSL_BACKEND(ptr))
1319 1360
                        return (0);
1320
                /* Need to parse the Begin tag - fallthrough to below */
1321 43662
        }
1322
1323 47816
        tag = VSL_TAG(ptr);
1324 47816
        assert(tag == SLT_Begin);
1325 47816
        i = vtx_parse_link(VSL_CDATA(ptr), &type, &p_vxid, &reason, &sub);
1326 47816
        if (i < 3 || type == VSL_t_unknown)
1327 2
                return (0);
1328
1329 47816
        if (vslq->grouping == VSL_g_request && type == VSL_t_sess)
1330 798
                return (0);
1331
1332 47018
        if (vslq->grouping == VSL_g_vxid && i > 3 && sub > 0 && !vsl->E_opt)
1333 600
                return (0);
1334
1335 46418
        return (1);
1336 56292
}
1337
1338
/* Process next input record */
1339
static enum vsl_status
1340 859367
vslq_next(struct VSLQ *vslq)
1341
{
1342
        const uint32_t *ptr;
1343
        struct VSL_cursor *c;
1344
        enum vsl_status r;
1345
        enum VSL_tag_e tag;
1346
        ssize_t len;
1347
        uint64_t vxid;
1348
        unsigned keep;
1349
        struct vtx *vtx;
1350
1351 859367
        c = vslq->c;
1352 859367
        r = VSL_Next(c);
1353 859367
        if (r != vsl_more)
1354 397762
                return (r);
1355
1356 461605
        assert (r == vsl_more);
1357
1358 461605
        tag = (enum VSL_tag_e)VSL_TAG(c->rec.ptr);
1359 461605
        if (tag == SLT__Batch) {
1360 145330
                vxid = VSL_BATCHID(c->rec.ptr);
1361 290660
                len = VSL_END(c->rec.ptr, VSL_BATCHLEN(c->rec.ptr)) -
1362 145330
                    c->rec.ptr;
1363 145330
                if (len == 0)
1364 0
                        return (r);
1365 145330
                ptr = VSL_NEXT(c->rec.ptr);
1366 145330
                tag = (enum VSL_tag_e)VSL_TAG(ptr);
1367 145330
        } else {
1368 316275
                vxid = VSL_ID(c->rec.ptr);
1369 316275
                len = VSL_NEXT(c->rec.ptr) - c->rec.ptr;
1370 316275
                ptr = c->rec.ptr;
1371
        }
1372 461605
        assert(len > 0);
1373 461605
        if (vxid == 0)
1374
                /* Skip non-transactional records */
1375 102485
                return (r);
1376
1377 359120
        vtx = vtx_lookup(vslq, vxid);
1378 359120
        keep = tag != SLT_Begin || vslq_candidate(vslq, ptr);
1379 359120
        if (vtx == NULL && tag == SLT_Begin && keep) {
1380 46984
                vtx = vtx_add(vslq, vxid);
1381 46984
                AN(vtx);
1382 46984
        }
1383 359120
        if (vtx != NULL) {
1384 334246
                AN(keep);
1385 334246
                r = vtx_append(vslq, vtx, &c->rec, len);
1386 334246
                if (r == vsl_more)
1387 333736
                        vtx_scan(vslq, vtx);
1388 334256
        }
1389
1390 359130
        return (r);
1391 859377
}
1392
1393
/* Test query and report any ready transactions */
1394
static int
1395 53319
vslq_process_ready(struct VSLQ *vslq, VSLQ_dispatch_f *func, void *priv)
1396
{
1397
        struct vtx *vtx;
1398 53319
        int i = 0;
1399
1400 53319
        AN(vslq);
1401
1402 91619
        while (!VTAILQ_EMPTY(&vslq->ready)) {
1403 45300
                vtx = VTAILQ_FIRST(&vslq->ready);
1404 45300
                CHECK_OBJ_NOTNULL(vtx, VTX_MAGIC);
1405 45300
                VTAILQ_REMOVE(&vslq->ready, vtx, list_vtx);
1406 45300
                AN(vtx->flags & VTX_F_READY);
1407 45300
                if (func != NULL)
1408 39477
                        i = vslq_callback(vslq, vtx, func, priv);
1409 45300
                vtx_retire(vslq, &vtx);
1410 45300
                AZ(vtx);
1411 45300
                if (i)
1412 7000
                        return (i);
1413
        }
1414
1415 46319
        return (0);
1416 53319
}
1417
1418
/* Process the input cursor, calling the callback function on matching
1419
   transaction sets */
1420
int
1421 1568228
VSLQ_Dispatch(struct VSLQ *vslq, VSLQ_dispatch_f *func, void *priv)
1422
{
1423
        enum vsl_status r;
1424
        int i;
1425
        double now;
1426
        struct vtx *vtx;
1427
1428 1568228
        CHECK_OBJ_NOTNULL(vslq, VSLQ_MAGIC);
1429
1430
        /* Check that we have a cursor */
1431 1568228
        if (vslq->c == NULL)
1432 0
                return (vsl_e_abandon);
1433
1434 1568228
        if (vslq->grouping == VSL_g_raw)
1435 709059
                return (vslq_raw(vslq, func, priv));
1436
1437
        /* Process next cursor input */
1438 859169
        r = vslq_next(vslq);
1439 859169
        if (r != vsl_more)
1440
                /* At end of log or cursor reports error condition */
1441 397436
                return (r);
1442
1443
        /* Check shmref list and buffer if necessary */
1444 461733
        r = vslq_shmref_check(vslq);
1445 461733
        if (r != vsl_more)
1446
                /* Buffering of shm ref failed */
1447 0
                return (r);
1448
1449 461733
        assert (r == vsl_more);
1450
1451
        /* Check vtx timeout */
1452 461733
        now = VTIM_mono();
1453 461813
        while (!VTAILQ_EMPTY(&vslq->incomplete)) {
1454 333870
                vtx = VTAILQ_FIRST(&vslq->incomplete);
1455 333870
                CHECK_OBJ_NOTNULL(vtx, VTX_MAGIC);
1456 333870
                if (now - vtx->t_start < vslq->vsl->T_opt)
1457 333790
                        break;
1458 80
                vtx_force(vslq, vtx, "timeout");
1459 80
                AN(vtx->flags & VTX_F_COMPLETE);
1460
        }
1461
1462
        /* Check store limit */
1463 461733
        while (vslq->n_outstanding > vslq->vsl->L_opt &&
1464 0
            !(VTAILQ_EMPTY(&vslq->incomplete))) {
1465 0
                vtx = VTAILQ_FIRST(&vslq->incomplete);
1466 0
                CHECK_OBJ_NOTNULL(vtx, VTX_MAGIC);
1467 0
                vtx_force(vslq, vtx, "store overflow");
1468 0
                AN(vtx->flags & VTX_F_COMPLETE);
1469 0
                i = vslq_process_ready(vslq, func, priv);
1470 0
                if (i)
1471
                        /* User return code */
1472 0
                        return (i);
1473
        }
1474
1475
        /* Check ready list */
1476 461733
        if (!VTAILQ_EMPTY(&vslq->ready)) {
1477 39478
                i = vslq_process_ready(vslq, func, priv);
1478 39478
                if (i)
1479
                        /* User return code */
1480 7000
                        return (i);
1481 32478
        }
1482
1483 454733
        return (vsl_more);
1484 1568228
}
1485
1486
/* Flush any incomplete vtx held on to. Do callbacks if func != NULL */
1487
int
1488 13840
VSLQ_Flush(struct VSLQ *vslq, VSLQ_dispatch_f *func, void *priv)
1489
{
1490
        struct vtx *vtx;
1491
1492 13840
        CHECK_OBJ_NOTNULL(vslq, VSLQ_MAGIC);
1493
1494 19667
        while (!VTAILQ_EMPTY(&vslq->incomplete)) {
1495 5827
                vtx = VTAILQ_FIRST(&vslq->incomplete);
1496 5827
                CHECK_OBJ_NOTNULL(vtx, VTX_MAGIC);
1497 5827
                AZ(vtx->flags & VTX_F_COMPLETE);
1498 5827
                vtx_force(vslq, vtx, "flush");
1499
        }
1500
1501 13840
        return (vslq_process_ready(vslq, func, priv));
1502
}