varnish-cache/lib/libvarnishapi/vxp_lexer.c
0
/*-
1
 * Copyright (c) 2006 Verdens Gang AS
2
 * Copyright (c) 2006-2015 Varnish Software AS
3
 * All rights reserved.
4
 *
5
 * Author: Martin Blix Grydeland <martin@varnish-software.com>
6
 *
7
 * SPDX-License-Identifier: BSD-2-Clause
8
 *
9
 * Redistribution and use in source and binary forms, with or without
10
 * modification, are permitted provided that the following conditions
11
 * are met:
12
 * 1. Redistributions of source code must retain the above copyright
13
 *    notice, this list of conditions and the following disclaimer.
14
 * 2. Redistributions in binary form must reproduce the above copyright
15
 *    notice, this list of conditions and the following disclaimer in the
16
 *    documentation and/or other materials provided with the distribution.
17
 *
18
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
19
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21
 * ARE DISCLAIMED.  IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE
22
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
23
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
24
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
25
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
26
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
27
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
28
 * SUCH DAMAGE.
29
 *
30
 */
31
32
#include "config.h"
33
34
#include <ctype.h>
35
#include <stdlib.h>
36
#include <string.h>
37
#include <stdint.h>
38
#include <unistd.h> /* for MUSL */
39
40
#include "vdef.h"
41
#include "vas.h"
42
#include "vqueue.h"
43
44
#include "vre.h"
45
#include "vsb.h"
46
47
#include "vxp.h"
48
49
static void
50 7560
vxp_append_token(struct vxp *vxp, unsigned tok, const char *b, const char *e)
51
{
52
        struct token *t;
53
54 7560
        t = vxp_Alloc(vxp, sizeof *t);
55 7560
        AN(t);
56 7560
        t->tok = tok;
57 7560
        t->b = b;
58 7560
        t->e = e;
59 7560
        VTAILQ_INSERT_TAIL(&vxp->tokens, t, list);
60 7560
        vxp->t = t;
61 7560
}
62
63
/* Unquote and unescape string */
64
static void
65 306
vxp_decstr(struct vxp *vxp)
66
{
67
        const char *b, *e, *p;
68
        char *s;
69 306
        int esc = 0;
70
71 306
        assert(vxp->t->tok == VAL);
72
73 306
        b = vxp->t->b;
74 306
        e = vxp->t->e;
75 306
        assert(e - b >= 2);
76 306
        b++;
77 306
        e--;
78
79 306
        s = vxp->t->dec = vxp_Alloc(vxp, (e - b) + 1);
80 306
        AN(vxp->t->dec);
81 2196
        for (p = b; p < e; p++) {
82 1890
                if (!esc && *p == '\\') {
83 9
                        esc = 1;
84 9
                        continue;
85
                }
86 1881
                esc = 0;
87 1881
                *s++ = *p;
88 1881
        }
89 306
        *s = '\0';
90 306
}
91
92
/*
93
 * Build a token list
94
 */
95
96
void
97 1584
vxp_Lexer(struct vxp *vxp)
98
{
99
        const char *p, *q;
100
        unsigned u;
101
        char quote;
102
103 10989
        for (p = vxp->b; p < vxp->e; ) {
104
105
                /* Skip any space or tab */
106 9441
                if (isblank(*p)) {
107 3294
                        p++;
108 3294
                        continue;
109
                }
110
111 6147
                if (*p == '\\' && p[1] == '\n') {
112 18
                        p += 2;
113 18
                        continue;
114
                }
115
116
                /* Skip comments */
117 6129
                if (*p == '#') {
118 1638
                        while (p < vxp->e && *p != '\n')
119 1521
                                p++;
120 117
                        continue;
121
                }
122
123
                /* Match for the fixed tokens */
124 6012
                u = vxp_fixed_token(p, &q);
125 6012
                if (u != 0) {
126 2475
                        AN(q);
127 2475
                        vxp_append_token(vxp, u, p, q);
128 2475
                        p = q;
129 2475
                        continue;
130
                }
131
132
                /* Match quoted strings */
133 3537
                if (*p == '"' || *p == '\'') {
134 333
                        quote = *p;
135 2493
                        for (q = p + 1; q < vxp->e; q++) {
136 2484
                                if (*q == '\\') {
137 27
                                        q++;
138 27
                                        if (q == vxp->e || *q == '\n')
139 9
                                                break;
140 2475
                                } else if (*q == '\n') {
141 9
                                        break;
142 2448
                                } else if (*q == quote) {
143 306
                                        q++;
144 306
                                        quote = '\0';
145 306
                                        break;
146
                                }
147 2160
                        }
148 333
                        vxp_append_token(vxp, VAL, p, q);
149 333
                        if (quote != '\0') {
150 27
                                VSB_cat(vxp->sb, "Unterminated string ");
151 27
                                vxp_ErrWhere(vxp, vxp->t, q - p);
152 27
                                return;
153
                        }
154 306
                        vxp_decstr(vxp);
155 306
                        p = q;
156 306
                        continue;
157
                }
158
159
                /* Match bareword */
160 3204
                if (isword(*p)) {
161 20448
                        for (q = p; q < vxp->e; q++)
162 19377
                                if (!isword(*q))
163 1854
                                        break;
164 2925
                        vxp_append_token(vxp, VAL, p, q);
165 2925
                        vxp->t->dec = vxp_Alloc(vxp, (q - p) + 1);
166 2925
                        AN(vxp->t->dec);
167 2925
                        memcpy(vxp->t->dec, p, q - p);
168 2925
                        vxp->t->dec[q - p] = '\0';
169 2925
                        p = q;
170 2925
                        continue;
171
                }
172
173
                /* On to the next query */
174 279
                if (*p == '\n') {
175 270
                        vxp_append_token(vxp, EOI, p, p + 1);
176 270
                        p++;
177 270
                        continue;
178
                }
179
180
                /* Error */
181 9
                vxp_append_token(vxp, EOI, p, p + 1);
182 9
                VSB_cat(vxp->sb, "Syntax error ");
183 9
                vxp_ErrWhere(vxp, vxp->t, q - p);
184 9
                return;
185
        }
186
187
        /* Finished */
188 1548
        vxp_append_token(vxp, EOI, vxp->e, vxp->e);
189 1584
}
190
191
#ifdef VXP_DEBUG
192
#include <stdio.h>
193
void
194 27
vxp_PrintTokens(const struct vxp *vxp)
195
{
196
        struct token *t;
197
198 27
        fprintf(stderr, "Token list:\n");
199 27
        fprintf(stderr, "  %-5s %-20s %s\n", "TOK", "SUBSTR", "DECODED");
200 351
        VTAILQ_FOREACH(t, &vxp->tokens, list) {
201 324
                fprintf(stderr, "  ");
202 324
                fprintf(stderr, "%-5s", vxp_tnames[t->tok]);
203 324
                fprintf(stderr, " %-20.*s", (unsigned)(t->e - t->b), t->b);
204 324
                if (t->dec)
205 171
                        fprintf(stderr, " '%s'", t->dec);
206 324
                fprintf(stderr, "\n");
207 324
        }
208 27
        fprintf(stderr, "\n");
209 27
}
210
#endif /* VXP_DEBUG */