libidav/davqlparser.c

changeset 1
b5bb7b3cd597
child 49
2f71f4ee247a
equal deleted inserted replaced
0:2483f517c562 1:b5bb7b3cd597
1 /*
2 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER.
3 *
4 * Copyright 2018 Olaf Wintermann. All rights reserved.
5 *
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions are met:
8 *
9 * 1. Redistributions of source code must retain the above copyright
10 * notice, this list of conditions and the following disclaimer.
11 *
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 *
16 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
17 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
20 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
21 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
22 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
23 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
24 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
25 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
26 * POSSIBILITY OF SUCH DAMAGE.
27 */
28
29 #include "davqlparser.h"
30 #include <cx/utils.h>
31 #include <cx/linked_list.h>
32 #include <cx/printf.h>
33 #include <string.h>
34 #include <stdio.h>
35 #include <ctype.h>
36
37 #define sfmtarg(s) ((int)(s).length), (s).ptr
38
39 // ------------------------------------------------------------------------
40 // D E B U G E R
41 // ------------------------------------------------------------------------
42
43 static const char* _map_querytype(davqltype_t type) {
44 switch(type) {
45 case DAVQL_ERROR: return "ERROR";
46 case DAVQL_SELECT: return "SELECT";
47 case DAVQL_SET: return "SET";
48 default: return "unknown";
49 }
50 }
51
52 static const char* _map_exprtype(davqlexprtype_t type) {
53 switch(type) {
54 case DAVQL_UNDEFINED_TYPE: return "undefined";
55 case DAVQL_NUMBER: return "NUMBER";
56 case DAVQL_STRING: return "STRING";
57 case DAVQL_TIMESTAMP: return "TIMESTAMP";
58 case DAVQL_IDENTIFIER: return "IDENTIFIER";
59 case DAVQL_UNARY: return "UNARY";
60 case DAVQL_BINARY: return "BINARY";
61 case DAVQL_LOGICAL: return "LOGICAL";
62 case DAVQL_FUNCCALL: return "FUNCCALL";
63 default: return "unknown";
64 }
65 }
66
67 static const char* _map_specialfield(int info) {
68 switch(info) {
69 case 0: return "";
70 case 1: return "with wildcard";
71 case 2: return "(resource data only)";
72 default: return "with mysterious identifier";
73 }
74 }
75
76 static const char* _map_operator(davqloperator_t op) {
77 // don't use string array, because enum values may change
78 switch(op) {
79 case DAVQL_NOOP: return "no operator";
80 case DAVQL_CALL: return "function call"; case DAVQL_ARGLIST: return ",";
81 case DAVQL_ADD: return "+"; case DAVQL_SUB: return "-";
82 case DAVQL_MUL: return "*"; case DAVQL_DIV: return "/";
83 case DAVQL_AND: return "&"; case DAVQL_OR: return "|";
84 case DAVQL_XOR: return "^"; case DAVQL_NEG: return "~";
85 case DAVQL_NOT: return "NOT"; case DAVQL_LAND: return "AND";
86 case DAVQL_LOR: return "OR"; case DAVQL_LXOR: return "XOR";
87 case DAVQL_EQ: return "="; case DAVQL_NEQ: return "!=";
88 case DAVQL_LT: return "<"; case DAVQL_GT: return ">";
89 case DAVQL_LE: return "<="; case DAVQL_GE: return ">=";
90 case DAVQL_LIKE: return "LIKE"; case DAVQL_UNLIKE: return "UNLIKE";
91 default: return "unknown";
92 }
93 }
94
95 static void dav_debug_ql_fnames_print(DavQLStatement *stmt) {
96 if (stmt->fields) {
97 printf("Field names: ");
98 CxIterator i = cxListIterator(stmt->fields);
99 cx_foreach(DavQLField *, f, i) {
100 printf("%.*s, ", (int)f->name.length, f->name.ptr);
101 }
102 printf("\b\b \b\b\n");
103 }
104 }
105
106 static void dav_debug_ql_stmt_print(DavQLStatement *stmt) {
107 // Basic information
108 size_t fieldcount = stmt->fields ? stmt->fields->size : 0;
109 int specialfield = 0;
110 if (stmt->fields && stmt->fields->size > 0) {
111 DavQLField* firstfield = (DavQLField*)cxListAt(stmt->fields, 0);
112 if (firstfield->expr->type == DAVQL_IDENTIFIER) {
113 switch (firstfield->expr->srctext.ptr[0]) {
114 case '*': specialfield = 1; break;
115 case '-': specialfield = 2; break;
116 }
117 }
118 }
119 if (specialfield) {
120 fieldcount--;
121 }
122 printf("Statement: %.*s\nType: %s\nField count: %zu %s\n",
123 (int)stmt->srctext.length, stmt->srctext.ptr,
124 _map_querytype(stmt->type),
125 fieldcount,
126 _map_specialfield(specialfield));
127
128 dav_debug_ql_fnames_print(stmt);
129 printf("Path: %.*s\nHas where clause: %s\n",
130 (int)stmt->path.length, stmt->path.ptr,
131 stmt->where ? "yes" : "no");
132
133 // WITH attributes
134 if (stmt->depth == DAV_DEPTH_INFINITY) {
135 printf("Depth: infinity\n");
136 } else if (stmt->depth == DAV_DEPTH_PLACEHOLDER) {
137 printf("Depth: placeholder\n");
138 } else {
139 printf("Depth: %d\n", stmt->depth);
140 }
141
142 // order by clause
143 printf("Order by: ");
144 if (stmt->orderby) {
145 CxIterator i = cxListIterator(stmt->orderby);
146 cx_foreach(DavQLOrderCriterion*, critdata, i) {
147 printf("%.*s %s%s", (int)critdata->column->srctext.length, critdata->column->srctext.ptr,
148 critdata->descending ? "desc" : "asc",
149 i.index+1 < stmt->orderby->size ? ", " : "\n");
150 }
151 } else {
152 printf("nothing\n");
153 }
154
155 // error messages
156 if (stmt->errorcode) {
157 printf("\nError code: %d\nError: %s\n",
158 stmt->errorcode, stmt->errormessage);
159 }
160 }
161
162 static int dav_debug_ql_expr_selected(DavQLExpression *expr) {
163 if (!expr) {
164 printf("Currently no expression selected.\n");
165 return 0;
166 } else {
167 return 1;
168 }
169 }
170
171 static void dav_debug_ql_expr_print(DavQLExpression *expr) {
172 if (dav_debug_ql_expr_selected(expr)) {
173 cxstring empty = CX_STR("(empty)");
174 printf(
175 "Text: %.*s\nType: %s\nOperator: %s\n",
176 sfmtarg(expr->srctext),
177 _map_exprtype(expr->type),
178 _map_operator(expr->op));
179 if (expr->left || expr->right) {
180 printf("Left hand: %.*s\nRight hand: %.*s\n",
181 sfmtarg(expr->left?expr->left->srctext:empty),
182 sfmtarg(expr->right?expr->right->srctext:empty));
183 }
184 }
185 }
186
187 static void dav_debug_ql_field_print(DavQLField *field) {
188 if (field) {
189 printf("Name: %.*s\n", sfmtarg(field->name));
190 if (field->expr) {
191 dav_debug_ql_expr_print(field->expr);
192 } else {
193 printf("No expression.\n");
194 }
195 } else {
196 printf("No field selected.\n");
197 }
198 }
199
200 static void dav_debug_ql_tree_print(DavQLExpression *expr, int depth) {
201 if (expr) {
202 if (expr->left) {
203 printf("%*c%s\n", depth, ' ', _map_operator(expr->op));
204 dav_debug_ql_tree_print(expr->left, depth+1);
205 dav_debug_ql_tree_print(expr->right, depth+1);
206 } else if (expr->type == DAVQL_UNARY) {
207 printf("%*c%s %.*s\n", depth, ' ', _map_operator(expr->op),
208 sfmtarg(expr->srctext));
209 } else {
210 printf("%*c%.*s\n", depth, ' ', sfmtarg(expr->srctext));
211 }
212 }
213 }
214
215 #define DQLD_CMD_Q 0
216 #define DQLD_CMD_PS 1
217 #define DQLD_CMD_PE 2
218 #define DQLD_CMD_PF 3
219 #define DQLD_CMD_PT 4
220 #define DQLD_CMD_F 10
221 #define DQLD_CMD_W 11
222 #define DQLD_CMD_O 12
223 #define DQLD_CMD_L 21
224 #define DQLD_CMD_R 22
225 #define DQLD_CMD_N 23
226 #define DQLD_CMD_P 24
227 #define DQLD_CMD_H 100
228
229 static int dav_debug_ql_command() {
230 printf("> ");
231
232 char buffer[8];
233 fgets(buffer, 8, stdin);
234 // discard remaining chars
235 if (!strchr(buffer, '\n')) {
236 int chr;
237 while ((chr = fgetc(stdin) != '\n') && chr != EOF);
238 }
239
240 if (!strcmp(buffer, "q\n")) {
241 return DQLD_CMD_Q;
242 } else if (!strcmp(buffer, "ps\n")) {
243 return DQLD_CMD_PS;
244 } else if (!strcmp(buffer, "pe\n")) {
245 return DQLD_CMD_PE;
246 } else if (!strcmp(buffer, "pf\n")) {
247 return DQLD_CMD_PF;
248 } else if (!strcmp(buffer, "pt\n")) {
249 return DQLD_CMD_PT;
250 } else if (!strcmp(buffer, "l\n")) {
251 return DQLD_CMD_L;
252 } else if (!strcmp(buffer, "r\n")) {
253 return DQLD_CMD_R;
254 } else if (!strcmp(buffer, "h\n")) {
255 return DQLD_CMD_H;
256 } else if (!strcmp(buffer, "f\n")) {
257 return DQLD_CMD_F;
258 } else if (!strcmp(buffer, "w\n")) {
259 return DQLD_CMD_W;
260 } else if (!strcmp(buffer, "o\n")) {
261 return DQLD_CMD_O;
262 } else if (!strcmp(buffer, "n\n")) {
263 return DQLD_CMD_N;
264 } else if (!strcmp(buffer, "p\n")) {
265 return DQLD_CMD_P;
266 } else {
267 return -1;
268 }
269 }
270
271 void dav_debug_statement(DavQLStatement *stmt) {
272 if (!stmt) {
273 fprintf(stderr, "Debug DavQLStatement failed: null pointer");
274 return;
275 }
276
277 printf("Starting DavQL debugger (type 'h' for help)...\n\n");
278 dav_debug_ql_stmt_print(stmt);
279
280 if (stmt->errorcode) {
281 return;
282 }
283
284 DavQLExpression *examineexpr = NULL;
285 CxList *examineelem = NULL;
286 int examineclause = 0;
287
288 while(1) {
289 int cmd = dav_debug_ql_command();
290 switch (cmd) {
291 case DQLD_CMD_Q: return;
292 case DQLD_CMD_PS: dav_debug_ql_stmt_print(stmt); break;
293 case DQLD_CMD_PE: dav_debug_ql_expr_print(examineexpr); break;
294 case DQLD_CMD_PT: dav_debug_ql_tree_print(examineexpr, 1); break;
295 case DQLD_CMD_PF: dav_debug_ql_fnames_print(stmt); break;
296 case DQLD_CMD_F:
297 examineclause = DQLD_CMD_F;
298 examineelem = stmt->fields;
299 if (stmt->fields && stmt->fields->size > 0) {
300 DavQLField* field = cxListAt(stmt->fields, 0);
301 examineexpr = field->expr;
302 dav_debug_ql_field_print(field);
303 } else {
304 examineexpr = NULL;
305 }
306 break;
307 case DQLD_CMD_W:
308 examineclause = 0; examineelem = NULL;
309 examineexpr = stmt->where;
310 dav_debug_ql_expr_print(examineexpr);
311 break;
312 case DQLD_CMD_O:
313 examineclause = DQLD_CMD_O;
314 examineelem = stmt->orderby;
315 examineexpr = stmt->orderby && stmt->orderby->size > 0 ?
316 ((DavQLOrderCriterion*)cxListAt(stmt->orderby, 0))->column : NULL;
317 dav_debug_ql_expr_print(examineexpr);
318 break;
319 case DQLD_CMD_N:
320 case DQLD_CMD_P:
321 printf("TODO: port code to ucx 3\n");
322 /*
323 if (examineelem) {
324 CxList *newelem = (cmd == DQLD_CMD_N ?
325 examineelem->next : examineelem->prev);
326 if (newelem) {
327 examineelem = newelem;
328 if (examineclause == DQLD_CMD_O) {
329 examineexpr = ((DavQLOrderCriterion*)
330 examineelem->data)->column;
331 dav_debug_ql_expr_print(examineexpr);
332 } else if (examineclause == DQLD_CMD_F) {
333 DavQLField* field = (DavQLField*)examineelem->data;
334 examineexpr = field->expr;
335 dav_debug_ql_field_print(field);
336 } else {
337 printf("Examining unknown clause type.");
338 }
339 } else {
340 printf("Reached end of list.\n");
341 }
342 } else {
343 printf("Currently not examining an expression list.\n");
344 }
345 */
346 break;
347 case DQLD_CMD_L:
348 if (dav_debug_ql_expr_selected(examineexpr)) {
349 if (examineexpr->left) {
350 examineexpr = examineexpr->left;
351 dav_debug_ql_expr_print(examineexpr);
352 } else {
353 printf("There is no left subtree.\n");
354 }
355 }
356 break;
357 case DQLD_CMD_R:
358 if (dav_debug_ql_expr_selected(examineexpr)) {
359 if (examineexpr->right) {
360 examineexpr = examineexpr->right;
361 dav_debug_ql_expr_print(examineexpr);
362 } else {
363 printf("There is no right subtree.\n");
364 }
365 }
366 break;
367 case DQLD_CMD_H:
368 printf(
369 "\nCommands:\n"
370 "ps: print statement information\n"
371 "o: examine order by clause\n"
372 "f: examine field list\n"
373 "pf: print field names\n"
374 "w: examine where clause\n"
375 "n: examine next expression "
376 "(in order by clause or field list)\n"
377 "p: examine previous expression "
378 "(in order by clause or field list)\n"
379 "q: quit\n\n"
380 "\nExpression examination:\n"
381 "pe: print expression information\n"
382 "pt: print full syntax tree of current (sub-)expression\n"
383 "l: enter left subtree\n"
384 "r: enter right subtree\n");
385 break;
386 default: printf("unknown command\n");
387 }
388 }
389 }
390
391 // ------------------------------------------------------------------------
392 // P A R S E R
393 // ------------------------------------------------------------------------
394
395 #define _error_context "(%.*s[->]%.*s%.*s)"
396 #define _error_invalid "invalid statement"
397 #define _error_out_of_memory "out of memory"
398 #define _error_unexpected_token "unexpected token " _error_context
399 #define _error_invalid_token "invalid token " _error_context
400 #define _error_missing_path "expected path " _error_context
401 #define _error_missing_from "expecting FROM keyword " _error_context
402 #define _error_missing_at "expecting AT keyword " _error_context
403 #define _error_missing_by "expecting BY keyword " _error_context
404 #define _error_missing_as "expecting alias ('as <identifier>') " _error_context
405 #define _error_missing_identifier "expecting identifier " _error_context
406 #define _error_missing_par "missing closed parenthesis " _error_context
407 #define _error_missing_assign "expecting assignment ('=') " _error_context
408 #define _error_missing_where "SET statements must have a WHERE clause or " \
409 "explicitly use ANYWHERE " _error_context
410 #define _error_invalid_depth "invalid depth " _error_context
411 #define _error_missing_expr "missing expression " _error_context
412 #define _error_invalid_expr "invalid expression " _error_context
413 #define _error_invalid_unary_op "invalid unary operator " _error_context
414 #define _error_invalid_logical_op "invalid logical operator " _error_context
415 #define _error_invalid_fmtspec "invalid format specifier " _error_context
416 #define _error_invalid_string "string expected " _error_context
417 #define _error_invalid_order_criterion "invalid order criterion " _error_context
418
419 #define token_sstr(token) ((token)->value)
420
421 static void dav_error_in_context(int errorcode, const char *errormsg,
422 DavQLStatement *stmt, DavQLToken *token) {
423
424 // we try to achieve two things: get as many information as possible
425 // and recover the concrete source string (and not the token strings)
426 cxstring emptystring = CX_STR("");
427 cxstring prev = token->prev ? (token->prev->prev ?
428 token_sstr(token->prev->prev) : token_sstr(token->prev))
429 : emptystring;
430 cxstring tokenstr = token_sstr(token);
431 cxstring next = token->next ? (token->next->next ?
432 token_sstr(token->next->next) : token_sstr(token->next))
433 : emptystring;
434
435 int lp = prev.length == 0 ? 0 : tokenstr.ptr-prev.ptr;
436 const char *pn = tokenstr.ptr + tokenstr.length;
437 int ln = next.ptr+next.length - pn;
438
439 stmt->errorcode = errorcode;
440 stmt->errormessage = cx_asprintf(errormsg,
441 lp, prev.ptr,
442 sfmtarg(tokenstr),
443 ln, pn).ptr;
444 }
445
446 #define dqlsec_alloc_failed(ptr, stmt) \
447 if (!(ptr)) do { \
448 (stmt)->errorcode = DAVQL_ERROR_OUT_OF_MEMORY; \
449 return 0; \
450 } while(0)
451 #define dqlsec_malloc(stmt, ptr, type) \
452 dqlsec_alloc_failed(ptr = malloc(sizeof(type)), stmt)
453 #define dqlsec_mallocz(stmt, ptr, type) \
454 dqlsec_alloc_failed(ptr = calloc(1, sizeof(type)), stmt)
455
456
457 // special symbols are single tokens - the % sign MUST NOT be a special symbol
458 static const char *special_token_symbols = ",()+-*/&|^~=!<>";
459
460 static _Bool iskeyword(DavQLToken *token) {
461 cxstring keywords[] ={CX_STR("select"), CX_STR("set"), CX_STR("from"), CX_STR("at"), CX_STR("as"),
462 CX_STR("where"), CX_STR("anywhere"), CX_STR("like"), CX_STR("unlike"), CX_STR("and"),
463 CX_STR("or"), CX_STR("not"), CX_STR("xor"), CX_STR("with"), CX_STR("infinity"),
464 CX_STR("order"), CX_STR("by"), CX_STR("asc"), CX_STR("desc")
465 };
466 for (int i = 0 ; i < sizeof(keywords)/sizeof(cxstring) ; i++) {
467 if (!cx_strcasecmp(token->value, keywords[i])) {
468 return 1;
469 }
470 }
471 return 0;
472 }
473
474 static _Bool islongoperator(DavQLToken *token) {
475 cxstring operators[] = {CX_STR("and"), CX_STR("or"), CX_STR("not"), CX_STR("xor"),
476 CX_STR("like"), CX_STR("unlike")
477 };
478 for (int i = 0 ; i < sizeof(operators)/sizeof(cxstring) ; i++) {
479 if (!cx_strcasecmp(token->value, operators[i])) {
480 return 1;
481 }
482 }
483 return 0;
484 }
485
486 static int dav_stmt_add_field(DavQLStatement *stmt, DavQLField *field) {
487 if(!stmt->fields) {
488 stmt->fields = cxLinkedListCreateSimple(CX_STORE_POINTERS);
489 if(!stmt->fields) {
490 stmt->errorcode = DAVQL_ERROR_OUT_OF_MEMORY;
491 return 1;
492 }
493 }
494
495 if(cxListAdd(stmt->fields, field)) {
496 stmt->errorcode = DAVQL_ERROR_OUT_OF_MEMORY;
497 return 1;
498 }
499
500 return 0;
501 }
502
503
504 static void tokenlist_free(DavQLToken *tokenlist) {
505 DavQLToken *token = tokenlist;
506 while(token) {
507 DavQLToken *next = token->next;
508 free(token);
509 token = next;
510 }
511 }
512
513 static int dav_parse_add_token(DavQLToken **begin, DavQLToken **end, DavQLToken *token) {
514
515 // determine token class (order of if-statements is very important!)
516 char firstchar = token->value.ptr[0];
517
518 if (isdigit(firstchar)) {
519 token->tokenclass = DAVQL_TOKEN_NUMBER;
520 // check, if all characters are digits
521 for (size_t i = 1 ; i < token->value.length ; i++) {
522 if (!isdigit(token->value.ptr[i])) {
523 token->tokenclass = DAVQL_TOKEN_INVALID;
524 break;
525 }
526 }
527 } else if (firstchar == '%') {
528 token->tokenclass = DAVQL_TOKEN_FMTSPEC;
529 } else if (token->value.length == 1) {
530 switch (firstchar) {
531 case '(': token->tokenclass = DAVQL_TOKEN_OPENP; break;
532 case ')': token->tokenclass = DAVQL_TOKEN_CLOSEP; break;
533 case ',': token->tokenclass = DAVQL_TOKEN_COMMA; break;
534 default:
535 token->tokenclass = strchr(special_token_symbols, firstchar) ?
536 DAVQL_TOKEN_OPERATOR : DAVQL_TOKEN_IDENTIFIER;
537 }
538 } else if (islongoperator(token)) {
539 token->tokenclass = DAVQL_TOKEN_OPERATOR;
540 } else if (firstchar == '\'') {
541 token->tokenclass = DAVQL_TOKEN_STRING;
542 } else if (firstchar == '`') {
543 token->tokenclass = DAVQL_TOKEN_IDENTIFIER;
544 } else if (iskeyword(token)) {
545 token->tokenclass = DAVQL_TOKEN_KEYWORD;
546 } else {
547 token->tokenclass = DAVQL_TOKEN_IDENTIFIER;
548 // TODO: check for illegal characters
549 }
550
551 // remove quotes (extreme cool feature)
552 if (token->tokenclass == DAVQL_TOKEN_STRING ||
553 (token->tokenclass == DAVQL_TOKEN_IDENTIFIER && firstchar == '`')) {
554
555 char lastchar = token->value.ptr[token->value.length-1];
556 if (firstchar == lastchar) {
557 token->value.ptr++;
558 token->value.length -= 2;
559 } else {
560 token->tokenclass = DAVQL_TOKEN_INVALID;
561 }
562 }
563
564 cx_linked_list_add((void**)begin, (void**)end, offsetof(DavQLToken, prev), offsetof(DavQLToken, next), token);
565 return 0;
566 }
567
568
569
570 static DavQLToken* dav_parse_tokenize(cxstring src) {
571 #define alloc_token() do {token = calloc(1, sizeof(DavQLToken));\
572 if(!token) {tokenlist_free(tokens_begin); return NULL;}} while(0)
573 #define add_token() if(dav_parse_add_token(&tokens_begin, &tokens_end, token)) return NULL;
574
575 DavQLToken *tokens_begin = NULL;
576 DavQLToken *tokens_end = NULL;
577
578 DavQLToken *token = NULL;
579
580 char insequence = '\0';
581 for (size_t i = 0 ; i < src.length ; i++) {
582 // quoted strings / identifiers are a single token
583 if (src.ptr[i] == '\'' || src.ptr[i] == '`') {
584 if (src.ptr[i] == insequence) {
585 // lookahead for escaped string quotes
586 if (src.ptr[i] == '\'' && i+2 < src.length &&
587 src.ptr[i+1] == src.ptr[i] && src.ptr[i+2] == src.ptr[i]) {
588 token->value.length += 3;
589 i += 2;
590 } else {
591 // add quoted token to list
592 token->value.length++;
593 add_token();
594 token = NULL;
595 insequence = '\0';
596 }
597 } else if (insequence == '\0') {
598 insequence = src.ptr[i];
599 // always create new token for quoted strings
600 if (token) {
601 add_token();
602 }
603 alloc_token();
604 token->value.ptr = src.ptr + i;
605 token->value.length = 1;
606 } else {
607 // add other kind of quotes to token
608 token->value.length++;
609 }
610 } else if (insequence) {
611 token->value.length++;
612 } else if (isspace(src.ptr[i])) {
613 // add token before spaces to list (if any)
614 if (token) {
615 add_token();
616 token = NULL;
617 }
618 } else if (strchr(special_token_symbols, src.ptr[i])) {
619 // add token before special symbol to list (if any)
620 if (token) {
621 add_token();
622 token = NULL;
623 }
624 // add special symbol as single token to list
625 alloc_token();
626 token->value.ptr = src.ptr + i;
627 token->value.length = 1;
628 add_token();
629 // set tokenizer ready to read more tokens
630 token = NULL;
631 } else {
632 // if this is a new token, create memory for it
633 if (!token) {
634 alloc_token();
635 token->value.ptr = src.ptr + i;
636 token->value.length = 0;
637 }
638 // extend token length when reading more bytes
639 token->value.length++;
640 }
641 }
642
643 if (token) {
644 add_token();
645 }
646
647 alloc_token();
648 token->tokenclass = DAVQL_TOKEN_END;
649 token->value = CX_STR("");
650
651 cx_linked_list_add((void**)&tokens_begin, (void**)&tokens_end, offsetof(DavQLToken, prev), offsetof(DavQLToken, next), token);
652 return tokens_begin;
653 #undef alloc_token
654 #undef add_token
655 }
656
657 static void dav_free_expression(DavQLExpression *expr) {
658 if (expr) {
659 if (expr->left) {
660 dav_free_expression(expr->left);
661 }
662 if (expr->right) {
663 dav_free_expression(expr->right);
664 }
665 free(expr);
666 }
667 }
668
669 static void dav_free_field(DavQLField *field) {
670 dav_free_expression(field->expr);
671 free(field);
672 }
673
674 static void dav_free_order_criterion(DavQLOrderCriterion *crit) {
675 if (crit->column) { // do it null-safe though column is expected to be set
676 dav_free_expression(crit->column);
677 }
678 }
679
680 #define token_is(token, expectedclass) (token && \
681 (token->tokenclass == expectedclass))
682
683 #define tokenvalue_is(token, expectedvalue) (token && \
684 !cx_strcasecmp(token->value, cx_str(expectedvalue)))
685
686 typedef int(*exprparser_f)(DavQLStatement*,DavQLToken*,DavQLExpression*);
687
688 static int dav_parse_binary_expr(DavQLStatement* stmt, DavQLToken* token,
689 DavQLExpression* expr, exprparser_f parseL, char* opc, int* opv,
690 exprparser_f parseR) {
691
692 if (!token) {
693 return 0;
694 }
695
696 int total_consumed = 0, consumed;
697
698 // save temporarily on stack (copy to heap later on)
699 DavQLExpression left, right;
700
701 // RULE: LEFT, [Operator, RIGHT]
702 memset(&left, 0, sizeof(DavQLExpression));
703 consumed = parseL(stmt, token, &left);
704 if (!consumed || stmt->errorcode) {
705 return 0;
706 }
707 total_consumed += consumed;
708 token = cx_linked_list_at(token, 0, offsetof(DavQLToken, next), consumed);
709
710 char *op;
711 if (token_is(token, DAVQL_TOKEN_OPERATOR) &&
712 (op = strchr(opc, token_sstr(token).ptr[0]))) {
713 expr->op = opv[op-opc];
714 expr->type = DAVQL_BINARY;
715 total_consumed++;
716 token = token->next;
717 memset(&right, 0, sizeof(DavQLExpression));
718 consumed = parseR(stmt, token, &right);
719 if (stmt->errorcode) {
720 return 0;
721 }
722 if (!consumed) {
723 dav_error_in_context(DAVQL_ERROR_MISSING_EXPR,
724 _error_missing_expr, stmt, token);
725 return 0;
726 }
727 total_consumed += consumed;
728 }
729
730 if (expr->op == DAVQL_NOOP) {
731 memcpy(expr, &left, sizeof(DavQLExpression));
732 } else {
733 dqlsec_malloc(stmt, expr->left, DavQLExpression);
734 memcpy(expr->left, &left, sizeof(DavQLExpression));
735 dqlsec_malloc(stmt, expr->right, DavQLExpression);
736 memcpy(expr->right, &right, sizeof(DavQLExpression));
737
738 expr->srctext.ptr = expr->left->srctext.ptr;
739 expr->srctext.length =
740 expr->right->srctext.ptr -
741 expr->left->srctext.ptr + expr->right->srctext.length;
742 }
743
744 return total_consumed;
745 }
746
747 static void fmt_args_add(DavQLStatement *stmt, void *data) {
748 if(!stmt->args) {
749 stmt->args = cxLinkedListCreateSimple(CX_STORE_POINTERS);
750 }
751 cxListAdd(stmt->args, data);
752 }
753
754 static void dav_add_fmt_args(DavQLStatement *stmt, cxstring str) {
755 int placeholder = 0;
756 for (size_t i=0;i<str.length;i++) {
757 char c = str.ptr[i];
758 if (placeholder) {
759 if (c != '%') {
760 fmt_args_add(stmt, (void*)(intptr_t)c);
761 }
762 placeholder = 0;
763 } else if (c == '%') {
764 placeholder = 1;
765 }
766 }
767 }
768
769 static int dav_parse_literal(DavQLStatement* stmt, DavQLToken* token,
770 DavQLExpression* expr) {
771
772 expr->srctext = token_sstr(token);
773 if (token_is(token, DAVQL_TOKEN_NUMBER)) {
774 expr->type = DAVQL_NUMBER;
775 } else if (token_is(token, DAVQL_TOKEN_STRING)) {
776 expr->type = DAVQL_STRING;
777 // check for format specifiers and add args
778 dav_add_fmt_args(stmt, expr->srctext);
779 } else if (token_is(token, DAVQL_TOKEN_TIMESTAMP)) {
780 expr->type = DAVQL_TIMESTAMP;
781 } else if (token_is(token, DAVQL_TOKEN_FMTSPEC)
782 && expr->srctext.length == 2) {
783 switch (expr->srctext.ptr[1]) {
784 case 'd': expr->type = DAVQL_NUMBER; break;
785 case 's': expr->type = DAVQL_STRING; break;
786 case 't': expr->type = DAVQL_TIMESTAMP; break;
787 default:
788 dav_error_in_context(DAVQL_ERROR_INVALID_FMTSPEC,
789 _error_invalid_fmtspec, stmt, token);
790 return 0;
791 }
792 // add fmtspec type to query arg list
793 fmt_args_add(stmt, (void*)(intptr_t)expr->srctext.ptr[1]);
794 } else {
795 return 0;
796 }
797
798 return 1;
799 }
800
801 // forward declaration
802 static int dav_parse_expression(DavQLStatement* stmt, DavQLToken* token,
803 DavQLExpression* expr);
804
805 static int dav_parse_arglist(DavQLStatement* stmt, DavQLToken* token,
806 DavQLExpression* expr) {
807
808 expr->srctext.ptr = token_sstr(token).ptr;
809 expr->srctext.length = 0;
810 expr->left = expr->right = NULL; // in case we fail, we want them to be sane
811
812 int total_consumed = 0;
813
814 // RULE: Expression, {",", Expression};
815 DavQLExpression *arglist = expr;
816 DavQLExpression arg;
817 const char *lastchar = expr->srctext.ptr;
818 int consumed;
819 do {
820 memset(&arg, 0, sizeof(DavQLExpression));
821 consumed = dav_parse_expression(stmt, token, &arg);
822 if (consumed) {
823 lastchar = arg.srctext.ptr + arg.srctext.length;
824 total_consumed += consumed;
825 token = cx_linked_list_at(token, 0, offsetof(DavQLToken, next), consumed);
826 // look ahead for a comma
827 if (token_is(token, DAVQL_TOKEN_COMMA)) {
828 total_consumed++;
829 token = token->next;
830 /* we have more arguments, so put the current argument to the
831 * left subtree and create a new node to the right
832 */
833 dqlsec_malloc(stmt, arglist->left, DavQLExpression);
834 memcpy(arglist->left, &arg, sizeof(DavQLExpression));
835 arglist->srctext.ptr = arg.srctext.ptr;
836 arglist->op = DAVQL_ARGLIST;
837 arglist->type = DAVQL_FUNCCALL;
838 dqlsec_mallocz(stmt, arglist->right, DavQLExpression);
839 arglist = arglist->right;
840 } else {
841 // this was the last argument, so write it to the current node
842 memcpy(arglist, &arg, sizeof(DavQLExpression));
843 consumed = 0;
844 }
845 }
846 } while (consumed && !stmt->errorcode);
847
848 // recover source text
849 arglist = expr;
850 while (arglist && arglist->type == DAVQL_FUNCCALL) {
851 arglist->srctext.length = lastchar - arglist->srctext.ptr;
852 arglist = arglist->right;
853 }
854
855 return total_consumed;
856 }
857
858 static int dav_parse_funccall(DavQLStatement* stmt, DavQLToken* token,
859 DavQLExpression* expr) {
860
861 // RULE: Identifier, "(", ArgumentList, ")";
862 if (token_is(token, DAVQL_TOKEN_IDENTIFIER) &&
863 token_is(token->next, DAVQL_TOKEN_OPENP)) {
864
865 expr->type = DAVQL_FUNCCALL;
866 expr->op = DAVQL_CALL;
867
868 dqlsec_mallocz(stmt, expr->left, DavQLExpression);
869 expr->left->type = DAVQL_IDENTIFIER;
870 expr->left->srctext = token_sstr(token);
871 expr->right = NULL;
872
873 token = token->next->next;
874
875 DavQLExpression arg;
876 int argtokens = dav_parse_arglist(stmt, token, &arg);
877 if (stmt->errorcode) {
878 // if an error occurred while parsing the arglist, return now
879 return 2;
880 }
881 if (argtokens) {
882 token = cx_linked_list_at(token, 0, offsetof(DavQLToken, next), argtokens);
883 dqlsec_malloc(stmt, expr->right, DavQLExpression);
884 memcpy(expr->right, &arg, sizeof(DavQLExpression));
885 } else {
886 // arg list may be empty
887 expr->right = NULL;
888 }
889
890 if (token_is(token, DAVQL_TOKEN_CLOSEP)) {
891 return 3 + argtokens;
892 } else {
893 dav_error_in_context(DAVQL_ERROR_MISSING_PAR, _error_missing_par,
894 stmt, token);
895 return 2; // it MUST be a function call, but it is invalid
896 }
897 } else {
898 return 0;
899 }
900 }
901
902 static int dav_parse_unary_expr(DavQLStatement* stmt, DavQLToken* token,
903 DavQLExpression* expr) {
904
905 DavQLToken *firsttoken = token; // save for srctext recovery
906
907 DavQLExpression* atom = expr;
908 int total_consumed = 0;
909
910 // optional unary operator
911 if (token_is(token, DAVQL_TOKEN_OPERATOR)) {
912 char *op = strchr("+-~", token_sstr(token).ptr[0]);
913 if (op) {
914 expr->type = DAVQL_UNARY;
915 switch (*op) {
916 case '+': expr->op = DAVQL_ADD; break;
917 case '-': expr->op = DAVQL_SUB; break;
918 case '~': expr->op = DAVQL_NEG; break;
919 }
920 dqlsec_mallocz(stmt, expr->left, DavQLExpression);
921 atom = expr->left;
922 total_consumed++;
923 token = token->next;
924 } else {
925 dav_error_in_context(DAVQL_ERROR_INVALID_UNARY_OP,
926 _error_invalid_unary_op, stmt, token);
927 return 0;
928 }
929 }
930
931 // RULE: (ParExpression | AtomicExpression)
932 if (token_is(token, DAVQL_TOKEN_OPENP)) {
933 token = token->next; total_consumed++;
934 // RULE: "(", Expression, ")"
935 int consumed = dav_parse_expression(stmt, token, atom);
936 if (stmt->errorcode) {
937 return 0;
938 }
939 if (!consumed) {
940 dav_error_in_context(DAVQL_ERROR_INVALID_EXPR,
941 _error_invalid_expr, stmt, token);
942 return 0;
943 }
944 token = cx_linked_list_at(token, 0, offsetof(DavQLToken, next), consumed);
945 total_consumed += consumed;
946 if (token_is(token, DAVQL_TOKEN_CLOSEP)) {
947 token = token->next; total_consumed++;
948 } else {
949 dav_error_in_context(DAVQL_ERROR_MISSING_PAR,
950 _error_missing_par, stmt, token);
951 return 0;
952 }
953 } else {
954 // RULE: FunctionCall
955 int consumed = dav_parse_funccall(stmt, token, atom);
956 if (consumed) {
957 total_consumed += consumed;
958 } else if (token_is(token, DAVQL_TOKEN_IDENTIFIER)) {
959 // RULE: Identifier
960 total_consumed++;
961 atom->type = DAVQL_IDENTIFIER;
962 atom->srctext = token_sstr(token);
963 } else {
964 // RULE: Literal
965 total_consumed += dav_parse_literal(stmt, token, atom);
966 }
967 }
968
969 // recover source text
970 expr->srctext.ptr = token_sstr(firsttoken).ptr;
971 if (total_consumed > 0) {
972 cxstring lasttoken =
973 token_sstr((DavQLToken*)cx_linked_list_at(token, 0, offsetof(DavQLToken, next), total_consumed-1));
974 expr->srctext.length =
975 lasttoken.ptr - expr->srctext.ptr + lasttoken.length;
976 } else {
977 // the expression should not be used anyway, but we want to be safe
978 expr->srctext.length = 0;
979 }
980
981
982 return total_consumed;
983 }
984
985 static int dav_parse_bitexpr(DavQLStatement* stmt, DavQLToken* token,
986 DavQLExpression* expr) {
987
988 return dav_parse_binary_expr(stmt, token, expr,
989 dav_parse_unary_expr,
990 "&|^", (int[]){DAVQL_AND, DAVQL_OR, DAVQL_XOR},
991 dav_parse_bitexpr);
992 }
993
994 static int dav_parse_multexpr(DavQLStatement* stmt, DavQLToken* token,
995 DavQLExpression* expr) {
996
997 return dav_parse_binary_expr(stmt, token, expr,
998 dav_parse_bitexpr,
999 "*/", (int[]){DAVQL_MUL, DAVQL_DIV},
1000 dav_parse_multexpr);
1001 }
1002
1003 static int dav_parse_expression(DavQLStatement* stmt, DavQLToken* token,
1004 DavQLExpression* expr) {
1005
1006 return dav_parse_binary_expr(stmt, token, expr,
1007 dav_parse_multexpr,
1008 "+-", (int[]){DAVQL_ADD, DAVQL_SUB},
1009 dav_parse_expression);
1010 }
1011
1012 static int dav_parse_named_field(DavQLStatement *stmt, DavQLToken *token,
1013 DavQLField *field) {
1014 int total_consumed = 0, consumed;
1015
1016 // RULE: Expression, " as ", Identifier;
1017 DavQLExpression *expr;
1018 dqlsec_mallocz(stmt, expr, DavQLExpression);
1019 consumed = dav_parse_expression(stmt, token, expr);
1020 if (stmt->errorcode) {
1021 dav_free_expression(expr);
1022 return 0;
1023 }
1024 if (expr->type == DAVQL_UNDEFINED_TYPE) {
1025 dav_free_expression(expr);
1026 dav_error_in_context(DAVQL_ERROR_INVALID_EXPR,
1027 _error_invalid_expr, stmt, token);
1028 return 0;
1029 }
1030
1031 token = cx_linked_list_at(token, 0, offsetof(DavQLToken, next), consumed);
1032 total_consumed += consumed;
1033
1034 if (token_is(token, DAVQL_TOKEN_KEYWORD) && tokenvalue_is(token, "as")) {
1035 token = token->next; total_consumed++;
1036 } else {
1037 dav_free_expression(expr);
1038 dav_error_in_context(DAVQL_ERROR_MISSING_TOKEN,
1039 _error_missing_as, stmt, token);
1040 return 0;
1041 }
1042
1043 if (token_is(token, DAVQL_TOKEN_IDENTIFIER)) {
1044 field->name = token_sstr(token);
1045 field->expr = expr;
1046 return total_consumed + 1;
1047 } else {
1048 dav_free_expression(expr);
1049 dav_error_in_context(DAVQL_ERROR_MISSING_TOKEN,
1050 _error_missing_identifier, stmt, token);
1051 return 0;
1052 }
1053 }
1054
1055 static int dav_parse_fieldlist(DavQLStatement *stmt, DavQLToken *token) {
1056
1057 // RULE: "-"
1058 if (token_is(token, DAVQL_TOKEN_OPERATOR) && tokenvalue_is(token, "-")) {
1059 DavQLField *field;
1060 dqlsec_malloc(stmt, field, DavQLField);
1061 if(dav_stmt_add_field(stmt, field)) {
1062 free(field);
1063 return 0;
1064 }
1065 dqlsec_mallocz(stmt, field->expr, DavQLExpression);
1066 field->expr->type = DAVQL_IDENTIFIER;
1067 field->expr->srctext = field->name = token_sstr(token);
1068 return 1;
1069 }
1070
1071 // RULE: "*", {",", NamedExpression}
1072 if (token_is(token, DAVQL_TOKEN_OPERATOR) && tokenvalue_is(token, "*")) {
1073 DavQLField *field;
1074 dqlsec_malloc(stmt, field, DavQLField);
1075 if(dav_stmt_add_field(stmt, field)) {
1076 free(field);
1077 return 0;
1078 }
1079 dqlsec_mallocz(stmt, field->expr, DavQLExpression);
1080 field->expr->type = DAVQL_IDENTIFIER;
1081 field->expr->srctext = field->name = token_sstr(token);
1082
1083 int total_consumed = 0;
1084 int consumed = 1;
1085
1086 do {
1087 token = cx_linked_list_at(token, 0, offsetof(DavQLToken, next), consumed);
1088 total_consumed += consumed;
1089
1090 if (token_is(token, DAVQL_TOKEN_COMMA)) {
1091 total_consumed++; token = token->next;
1092 DavQLField localfield;
1093 consumed = dav_parse_named_field(stmt, token, &localfield);
1094 if (!stmt->errorcode && consumed) {
1095 DavQLField *field;
1096 dqlsec_malloc(stmt, field, DavQLField);
1097 memcpy(field, &localfield, sizeof(DavQLField));
1098 if(dav_stmt_add_field(stmt, field)) {
1099 free(field);
1100 return 0;
1101 }
1102 }
1103 } else {
1104 consumed = 0;
1105 }
1106 } while (consumed > 0);
1107
1108 return total_consumed;
1109 }
1110
1111 // RULE: FieldExpression, {",", FieldExpression}
1112 {
1113 int total_consumed = 0, consumed;
1114 do {
1115 // RULE: NamedField | Identifier
1116 DavQLField localfield;
1117 consumed = dav_parse_named_field(stmt, token, &localfield);
1118 if (consumed) {
1119 DavQLField *field;
1120 dqlsec_malloc(stmt, field, DavQLField);
1121 memcpy(field, &localfield, sizeof(DavQLField));
1122 if(dav_stmt_add_field(stmt, field)) {
1123 free(field);
1124 return 0;
1125 }
1126 token = cx_linked_list_at(token, 0, offsetof(DavQLToken, next), consumed);
1127 total_consumed += consumed;
1128 } else if (token_is(token, DAVQL_TOKEN_IDENTIFIER)
1129 // look ahead, if the field is JUST the identifier
1130 && (token_is(token->next, DAVQL_TOKEN_COMMA) ||
1131 tokenvalue_is(token->next, "from"))) {
1132
1133 DavQLField *field;
1134 dqlsec_malloc(stmt, field, DavQLField);
1135 dqlsec_mallocz(stmt, field->expr, DavQLExpression);
1136 field->expr->type = DAVQL_IDENTIFIER;
1137 field->expr->srctext = field->name = token_sstr(token);
1138 if(dav_stmt_add_field(stmt, field)) {
1139 free(field);
1140 return 0;
1141 }
1142
1143 consumed = 1;
1144 total_consumed++;
1145 token = token->next;
1146
1147 // we found a valid solution, so erase any errors
1148 stmt->errorcode = 0;
1149 if (stmt->errormessage) {
1150 free(stmt->errormessage);
1151 stmt->errormessage = NULL;
1152 }
1153 } else {
1154 // dav_parse_named_field has already thrown a good error
1155 consumed = 0;
1156 }
1157
1158 // field has been parsed, now try to get a comma
1159 if (consumed) {
1160 consumed = token_is(token, DAVQL_TOKEN_COMMA) ? 1 : 0;
1161 if (consumed) {
1162 token = token->next;
1163 total_consumed++;
1164 }
1165 }
1166 } while (consumed);
1167
1168 return total_consumed;
1169 }
1170 }
1171
1172 // forward declaration
1173 static int dav_parse_logical_expr(DavQLStatement *stmt, DavQLToken *token,
1174 DavQLExpression *expr);
1175
1176 static int dav_parse_bool_prim(DavQLStatement *stmt, DavQLToken *token,
1177 DavQLExpression *expr) {
1178
1179 expr->type = DAVQL_LOGICAL;
1180 expr->srctext = token_sstr(token);
1181
1182 int total_consumed = 0;
1183
1184 DavQLExpression bexpr;
1185 memset(&bexpr, 0, sizeof(DavQLExpression));
1186 total_consumed = dav_parse_expression(stmt, token, &bexpr);
1187 if (!total_consumed || stmt->errorcode) {
1188 return 0;
1189 }
1190 token = cx_linked_list_at(token, 0, offsetof(DavQLToken, next), total_consumed);
1191
1192 DavQLToken* optok = token;
1193 // RULE: Expression, (" like " | " unlike "), String
1194 if (token_is(optok, DAVQL_TOKEN_OPERATOR) && (tokenvalue_is(optok,
1195 "like") || tokenvalue_is(optok, "unlike"))) {
1196
1197 total_consumed++;
1198 token = token->next;
1199 if (token_is(token, DAVQL_TOKEN_STRING)) {
1200 expr->op = tokenvalue_is(optok, "like") ?
1201 DAVQL_LIKE : DAVQL_UNLIKE;
1202 dqlsec_malloc(stmt, expr->left, DavQLExpression);
1203 memcpy(expr->left, &bexpr, sizeof(DavQLExpression));
1204 dqlsec_mallocz(stmt, expr->right, DavQLExpression);
1205 expr->right->type = DAVQL_STRING;
1206 expr->right->srctext = token_sstr(token);
1207 expr->srctext.length = expr->right->srctext.ptr -
1208 expr->srctext.ptr + expr->right->srctext.length;
1209
1210 // fmt args
1211 dav_add_fmt_args(stmt, expr->right->srctext);
1212
1213 return total_consumed + 1;
1214 } else {
1215 dav_error_in_context(DAVQL_ERROR_INVALID_STRING,
1216 _error_invalid_string, stmt, token);
1217 return 0;
1218 }
1219 }
1220 // RULE: Expression, Comparison, Expression
1221 else if (token_is(optok, DAVQL_TOKEN_OPERATOR) && (
1222 tokenvalue_is(optok, "=") || tokenvalue_is(optok, "!") ||
1223 tokenvalue_is(optok, "<") || tokenvalue_is(optok, ">"))) {
1224
1225 total_consumed++;
1226 token = token->next;
1227
1228 if (tokenvalue_is(optok, "=")) {
1229 expr->op = DAVQL_EQ;
1230 } else {
1231 if (tokenvalue_is(token, "=")) {
1232 if (tokenvalue_is(optok, "!")) {
1233 expr->op = DAVQL_NEQ;
1234 } else if (tokenvalue_is(optok, "<")) {
1235 expr->op = DAVQL_LE;
1236 } else if (tokenvalue_is(optok, ">")) {
1237 expr->op = DAVQL_GE;
1238 }
1239 total_consumed++;
1240 token = token->next;
1241 } else {
1242 if (tokenvalue_is(optok, "<")) {
1243 expr->op = DAVQL_LT;
1244 } else if (tokenvalue_is(optok, ">")) {
1245 expr->op = DAVQL_GT;
1246 }
1247 }
1248 }
1249
1250 DavQLExpression rexpr;
1251 memset(&rexpr, 0, sizeof(DavQLExpression));
1252 int consumed = dav_parse_expression(stmt, token, &rexpr);
1253 if (stmt->errorcode) {
1254 return 0;
1255 }
1256 if (!consumed) {
1257 dav_error_in_context(
1258 DAVQL_ERROR_MISSING_EXPR, _error_missing_expr,
1259 stmt, token);
1260 return 0;
1261 }
1262
1263 total_consumed += consumed;
1264 dqlsec_malloc(stmt, expr->left, DavQLExpression);
1265 memcpy(expr->left, &bexpr, sizeof(DavQLExpression));
1266 dqlsec_malloc(stmt, expr->right, DavQLExpression);
1267 memcpy(expr->right, &rexpr, sizeof(DavQLExpression));
1268
1269 expr->srctext.length = expr->right->srctext.ptr -
1270 expr->srctext.ptr + expr->right->srctext.length;
1271
1272 return total_consumed;
1273 }
1274 // RULE: FunctionCall | Identifier;
1275 else if (bexpr.type == DAVQL_FUNCCALL || bexpr.type == DAVQL_IDENTIFIER) {
1276 memcpy(expr, &bexpr, sizeof(DavQLExpression));
1277
1278 return total_consumed;
1279 } else {
1280 return 0;
1281 }
1282 }
1283
1284 static int dav_parse_bool_expr(DavQLStatement *stmt, DavQLToken *token,
1285 DavQLExpression *expr) {
1286
1287 // RULE: "not ", LogicalExpression
1288 if (token_is(token, DAVQL_TOKEN_OPERATOR) && tokenvalue_is(token, "not")) {
1289 expr->type = DAVQL_LOGICAL;
1290 expr->op = DAVQL_NOT;
1291 dqlsec_mallocz(stmt, expr->left, DavQLExpression);
1292 expr->srctext = token_sstr(token);
1293
1294 token = token->next;
1295 int consumed = dav_parse_bool_expr(stmt, token, expr->left);
1296 if (stmt->errorcode) {
1297 return 0;
1298 }
1299 if (consumed) {
1300 cxstring lasttok = token_sstr((DavQLToken*)cx_linked_list_at(token, 0, offsetof(DavQLToken, next), consumed-1));
1301 expr->srctext.length =
1302 lasttok.ptr - expr->srctext.ptr + lasttok.length;
1303 return consumed + 1;
1304 } else {
1305 dav_error_in_context(DAVQL_ERROR_MISSING_EXPR,
1306 _error_missing_expr, stmt, token);
1307 return 0;
1308 }
1309 }
1310 // RULE: "(", LogicalExpression, ")"
1311 else if (token_is(token, DAVQL_TOKEN_OPENP)) {
1312 int consumed = dav_parse_logical_expr(stmt, token->next, expr);
1313 if (consumed) {
1314 token = cx_linked_list_at(token, 0, offsetof(DavQLToken, next), consumed);
1315
1316 if (token_is(token, DAVQL_TOKEN_CLOSEP)) {
1317 token = token->next;
1318 return consumed + 2;
1319 } else {
1320 dav_error_in_context(DAVQL_ERROR_MISSING_PAR, _error_missing_par,
1321 stmt, token);
1322 return 0;
1323 }
1324 } else {
1325 // don't handle errors here, we can also try a boolean primary
1326 stmt->errorcode = 0;
1327 if (stmt->errormessage) {
1328 free(stmt->errormessage);
1329 }
1330 }
1331 }
1332
1333 // RULE: BooleanPrimary
1334 return dav_parse_bool_prim(stmt, token, expr);
1335 }
1336
1337 static int dav_parse_logical_expr(DavQLStatement *stmt, DavQLToken *token,
1338 DavQLExpression *expr) {
1339
1340 DavQLToken *firsttoken = token;
1341 int total_consumed = 0;
1342
1343 // RULE: BooleanLiteral, [LogicalOperator, LogicalExpression];
1344 DavQLExpression left, right;
1345 memset(&left, 0, sizeof(DavQLExpression));
1346 int consumed = dav_parse_bool_expr(stmt, token, &left);
1347 if (stmt->errorcode) {
1348 return 0;
1349 }
1350 if (!consumed) {
1351 dav_error_in_context(DAVQL_ERROR_MISSING_EXPR,
1352 _error_missing_expr, stmt, token);
1353 return 0;
1354 }
1355 total_consumed += consumed;
1356 token = cx_linked_list_at(token, 0, offsetof(DavQLToken, next), consumed);
1357
1358 if (token_is(token, DAVQL_TOKEN_OPERATOR)) {
1359 expr->type = DAVQL_LOGICAL;
1360
1361 davqloperator_t op = DAVQL_NOOP;
1362 if (tokenvalue_is(token, "and")) {
1363 op = DAVQL_LAND;
1364 } else if (tokenvalue_is(token, "or")) {
1365 op = DAVQL_LOR;
1366 } else if (tokenvalue_is(token, "xor")) {
1367 op = DAVQL_LXOR;
1368 }
1369
1370 if (op == DAVQL_NOOP) {
1371 dav_error_in_context(DAVQL_ERROR_INVALID_LOGICAL_OP,
1372 _error_invalid_logical_op, stmt, token);
1373 return 0;
1374 } else {
1375 expr->op = op;
1376 total_consumed++;
1377 token = token->next;
1378
1379 memset(&right, 0, sizeof(DavQLExpression));
1380 consumed = dav_parse_logical_expr(stmt, token, &right);
1381 if (stmt->errorcode) {
1382 return 0;
1383 }
1384 if (!consumed) {
1385 dav_error_in_context(DAVQL_ERROR_MISSING_EXPR,
1386 _error_missing_expr, stmt, token);
1387 return 0;
1388 }
1389 total_consumed += consumed;
1390 token = cx_linked_list_at(token, 0, offsetof(DavQLToken, next), consumed);
1391
1392 dqlsec_malloc(stmt, expr->left, DavQLExpression);
1393 memcpy(expr->left, &left, sizeof(DavQLExpression));
1394 dqlsec_malloc(stmt, expr->right, DavQLExpression);
1395 memcpy(expr->right, &right, sizeof(DavQLExpression));
1396 }
1397 } else {
1398 memcpy(expr, &left, sizeof(DavQLExpression));
1399 }
1400
1401 // set type and recover source text
1402 if (total_consumed > 0) {
1403 expr->srctext.ptr = token_sstr(firsttoken).ptr;
1404 cxstring lasttok = token_sstr((DavQLToken*)cx_linked_list_at(firsttoken, 0, offsetof(DavQLToken, next), total_consumed-1));
1405 expr->srctext.length = lasttok.ptr-expr->srctext.ptr+lasttok.length;
1406 }
1407
1408 return total_consumed;
1409 }
1410
1411 static int dav_parse_where_clause(DavQLStatement *stmt, DavQLToken *token) {
1412 dqlsec_mallocz(stmt, stmt->where, DavQLExpression);
1413
1414 return dav_parse_logical_expr(stmt, token, stmt->where);
1415 }
1416
1417 static int dav_parse_with_clause(DavQLStatement *stmt, DavQLToken *token) {
1418
1419 int total_consumed = 0;
1420
1421 // RULE: "depth", "=", (Number | "infinity")
1422 if (tokenvalue_is(token, "depth")) {
1423 token = token->next; total_consumed++;
1424 if (tokenvalue_is(token, "=")) {
1425 token = token->next; total_consumed++;
1426 if (tokenvalue_is(token, "infinity")) {
1427 stmt->depth = DAV_DEPTH_INFINITY;
1428 token = token->next; total_consumed++;
1429 } else {
1430 DavQLExpression *depthexpr;
1431 dqlsec_mallocz(stmt, depthexpr, DavQLExpression);
1432
1433 int consumed = dav_parse_expression(stmt, token, depthexpr);
1434
1435 if (consumed) {
1436 if (depthexpr->type == DAVQL_NUMBER) {
1437 if (depthexpr->srctext.ptr[0] == '%') {
1438 stmt->depth = DAV_DEPTH_PLACEHOLDER;
1439 } else {
1440 cxstring depthstr = depthexpr->srctext;
1441 char *conv = malloc(depthstr.length+1);
1442 if (!conv) {
1443 dav_free_expression(depthexpr);
1444 stmt->errorcode = DAVQL_ERROR_OUT_OF_MEMORY;
1445 return 0;
1446 }
1447 char *chk;
1448 memcpy(conv, depthstr.ptr, depthstr.length);
1449 conv[depthstr.length] = '\0';
1450 stmt->depth = strtol(conv, &chk, 10);
1451 if (*chk || stmt->depth < -1) {
1452 dav_error_in_context(DAVQL_ERROR_INVALID_DEPTH,
1453 _error_invalid_depth, stmt, token);
1454 }
1455 free(conv);
1456 }
1457 total_consumed += consumed;
1458 } else {
1459 dav_error_in_context(DAVQL_ERROR_INVALID_DEPTH,
1460 _error_invalid_depth, stmt, token);
1461 }
1462 }
1463
1464 dav_free_expression(depthexpr);
1465 }
1466 }
1467 }
1468
1469 return total_consumed;
1470 }
1471
1472 static int dav_parse_order_crit(DavQLStatement *stmt, DavQLToken *token,
1473 DavQLOrderCriterion *crit) {
1474
1475 // RULE: (Identifier | Number), [" asc"|" desc"];
1476 DavQLExpression expr;
1477 memset(&expr, 0, sizeof(DavQLExpression));
1478 int consumed = dav_parse_expression(stmt, token, &expr);
1479 if (stmt->errorcode || !consumed) {
1480 return 0;
1481 }
1482
1483 if (expr.type != DAVQL_IDENTIFIER && expr.type != DAVQL_NUMBER) {
1484 dav_error_in_context(DAVQL_ERROR_INVALID_ORDER_CRITERION,
1485 _error_invalid_order_criterion, stmt, token);
1486 return 0;
1487 }
1488
1489 dqlsec_malloc(stmt, crit->column, DavQLExpression);
1490 memcpy(crit->column, &expr, sizeof(DavQLExpression));
1491
1492 token = cx_linked_list_at(token, 0, offsetof(DavQLToken, next), consumed);
1493 if (token_is(token, DAVQL_TOKEN_KEYWORD) && (
1494 tokenvalue_is(token, "asc") || tokenvalue_is(token, "desc"))) {
1495
1496 crit->descending = tokenvalue_is(token, "desc");
1497
1498 return consumed+1;
1499 } else {
1500 crit->descending = 0;
1501 return consumed;
1502 }
1503 }
1504
1505 static int dav_parse_orderby_clause(DavQLStatement *stmt, DavQLToken *token) {
1506
1507 int total_consumed = 0, consumed;
1508
1509 DavQLOrderCriterion crit;
1510
1511 if(!stmt->orderby) {
1512 stmt->orderby = cxLinkedListCreateSimple(sizeof(DavQLOrderCriterion));
1513 if(!stmt->orderby) {
1514 return 0;
1515 }
1516 }
1517
1518 // RULE: OrderByCriterion, {",", OrderByCriterion};
1519 do {
1520 consumed = dav_parse_order_crit(stmt, token, &crit);
1521 if (stmt->errorcode) {
1522 return 0;
1523 }
1524 if (!consumed) {
1525 dav_error_in_context(DAVQL_ERROR_MISSING_EXPR, _error_missing_expr,
1526 stmt, token);
1527 return 0;
1528 }
1529 token = cx_linked_list_at(token, 0, offsetof(DavQLToken, next), consumed);
1530 total_consumed += consumed;
1531
1532 if(cxListAdd(stmt->orderby, &crit)) {
1533 stmt->errorcode = DAVQL_ERROR_OUT_OF_MEMORY;
1534 return 0;
1535 }
1536
1537 if (token_is(token, DAVQL_TOKEN_COMMA)) {
1538 total_consumed++;
1539 token = token->next;
1540 } else {
1541 consumed = 0;
1542 }
1543 } while (consumed);
1544
1545 return total_consumed;
1546 }
1547
1548
1549 static int dav_parse_assignments(DavQLStatement *stmt, DavQLToken *token) {
1550
1551 // RULE: Assignment, {",", Assignment}
1552 int total_consumed = 0, consumed;
1553 do {
1554 // RULE: Identifier, "=", Expression
1555 if (token_is(token, DAVQL_TOKEN_IDENTIFIER)) {
1556
1557 // Identifier
1558 DavQLField *field;
1559 dqlsec_malloc(stmt, field, DavQLField);
1560 field->name = token_sstr(token);
1561 total_consumed++;
1562 token = token->next;
1563
1564 // "="
1565 if (!token_is(token, DAVQL_TOKEN_OPERATOR)
1566 || !tokenvalue_is(token, "=")) {
1567 dav_free_field(field);
1568
1569 dav_error_in_context(DAVQL_ERROR_MISSING_ASSIGN,
1570 _error_missing_assign, stmt, token);
1571 return total_consumed;
1572 }
1573 total_consumed++;
1574 token = token->next;
1575
1576 // Expression
1577 dqlsec_mallocz(stmt, field->expr, DavQLExpression);
1578 consumed = dav_parse_expression(stmt, token, field->expr);
1579 if (stmt->errorcode) {
1580 dav_free_field(field);
1581 return total_consumed;
1582 }
1583 token = cx_linked_list_at(token, 0, offsetof(DavQLToken, next), consumed);
1584 total_consumed += consumed;
1585
1586 // Add assignment to list and check if there's another one
1587 if(dav_stmt_add_field(stmt, field)) {
1588 free(field);
1589 return 0;
1590 }
1591 consumed = token_is(token, DAVQL_TOKEN_COMMA) ? 1 : 0;
1592 if (consumed) {
1593 token = token->next;
1594 total_consumed++;
1595 }
1596 } else {
1597 dav_error_in_context(DAVQL_ERROR_MISSING_TOKEN,
1598 _error_missing_identifier, stmt, token);
1599 return total_consumed;
1600 }
1601 } while (consumed);
1602
1603 return total_consumed;
1604 }
1605
1606 static int dav_parse_path(DavQLStatement *stmt, DavQLToken *tokens) {
1607 if (token_is(tokens, DAVQL_TOKEN_STRING)) {
1608 stmt->path = token_sstr(tokens);
1609 tokens = tokens->next;
1610 return 1;
1611 } else if (token_is(tokens, DAVQL_TOKEN_OPERATOR)
1612 && tokenvalue_is(tokens, "/")) {
1613 stmt->path = token_sstr(tokens);
1614 tokens = tokens->next;
1615 int consumed = 1;
1616 while (!token_is(tokens, DAVQL_TOKEN_KEYWORD) &&
1617 !token_is(tokens, DAVQL_TOKEN_END)) {
1618 cxstring toksstr = token_sstr(tokens);
1619 stmt->path.length = toksstr.ptr-stmt->path.ptr+toksstr.length;
1620 tokens = tokens->next;
1621 consumed++;
1622 }
1623 return consumed;
1624 } else if (token_is(tokens, DAVQL_TOKEN_FMTSPEC) &&
1625 tokenvalue_is(tokens, "%s")) {
1626 stmt->path = token_sstr(tokens);
1627 tokens = tokens->next;
1628 fmt_args_add(stmt, (void*)(intptr_t)'s');
1629 return 1;
1630 } else {
1631 dav_error_in_context(DAVQL_ERROR_MISSING_TOKEN,
1632 _error_missing_path, stmt, tokens);
1633 return 0;
1634 }
1635 }
1636
1637 /**
1638 * Parser of a select statement.
1639 * @param stmt the statement object that shall contain the syntax tree
1640 * @param tokens the token list
1641 */
1642 static void dav_parse_select_statement(DavQLStatement *stmt, DavQLToken *tokens) {
1643 stmt->type = DAVQL_SELECT;
1644
1645 // Consume field list
1646 tokens = cx_linked_list_at(tokens, 0, offsetof(DavQLToken, next), dav_parse_fieldlist(stmt, tokens));
1647 if (stmt->errorcode) {
1648 return;
1649 }
1650
1651 // Consume FROM keyword
1652 if (token_is(tokens, DAVQL_TOKEN_KEYWORD)
1653 && tokenvalue_is(tokens, "from")) {
1654 tokens = tokens->next;
1655 } else {
1656 dav_error_in_context(DAVQL_ERROR_MISSING_TOKEN,
1657 _error_missing_from, stmt, tokens);
1658 return;
1659 }
1660
1661 // Consume path
1662 tokens = cx_linked_list_at(tokens, 0, offsetof(DavQLToken, next), dav_parse_path(stmt, tokens));
1663 if (stmt->errorcode) {
1664 return;
1665 }
1666 //dav_add_fmt_args(stmt, stmt->path); // add possible path args
1667
1668 // Consume with clause (if any)
1669 if (token_is(tokens, DAVQL_TOKEN_KEYWORD)
1670 && tokenvalue_is(tokens, "with")) {
1671 tokens = tokens->next;
1672 tokens = cx_linked_list_at(tokens, 0, offsetof(DavQLToken, next),
1673 dav_parse_with_clause(stmt, tokens));
1674 }
1675 if (stmt->errorcode) {
1676 return;
1677 }
1678
1679 // Consume where clause (if any)
1680 if (token_is(tokens, DAVQL_TOKEN_KEYWORD)
1681 && tokenvalue_is(tokens, "where")) {
1682 tokens = tokens->next;
1683 tokens = cx_linked_list_at(tokens, 0, offsetof(DavQLToken, next),
1684 dav_parse_where_clause(stmt, tokens));
1685 } else if (token_is(tokens, DAVQL_TOKEN_KEYWORD)
1686 && tokenvalue_is(tokens, "anywhere")) {
1687 // useless, but the user may want to explicitly express his intent
1688 tokens = tokens->next;
1689 stmt->where = NULL;
1690 }
1691 if (stmt->errorcode) {
1692 return;
1693 }
1694
1695 // Consume order by clause (if any)
1696 if (token_is(tokens, DAVQL_TOKEN_KEYWORD)
1697 && tokenvalue_is(tokens, "order")) {
1698 tokens = tokens->next;
1699 if (token_is(tokens, DAVQL_TOKEN_KEYWORD)
1700 && tokenvalue_is(tokens, "by")) {
1701 tokens = tokens->next;
1702 tokens = cx_linked_list_at(tokens, 0, offsetof(DavQLToken, next),
1703 dav_parse_orderby_clause(stmt, tokens));
1704 } else {
1705 dav_error_in_context(DAVQL_ERROR_MISSING_TOKEN,
1706 _error_missing_by, stmt, tokens);
1707 return;
1708 }
1709 }
1710 if (stmt->errorcode) {
1711 return;
1712 }
1713
1714
1715 if (tokens) {
1716 if (token_is(tokens, DAVQL_TOKEN_INVALID)) {
1717 dav_error_in_context(DAVQL_ERROR_INVALID_TOKEN,
1718 _error_invalid_token, stmt, tokens);
1719 } else if (!token_is(tokens, DAVQL_TOKEN_END)) {
1720 dav_error_in_context(DAVQL_ERROR_UNEXPECTED_TOKEN,
1721 _error_unexpected_token, stmt, tokens);
1722 }
1723 }
1724 }
1725
1726 static void dav_parse_set_statement(DavQLStatement *stmt, DavQLToken *tokens) {
1727 stmt->type = DAVQL_SET;
1728
1729 // Consume assignments
1730 tokens = cx_linked_list_at(tokens, 0, offsetof(DavQLToken, next), dav_parse_assignments(stmt, tokens));
1731 if (stmt->errorcode) {
1732 return;
1733 }
1734
1735 // Consume AT keyword
1736 if (token_is(tokens, DAVQL_TOKEN_KEYWORD)
1737 && tokenvalue_is(tokens, "at")) {
1738 tokens = tokens->next;
1739 } else {
1740 dav_error_in_context(DAVQL_ERROR_MISSING_TOKEN,
1741 _error_missing_at, stmt, tokens);
1742 return;
1743 }
1744
1745 // Consume path
1746 tokens = cx_linked_list_at(tokens, 0, offsetof(DavQLToken, next), dav_parse_path(stmt, tokens));
1747 if (stmt->errorcode) {
1748 return;
1749 }
1750
1751 // Consume with clause (if any)
1752 if (token_is(tokens, DAVQL_TOKEN_KEYWORD)
1753 && tokenvalue_is(tokens, "with")) {
1754 tokens = tokens->next;
1755 tokens = cx_linked_list_at(tokens, 0, offsetof(DavQLToken, next),
1756 dav_parse_with_clause(stmt, tokens));
1757 }
1758 if (stmt->errorcode) {
1759 return;
1760 }
1761
1762 // Consume mandatory where clause (or anywhere keyword)
1763 if (token_is(tokens, DAVQL_TOKEN_KEYWORD)
1764 && tokenvalue_is(tokens, "where")) {
1765 tokens = tokens->next;
1766 tokens = cx_linked_list_at(tokens, 0, offsetof(DavQLToken, next),
1767 dav_parse_where_clause(stmt, tokens));
1768 } else if (token_is(tokens, DAVQL_TOKEN_KEYWORD)
1769 && tokenvalue_is(tokens, "anywhere")) {
1770 // no-op, but we want the user to be explicit about this
1771 tokens = tokens->next;
1772 stmt->where = NULL;
1773 } else {
1774 dav_error_in_context(DAVQL_ERROR_MISSING_TOKEN,
1775 _error_missing_where, stmt, tokens);
1776 return;
1777 }
1778 }
1779
1780 DavQLStatement* dav_parse_statement(cxstring srctext) {
1781 DavQLStatement *stmt = calloc(1, sizeof(DavQLStatement));
1782
1783 // if we can't even get enough memory for the statement object or an error
1784 // message, we can simply die without returning anything
1785 if (!stmt) {
1786 return NULL;
1787 }
1788 char *oommsg = strdup(_error_out_of_memory);
1789 if (!oommsg) {
1790 free(stmt);
1791 return NULL;
1792 }
1793
1794 // default values
1795 stmt->type = -1;
1796 stmt->depth = 1;
1797
1798 // save trimmed source text
1799 stmt->srctext = cx_strtrim(srctext);
1800
1801 if (stmt->srctext.length) {
1802 // tokenization
1803 DavQLToken* tokens = dav_parse_tokenize(stmt->srctext);
1804
1805 if (tokens) {
1806 // use first token to determine query type
1807
1808 if (tokenvalue_is(tokens, "select")) {
1809 dav_parse_select_statement(stmt, tokens->next);
1810 } else if (tokenvalue_is(tokens, "set")) {
1811 dav_parse_set_statement(stmt, tokens->next);
1812 } else {
1813 stmt->type = DAVQL_ERROR;
1814 stmt->errorcode = DAVQL_ERROR_INVALID;
1815 stmt->errormessage = strdup(_error_invalid);
1816 }
1817
1818 // free token data
1819 tokenlist_free(tokens);
1820 } else {
1821 stmt->errorcode = DAVQL_ERROR_OUT_OF_MEMORY;
1822 }
1823 } else {
1824 stmt->type = DAVQL_ERROR;
1825 stmt->errorcode = DAVQL_ERROR_INVALID;
1826 stmt->errormessage = strdup(_error_invalid);
1827 }
1828
1829 if (stmt->errorcode == DAVQL_ERROR_OUT_OF_MEMORY) {
1830 stmt->type = DAVQL_ERROR;
1831 stmt->errormessage = oommsg;
1832 } else {
1833 free(oommsg);
1834 }
1835
1836 return stmt;
1837 }
1838
1839 void dav_free_statement(DavQLStatement *stmt) {
1840 if(stmt->fields) {
1841 stmt->fields->simple_destructor = (cx_destructor_func)dav_free_field;
1842 cxListDestroy(stmt->fields);
1843 }
1844
1845 if (stmt->where) {
1846 dav_free_expression(stmt->where);
1847 }
1848 if (stmt->errormessage) {
1849 free(stmt->errormessage);
1850 }
1851
1852 if(stmt->orderby) {
1853 stmt->orderby->simple_destructor = (cx_destructor_func)dav_free_order_criterion;
1854 cxListDestroy(stmt->orderby);
1855 }
1856 if(stmt->args) {
1857 cxListDestroy(stmt->args);
1858 }
1859 free(stmt);
1860 }

mercurial