123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146 |
- /*
- * sfparse
- *
- * Copyright (c) 2023 sfparse contributors
- * Copyright (c) 2019 nghttp3 contributors
- * Copyright (c) 2015 nghttp2 contributors
- *
- * Permission is hereby granted, free of charge, to any person obtaining
- * a copy of this software and associated documentation files (the
- * "Software"), to deal in the Software without restriction, including
- * without limitation the rights to use, copy, modify, merge, publish,
- * distribute, sublicense, and/or sell copies of the Software, and to
- * permit persons to whom the Software is furnished to do so, subject to
- * the following conditions:
- *
- * The above copyright notice and this permission notice shall be
- * included in all copies or substantial portions of the Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
- * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
- * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
- * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
- * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
- * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
- * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
- */
- #include "sfparse.h"
- #include <string.h>
- #include <assert.h>
- #include <stdlib.h>
- #define SF_STATE_DICT 0x08u
- #define SF_STATE_LIST 0x10u
- #define SF_STATE_ITEM 0x18u
- #define SF_STATE_INNER_LIST 0x04u
- #define SF_STATE_BEFORE 0x00u
- #define SF_STATE_BEFORE_PARAMS 0x01u
- #define SF_STATE_PARAMS 0x02u
- #define SF_STATE_AFTER 0x03u
- #define SF_STATE_OP_MASK 0x03u
- #define SF_SET_STATE_AFTER(NAME) (SF_STATE_##NAME | SF_STATE_AFTER)
- #define SF_SET_STATE_BEFORE_PARAMS(NAME) \
- (SF_STATE_##NAME | SF_STATE_BEFORE_PARAMS)
- #define SF_SET_STATE_INNER_LIST_BEFORE(NAME) \
- (SF_STATE_##NAME | SF_STATE_INNER_LIST | SF_STATE_BEFORE)
- #define SF_STATE_DICT_AFTER SF_SET_STATE_AFTER(DICT)
- #define SF_STATE_DICT_BEFORE_PARAMS SF_SET_STATE_BEFORE_PARAMS(DICT)
- #define SF_STATE_DICT_INNER_LIST_BEFORE SF_SET_STATE_INNER_LIST_BEFORE(DICT)
- #define SF_STATE_LIST_AFTER SF_SET_STATE_AFTER(LIST)
- #define SF_STATE_LIST_BEFORE_PARAMS SF_SET_STATE_BEFORE_PARAMS(LIST)
- #define SF_STATE_LIST_INNER_LIST_BEFORE SF_SET_STATE_INNER_LIST_BEFORE(LIST)
- #define SF_STATE_ITEM_AFTER SF_SET_STATE_AFTER(ITEM)
- #define SF_STATE_ITEM_BEFORE_PARAMS SF_SET_STATE_BEFORE_PARAMS(ITEM)
- #define SF_STATE_ITEM_INNER_LIST_BEFORE SF_SET_STATE_INNER_LIST_BEFORE(ITEM)
- #define SF_STATE_INITIAL 0x00u
- #define DIGIT_CASES \
- case '0': \
- case '1': \
- case '2': \
- case '3': \
- case '4': \
- case '5': \
- case '6': \
- case '7': \
- case '8': \
- case '9'
- #define LCALPHA_CASES \
- case 'a': \
- case 'b': \
- case 'c': \
- case 'd': \
- case 'e': \
- case 'f': \
- case 'g': \
- case 'h': \
- case 'i': \
- case 'j': \
- case 'k': \
- case 'l': \
- case 'm': \
- case 'n': \
- case 'o': \
- case 'p': \
- case 'q': \
- case 'r': \
- case 's': \
- case 't': \
- case 'u': \
- case 'v': \
- case 'w': \
- case 'x': \
- case 'y': \
- case 'z'
- #define UCALPHA_CASES \
- case 'A': \
- case 'B': \
- case 'C': \
- case 'D': \
- case 'E': \
- case 'F': \
- case 'G': \
- case 'H': \
- case 'I': \
- case 'J': \
- case 'K': \
- case 'L': \
- case 'M': \
- case 'N': \
- case 'O': \
- case 'P': \
- case 'Q': \
- case 'R': \
- case 'S': \
- case 'T': \
- case 'U': \
- case 'V': \
- case 'W': \
- case 'X': \
- case 'Y': \
- case 'Z'
- #define ALPHA_CASES \
- UCALPHA_CASES: \
- LCALPHA_CASES
- #define X20_21_CASES \
- case ' ': \
- case '!'
- #define X23_5B_CASES \
- case '#': \
- case '$': \
- case '%': \
- case '&': \
- case '\'': \
- case '(': \
- case ')': \
- case '*': \
- case '+': \
- case ',': \
- case '-': \
- case '.': \
- case '/': \
- DIGIT_CASES: \
- case ':': \
- case ';': \
- case '<': \
- case '=': \
- case '>': \
- case '?': \
- case '@': \
- UCALPHA_CASES: \
- case '['
- #define X5D_7E_CASES \
- case ']': \
- case '^': \
- case '_': \
- case '`': \
- LCALPHA_CASES: \
- case '{': \
- case '|': \
- case '}': \
- case '~'
- static int is_ws(uint8_t c) {
- switch (c) {
- case ' ':
- case '\t':
- return 1;
- default:
- return 0;
- }
- }
- static int parser_eof(sf_parser *sfp) { return sfp->pos == sfp->end; }
- static void parser_discard_ows(sf_parser *sfp) {
- for (; !parser_eof(sfp) && is_ws(*sfp->pos); ++sfp->pos)
- ;
- }
- static void parser_discard_sp(sf_parser *sfp) {
- for (; !parser_eof(sfp) && *sfp->pos == ' '; ++sfp->pos)
- ;
- }
- static void parser_set_op_state(sf_parser *sfp, uint32_t op) {
- sfp->state &= ~SF_STATE_OP_MASK;
- sfp->state |= op;
- }
- static void parser_unset_inner_list_state(sf_parser *sfp) {
- sfp->state &= ~SF_STATE_INNER_LIST;
- }
- static int parser_key(sf_parser *sfp, sf_vec *dest) {
- const uint8_t *base;
- switch (*sfp->pos) {
- case '*':
- LCALPHA_CASES:
- break;
- default:
- return SF_ERR_PARSE_ERROR;
- }
- base = sfp->pos++;
- for (; !parser_eof(sfp); ++sfp->pos) {
- switch (*sfp->pos) {
- case '_':
- case '-':
- case '.':
- case '*':
- DIGIT_CASES:
- LCALPHA_CASES:
- continue;
- }
- break;
- }
- if (dest) {
- dest->base = (uint8_t *)base;
- dest->len = (size_t)(sfp->pos - dest->base);
- }
- return 0;
- }
- static int parser_number(sf_parser *sfp, sf_value *dest) {
- int sign = 1;
- int64_t value = 0;
- size_t len = 0;
- size_t fpos = 0;
- if (*sfp->pos == '-') {
- ++sfp->pos;
- if (parser_eof(sfp)) {
- return SF_ERR_PARSE_ERROR;
- }
- sign = -1;
- }
- assert(!parser_eof(sfp));
- for (; !parser_eof(sfp); ++sfp->pos) {
- switch (*sfp->pos) {
- DIGIT_CASES:
- if (++len > 15) {
- return SF_ERR_PARSE_ERROR;
- }
- value *= 10;
- value += *sfp->pos - '0';
- continue;
- }
- break;
- }
- if (len == 0) {
- return SF_ERR_PARSE_ERROR;
- }
- if (parser_eof(sfp) || *sfp->pos != '.') {
- if (dest) {
- dest->type = SF_TYPE_INTEGER;
- dest->flags = SF_VALUE_FLAG_NONE;
- dest->integer = value * sign;
- }
- return 0;
- }
- /* decimal */
- if (len > 12) {
- return SF_ERR_PARSE_ERROR;
- }
- fpos = len;
- ++sfp->pos;
- for (; !parser_eof(sfp); ++sfp->pos) {
- switch (*sfp->pos) {
- DIGIT_CASES:
- if (++len > 15) {
- return SF_ERR_PARSE_ERROR;
- }
- value *= 10;
- value += *sfp->pos - '0';
- continue;
- }
- break;
- }
- if (fpos == len || len - fpos > 3) {
- return SF_ERR_PARSE_ERROR;
- }
- if (dest) {
- dest->type = SF_TYPE_DECIMAL;
- dest->flags = SF_VALUE_FLAG_NONE;
- dest->decimal.numer = value * sign;
- switch (len - fpos) {
- case 1:
- dest->decimal.denom = 10;
- break;
- case 2:
- dest->decimal.denom = 100;
- break;
- case 3:
- dest->decimal.denom = 1000;
- break;
- }
- }
- return 0;
- }
- static int parser_date(sf_parser *sfp, sf_value *dest) {
- int rv;
- sf_value val;
- /* The first byte has already been validated by the caller. */
- assert('@' == *sfp->pos);
- ++sfp->pos;
- if (parser_eof(sfp)) {
- return SF_ERR_PARSE_ERROR;
- }
- rv = parser_number(sfp, &val);
- if (rv != 0) {
- return rv;
- }
- if (val.type != SF_TYPE_INTEGER) {
- return SF_ERR_PARSE_ERROR;
- }
- if (dest) {
- *dest = val;
- dest->type = SF_TYPE_DATE;
- }
- return 0;
- }
- static int parser_string(sf_parser *sfp, sf_value *dest) {
- const uint8_t *base;
- uint32_t flags = SF_VALUE_FLAG_NONE;
- /* The first byte has already been validated by the caller. */
- assert('"' == *sfp->pos);
- base = ++sfp->pos;
- for (; !parser_eof(sfp); ++sfp->pos) {
- switch (*sfp->pos) {
- X20_21_CASES:
- X23_5B_CASES:
- X5D_7E_CASES:
- break;
- case '\\':
- ++sfp->pos;
- if (parser_eof(sfp)) {
- return SF_ERR_PARSE_ERROR;
- }
- switch (*sfp->pos) {
- case '"':
- case '\\':
- flags = SF_VALUE_FLAG_ESCAPED_STRING;
- break;
- default:
- return SF_ERR_PARSE_ERROR;
- }
- break;
- case '"':
- if (dest) {
- dest->type = SF_TYPE_STRING;
- dest->flags = flags;
- dest->vec.len = (size_t)(sfp->pos - base);
- dest->vec.base = dest->vec.len == 0 ? NULL : (uint8_t *)base;
- }
- ++sfp->pos;
- return 0;
- default:
- return SF_ERR_PARSE_ERROR;
- }
- }
- return SF_ERR_PARSE_ERROR;
- }
- static int parser_token(sf_parser *sfp, sf_value *dest) {
- const uint8_t *base;
- /* The first byte has already been validated by the caller. */
- base = sfp->pos++;
- for (; !parser_eof(sfp); ++sfp->pos) {
- switch (*sfp->pos) {
- case '!':
- case '#':
- case '$':
- case '%':
- case '&':
- case '\'':
- case '*':
- case '+':
- case '-':
- case '.':
- case '^':
- case '_':
- case '`':
- case '|':
- case '~':
- case ':':
- case '/':
- DIGIT_CASES:
- ALPHA_CASES:
- continue;
- }
- break;
- }
- if (dest) {
- dest->type = SF_TYPE_TOKEN;
- dest->flags = SF_VALUE_FLAG_NONE;
- dest->vec.base = (uint8_t *)base;
- dest->vec.len = (size_t)(sfp->pos - base);
- }
- return 0;
- }
- static int parser_byteseq(sf_parser *sfp, sf_value *dest) {
- const uint8_t *base;
- /* The first byte has already been validated by the caller. */
- assert(':' == *sfp->pos);
- base = ++sfp->pos;
- for (; !parser_eof(sfp); ++sfp->pos) {
- switch (*sfp->pos) {
- case '+':
- case '/':
- DIGIT_CASES:
- ALPHA_CASES:
- continue;
- case '=':
- switch ((sfp->pos - base) & 0x3) {
- case 0:
- case 1:
- return SF_ERR_PARSE_ERROR;
- case 2:
- switch (*(sfp->pos - 1)) {
- case 'A':
- case 'Q':
- case 'g':
- case 'w':
- break;
- default:
- return SF_ERR_PARSE_ERROR;
- }
- ++sfp->pos;
- if (parser_eof(sfp) || *sfp->pos != '=') {
- return SF_ERR_PARSE_ERROR;
- }
- break;
- case 3:
- switch (*(sfp->pos - 1)) {
- case 'A':
- case 'E':
- case 'I':
- case 'M':
- case 'Q':
- case 'U':
- case 'Y':
- case 'c':
- case 'g':
- case 'k':
- case 'o':
- case 's':
- case 'w':
- case '0':
- case '4':
- case '8':
- break;
- default:
- return SF_ERR_PARSE_ERROR;
- }
- break;
- }
- ++sfp->pos;
- if (parser_eof(sfp) || *sfp->pos != ':') {
- return SF_ERR_PARSE_ERROR;
- }
- goto fin;
- case ':':
- if ((sfp->pos - base) & 0x3) {
- return SF_ERR_PARSE_ERROR;
- }
- goto fin;
- default:
- return SF_ERR_PARSE_ERROR;
- }
- }
- return SF_ERR_PARSE_ERROR;
- fin:
- if (dest) {
- dest->type = SF_TYPE_BYTESEQ;
- dest->flags = SF_VALUE_FLAG_NONE;
- dest->vec.len = (size_t)(sfp->pos - base);
- dest->vec.base = dest->vec.len == 0 ? NULL : (uint8_t *)base;
- }
- ++sfp->pos;
- return 0;
- }
- static int parser_boolean(sf_parser *sfp, sf_value *dest) {
- int b;
- /* The first byte has already been validated by the caller. */
- assert('?' == *sfp->pos);
- ++sfp->pos;
- if (parser_eof(sfp)) {
- return SF_ERR_PARSE_ERROR;
- }
- switch (*sfp->pos) {
- case '0':
- b = 0;
- break;
- case '1':
- b = 1;
- break;
- default:
- return SF_ERR_PARSE_ERROR;
- }
- ++sfp->pos;
- if (dest) {
- dest->type = SF_TYPE_BOOLEAN;
- dest->flags = SF_VALUE_FLAG_NONE;
- dest->boolean = b;
- }
- return 0;
- }
- static int parser_bare_item(sf_parser *sfp, sf_value *dest) {
- switch (*sfp->pos) {
- case '"':
- return parser_string(sfp, dest);
- case '-':
- DIGIT_CASES:
- return parser_number(sfp, dest);
- case '@':
- return parser_date(sfp, dest);
- case ':':
- return parser_byteseq(sfp, dest);
- case '?':
- return parser_boolean(sfp, dest);
- case '*':
- ALPHA_CASES:
- return parser_token(sfp, dest);
- default:
- return SF_ERR_PARSE_ERROR;
- }
- }
- static int parser_skip_inner_list(sf_parser *sfp);
- int sf_parser_param(sf_parser *sfp, sf_vec *dest_key, sf_value *dest_value) {
- int rv;
- switch (sfp->state & SF_STATE_OP_MASK) {
- case SF_STATE_BEFORE:
- rv = parser_skip_inner_list(sfp);
- if (rv != 0) {
- return rv;
- }
- /* fall through */
- case SF_STATE_BEFORE_PARAMS:
- parser_set_op_state(sfp, SF_STATE_PARAMS);
- break;
- case SF_STATE_PARAMS:
- break;
- default:
- assert(0);
- abort();
- }
- if (parser_eof(sfp) || *sfp->pos != ';') {
- parser_set_op_state(sfp, SF_STATE_AFTER);
- return SF_ERR_EOF;
- }
- ++sfp->pos;
- parser_discard_sp(sfp);
- if (parser_eof(sfp)) {
- return SF_ERR_PARSE_ERROR;
- }
- rv = parser_key(sfp, dest_key);
- if (rv != 0) {
- return rv;
- }
- if (parser_eof(sfp) || *sfp->pos != '=') {
- if (dest_value) {
- dest_value->type = SF_TYPE_BOOLEAN;
- dest_value->flags = SF_VALUE_FLAG_NONE;
- dest_value->boolean = 1;
- }
- return 0;
- }
- ++sfp->pos;
- if (parser_eof(sfp)) {
- return SF_ERR_PARSE_ERROR;
- }
- return parser_bare_item(sfp, dest_value);
- }
- static int parser_skip_params(sf_parser *sfp) {
- int rv;
- for (;;) {
- rv = sf_parser_param(sfp, NULL, NULL);
- switch (rv) {
- case 0:
- break;
- case SF_ERR_EOF:
- return 0;
- case SF_ERR_PARSE_ERROR:
- return rv;
- default:
- assert(0);
- abort();
- }
- }
- }
- int sf_parser_inner_list(sf_parser *sfp, sf_value *dest) {
- int rv;
- switch (sfp->state & SF_STATE_OP_MASK) {
- case SF_STATE_BEFORE:
- parser_discard_sp(sfp);
- if (parser_eof(sfp)) {
- return SF_ERR_PARSE_ERROR;
- }
- break;
- case SF_STATE_BEFORE_PARAMS:
- rv = parser_skip_params(sfp);
- if (rv != 0) {
- return rv;
- }
- /* Technically, we are entering SF_STATE_AFTER, but we will set
- another state without reading the state. */
- /* parser_set_op_state(sfp, SF_STATE_AFTER); */
- /* fall through */
- case SF_STATE_AFTER:
- if (parser_eof(sfp)) {
- return SF_ERR_PARSE_ERROR;
- }
- switch (*sfp->pos) {
- case ' ':
- parser_discard_sp(sfp);
- if (parser_eof(sfp)) {
- return SF_ERR_PARSE_ERROR;
- }
- break;
- case ')':
- break;
- default:
- return SF_ERR_PARSE_ERROR;
- }
- break;
- default:
- assert(0);
- abort();
- }
- if (*sfp->pos == ')') {
- ++sfp->pos;
- parser_unset_inner_list_state(sfp);
- parser_set_op_state(sfp, SF_STATE_BEFORE_PARAMS);
- return SF_ERR_EOF;
- }
- rv = parser_bare_item(sfp, dest);
- if (rv != 0) {
- return rv;
- }
- parser_set_op_state(sfp, SF_STATE_BEFORE_PARAMS);
- return 0;
- }
- static int parser_skip_inner_list(sf_parser *sfp) {
- int rv;
- for (;;) {
- rv = sf_parser_inner_list(sfp, NULL);
- switch (rv) {
- case 0:
- break;
- case SF_ERR_EOF:
- return 0;
- case SF_ERR_PARSE_ERROR:
- return rv;
- default:
- assert(0);
- abort();
- }
- }
- }
- static int parser_next_key_or_item(sf_parser *sfp) {
- parser_discard_ows(sfp);
- if (parser_eof(sfp)) {
- return SF_ERR_EOF;
- }
- if (*sfp->pos != ',') {
- return SF_ERR_PARSE_ERROR;
- }
- ++sfp->pos;
- parser_discard_ows(sfp);
- if (parser_eof(sfp)) {
- return SF_ERR_PARSE_ERROR;
- }
- return 0;
- }
- static int parser_dict_value(sf_parser *sfp, sf_value *dest) {
- int rv;
- if (parser_eof(sfp) || *(sfp->pos) != '=') {
- /* Boolean true */
- if (dest) {
- dest->type = SF_TYPE_BOOLEAN;
- dest->flags = SF_VALUE_FLAG_NONE;
- dest->boolean = 1;
- }
- sfp->state = SF_STATE_DICT_BEFORE_PARAMS;
- return 0;
- }
- ++sfp->pos;
- if (parser_eof(sfp)) {
- return SF_ERR_PARSE_ERROR;
- }
- if (*sfp->pos == '(') {
- if (dest) {
- dest->type = SF_TYPE_INNER_LIST;
- dest->flags = SF_VALUE_FLAG_NONE;
- }
- ++sfp->pos;
- sfp->state = SF_STATE_DICT_INNER_LIST_BEFORE;
- return 0;
- }
- rv = parser_bare_item(sfp, dest);
- if (rv != 0) {
- return rv;
- }
- sfp->state = SF_STATE_DICT_BEFORE_PARAMS;
- return 0;
- }
- int sf_parser_dict(sf_parser *sfp, sf_vec *dest_key, sf_value *dest_value) {
- int rv;
- switch (sfp->state) {
- case SF_STATE_DICT_INNER_LIST_BEFORE:
- rv = parser_skip_inner_list(sfp);
- if (rv != 0) {
- return rv;
- }
- /* fall through */
- case SF_STATE_DICT_BEFORE_PARAMS:
- rv = parser_skip_params(sfp);
- if (rv != 0) {
- return rv;
- }
- /* fall through */
- case SF_STATE_DICT_AFTER:
- rv = parser_next_key_or_item(sfp);
- if (rv != 0) {
- return rv;
- }
- break;
- case SF_STATE_INITIAL:
- parser_discard_sp(sfp);
- if (parser_eof(sfp)) {
- return SF_ERR_EOF;
- }
- break;
- default:
- assert(0);
- abort();
- }
- rv = parser_key(sfp, dest_key);
- if (rv != 0) {
- return rv;
- }
- return parser_dict_value(sfp, dest_value);
- }
- int sf_parser_list(sf_parser *sfp, sf_value *dest) {
- int rv;
- switch (sfp->state) {
- case SF_STATE_LIST_INNER_LIST_BEFORE:
- rv = parser_skip_inner_list(sfp);
- if (rv != 0) {
- return rv;
- }
- /* fall through */
- case SF_STATE_LIST_BEFORE_PARAMS:
- rv = parser_skip_params(sfp);
- if (rv != 0) {
- return rv;
- }
- /* fall through */
- case SF_STATE_LIST_AFTER:
- rv = parser_next_key_or_item(sfp);
- if (rv != 0) {
- return rv;
- }
- break;
- case SF_STATE_INITIAL:
- parser_discard_sp(sfp);
- if (parser_eof(sfp)) {
- return SF_ERR_EOF;
- }
- break;
- default:
- assert(0);
- abort();
- }
- if (*sfp->pos == '(') {
- if (dest) {
- dest->type = SF_TYPE_INNER_LIST;
- dest->flags = SF_VALUE_FLAG_NONE;
- }
- ++sfp->pos;
- sfp->state = SF_STATE_LIST_INNER_LIST_BEFORE;
- return 0;
- }
- rv = parser_bare_item(sfp, dest);
- if (rv != 0) {
- return rv;
- }
- sfp->state = SF_STATE_LIST_BEFORE_PARAMS;
- return 0;
- }
- int sf_parser_item(sf_parser *sfp, sf_value *dest) {
- int rv;
- switch (sfp->state) {
- case SF_STATE_INITIAL:
- parser_discard_sp(sfp);
- if (parser_eof(sfp)) {
- return SF_ERR_PARSE_ERROR;
- }
- break;
- case SF_STATE_ITEM_INNER_LIST_BEFORE:
- rv = parser_skip_inner_list(sfp);
- if (rv != 0) {
- return rv;
- }
- /* fall through */
- case SF_STATE_ITEM_BEFORE_PARAMS:
- rv = parser_skip_params(sfp);
- if (rv != 0) {
- return rv;
- }
- /* fall through */
- case SF_STATE_ITEM_AFTER:
- parser_discard_sp(sfp);
- if (!parser_eof(sfp)) {
- return SF_ERR_PARSE_ERROR;
- }
- return SF_ERR_EOF;
- default:
- assert(0);
- abort();
- }
- if (*sfp->pos == '(') {
- if (dest) {
- dest->type = SF_TYPE_INNER_LIST;
- dest->flags = SF_VALUE_FLAG_NONE;
- }
- ++sfp->pos;
- sfp->state = SF_STATE_ITEM_INNER_LIST_BEFORE;
- return 0;
- }
- rv = parser_bare_item(sfp, dest);
- if (rv != 0) {
- return rv;
- }
- sfp->state = SF_STATE_ITEM_BEFORE_PARAMS;
- return 0;
- }
- void sf_parser_init(sf_parser *sfp, const uint8_t *data, size_t datalen) {
- if (datalen == 0) {
- sfp->pos = sfp->end = NULL;
- } else {
- sfp->pos = data;
- sfp->end = data + datalen;
- }
- sfp->state = SF_STATE_INITIAL;
- }
- void sf_unescape(sf_vec *dest, const sf_vec *src) {
- const uint8_t *p, *q;
- uint8_t *o;
- size_t len, slen;
- if (src->len == 0) {
- *dest = *src;
- return;
- }
- o = dest->base;
- p = src->base;
- len = src->len;
- for (;;) {
- q = memchr(p, '\\', len);
- if (q == NULL) {
- if (len == src->len) {
- *dest = *src;
- return;
- }
- memcpy(o, p, len);
- o += len;
- break;
- }
- slen = (size_t)(q - p);
- memcpy(o, p, slen);
- o += slen;
- p = q + 1;
- *o++ = *p++;
- len -= slen + 2;
- }
- dest->len = (size_t)(o - dest->base);
- }
- void sf_base64decode(sf_vec *dest, const sf_vec *src) {
- static const int index_tbl[] = {
- -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
- -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
- -1, -1, -1, -1, -1, -1, -1, 62, -1, -1, -1, 63, 52, 53, 54, 55, 56, 57,
- 58, 59, 60, 61, -1, -1, -1, -1, -1, -1, -1, 0, 1, 2, 3, 4, 5, 6,
- 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24,
- 25, -1, -1, -1, -1, -1, -1, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36,
- 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, -1, -1, -1,
- -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
- -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
- -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
- -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
- -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
- -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
- -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
- -1, -1, -1, -1};
- uint8_t *o;
- const uint8_t *p, *end;
- uint32_t n;
- size_t i;
- int idx;
- assert((src->len & 0x3) == 0);
- if (src->len == 0) {
- *dest = *src;
- return;
- }
- o = dest->base;
- p = src->base;
- end = src->base + src->len;
- for (; p != end;) {
- n = 0;
- for (i = 1; i <= 4; ++i, ++p) {
- idx = index_tbl[*p];
- if (idx == -1) {
- assert(i > 2);
- if (i == 3) {
- assert(*p == '=' && *(p + 1) == '=' && p + 2 == end);
- *o++ = (uint8_t)(n >> 16);
- goto fin;
- }
- assert(*p == '=' && p + 1 == end);
- *o++ = (uint8_t)(n >> 16);
- *o++ = (n >> 8) & 0xffu;
- goto fin;
- }
- n += (uint32_t)(idx << (24 - i * 6));
- }
- *o++ = (uint8_t)(n >> 16);
- *o++ = (n >> 8) & 0xffu;
- *o++ = n & 0xffu;
- }
- fin:
- dest->len = (size_t)(o - dest->base);
- }
|