/* server/src/util/parser.c */

#ifdef _MSC_VER
#include <platform.h>
#endif
#include "parser.h"
#include "unicode.h"
#include "base36.h"
#include "log.h"

#include <assert.h>
#include <limits.h>
#include <memory.h>
#include <stdlib.h>
#include <wctype.h>

/* parse_token() writes a plain space to the output when it meets this
 * character unescaped, so a token can carry spaces without being quoted. */
#define SPACE_REPLACEMENT '~'
/* parse_token() copies the character that follows this one verbatim;
 * skip_token() steps over it. */
#define ESCAPE_CHAR       '\\'
/* Size in bytes of the static token buffer (pbuf) used by the functions
 * that do not take a caller-supplied buffer. */
#define MAXTOKENSIZE      8192

/* One entry of the parser state stack; entries are chained through `next`. */
typedef struct parse_state {
    /* read position inside the string being tokenized; NULL for a freshly
     * pushed state that has not been initialized yet */
    const char *current_token;
    /* the state that becomes current again after parser_popstate() */
    struct parse_state *next;
    /* opaque pointer supplied to init_tokens_ex(); only ever passed to dtor */
    void *data;
    /* optional cleanup callback, invoked with `data` when the state is
     * re-initialized or popped; may be NULL */
    void(*dtor)(void *);
} parse_state;

/* Top of the parser state stack. NULL until init_tokens_ex() or
 * parser_pushstate() allocates the first entry. */
static parse_state *states;

/*
 * Advances *str_p past any leading whitespace (ASCII or multi-byte UTF-8).
 *
 * Stops at the first non-whitespace character, at the terminating NUL, or at
 * a byte sequence that unicode_utf8_decode() rejects (a warning is logged
 * and *str_p is left pointing at the offending sequence).
 *
 * Returns 0 on success, otherwise the non-zero result of the failed decode.
 */
static int eatwhitespace_c(const char **str_p)
{
    const char *pos = *str_p;
    int status = 0;

    while (status == 0) {
        unsigned char lead = (unsigned char)*pos;
        wint_t ch = lead;
        size_t width = 1;

        if (lead & 0x80) {
            /* high bit set: this is the start of a multi-byte sequence */
            status = unicode_utf8_decode(&ch, pos, &width);
            if (status != 0) {
                log_warning("illegal character sequence in UTF8 string: %s\n", pos);
                break;
            }
        }
        if (!iswspace(ch)) {
            break;
        }
        pos += width;
    }

    *str_p = pos;
    return status;
}

/*
 * (Re-)initializes the current parser state to tokenize `initstr`.
 *
 * If no state exists yet, one is allocated (the process aborts when the
 * allocation fails). If a state already exists and has a destructor, that
 * destructor is run on the previously attached data before it is replaced.
 *
 * initstr: string to tokenize; stored by pointer, not copied.
 * data:    opaque pointer associated with this parse; may be NULL.
 * dtor:    called with `data` when the state is re-initialized or popped;
 *          may be NULL.
 */
void init_tokens_ex(const char *initstr, void *data, void (*dtor)(void *))
{
    if (states != NULL) {
        /* release whatever the previous parse attached to this state */
        if (states->dtor != NULL) {
            states->dtor(states->data);
        }
    }
    else {
        states = calloc(1, sizeof(parse_state));
        if (states == NULL) {
            abort();
        }
    }

    states->current_token = initstr;
    states->data = data;
    states->dtor = dtor;
}

/* Convenience wrapper around init_tokens_ex(): starts tokenizing `initstr`
 * with no attached data and no destructor. */
void init_tokens_str(const char *initstr) {
    init_tokens_ex(initstr, NULL, NULL);
}

/*
 * Pushes a fresh, uninitialized state onto the parser stack. The new state
 * has no input string (current_token is NULL), no data and no destructor.
 * Aborts the process if the allocation fails.
 */
void parser_pushstate(void)
{
    parse_state *fresh = calloc(1, sizeof *fresh);

    if (fresh == NULL) {
        abort();
    }
    fresh->next = states;
    fresh->current_token = NULL;
    states = fresh;
}

/*
 * Pops the current state off the parser stack: runs its destructor (if any)
 * on the attached data, frees the state, and makes the one below it current.
 * The stack must not be empty when this is called.
 */
void parser_popstate(void)
{
    /* remember the successor first; the top entry is about to be freed */
    parse_state *below = states->next;

    if (states->dtor != NULL) {
        states->dtor(states->data);
    }
    free(states);
    states = below;
}

/*
 * Reports whether the current state has no more tokens. Leading whitespace
 * is consumed as a side effect. A state without an input string counts as
 * finished.
 */
bool parser_end(void)
{
    if (states->current_token == NULL) {
        return true;
    }
    eatwhitespace_c(&states->current_token);
    return states->current_token[0] == '\0';
}

/*
 * Advances the current state's read position past the next token without
 * copying it anywhere.
 *
 * Leading whitespace is skipped first. The token ends at the first
 * whitespace character outside quotes, at a quote character matching the
 * one currently open, or at the end of the string. A backslash causes the
 * byte after it to be skipped.
 *
 * Does nothing when the current state has no input string.
 */
void skip_token(void)
{
    char quotechar = 0;

    if (!states->current_token) {
        /* freshly pushed state: nothing to skip */
        return;
    }
    eatwhitespace_c(&states->current_token);

    while (*states->current_token) {
        wint_t wc;
        size_t len;
        unsigned char utf8_character = (unsigned char)states->current_token[0];

        if (~utf8_character & 0x80) {
            wc = utf8_character;
            ++states->current_token;
        }
        else {
            int ret = unicode_utf8_decode(&wc, states->current_token, &len);
            if (ret != 0) {
                log_warning("illegal character sequence in UTF8 string: %s\n", states->current_token);
                /* Step over the offending byte so the loop always makes
                 * progress; it is treated as part of the token, which is how
                 * parse_token() handles undecodable bytes as well. */
                ++states->current_token;
                continue;
            }
            states->current_token += len;
        }

        if (iswspace(wc) && quotechar == 0) {
            return;
        }
        switch (utf8_character) {
        case '"':
        case '\'':
            if (utf8_character == quotechar) {
                return;
            }
            quotechar = utf8_character;
            break;
        case ESCAPE_CHAR:
            /* skip the escaped byte, but never step past the terminator */
            if (*states->current_token) {
                ++states->current_token;
            }
            break;
        default:
            break;
        }
    }
}

/* Returns true when `len` more bytes can be written at `cursor` while still
 * leaving room in the `buflen`-byte buffer `lbuf` for the terminating NUL. */
static bool token_fits(const char *lbuf, const char *cursor, size_t buflen, size_t len)
{
    return (size_t)(cursor - lbuf) + len < buflen;
}

/*
 * Extracts the next token from *str into lbuf.
 *
 * str:    in/out read position. When a token is found, *str is advanced
 *         past it; otherwise it is left unchanged.
 * lbuf:   destination buffer for the NUL-terminated token.
 * buflen: size of lbuf in bytes. A token that does not fit is still consumed
 *         in full, but only the part that fits is stored.
 *
 * Returns lbuf when a token was read, or NULL when *str is NULL or holds
 * nothing but whitespace (lbuf is set to the empty string in the latter
 * case if buflen > 0).
 *
 * Tokenizing rules:
 *  - leading whitespace is skipped; unquoted whitespace ends the token;
 *  - a token that starts with ' or " runs up to the matching quote;
 *    a quote character anywhere else is copied literally;
 *  - SPACE_REPLACEMENT is stored as a space;
 *  - ESCAPE_CHAR makes the following character be copied verbatim;
 *  - bytes that are not valid UTF-8 are converted as ISO-8859-1.
 * The stored result is passed through unicode_utf8_trim().
 */
char *parse_token(const char **str, char *lbuf, size_t buflen)
{
    char *cursor = lbuf;
    char quotechar = 0;
    bool escape = false;
    const char *ctoken = *str, *cstart;

    if (!ctoken) {
        return NULL;
    }
    eatwhitespace_c(&ctoken);
    if (!*ctoken) {
        if (buflen > 0) {
            *cursor = 0;
        }
        return NULL;
    }
    cstart = ctoken;
    while (*ctoken) {
        wint_t wc;
        size_t len;
        bool copy = false;

        unsigned char utf8_character = (unsigned char)*ctoken;
        if (~utf8_character & 0x80) {
            wc = utf8_character;
            len = 1;
        }
        else {
            int ret = unicode_utf8_decode(&wc, ctoken, &len);
            if (ret != 0) {
                log_info("falling back to ISO-8859-1: %s\n", cstart);
                if (token_fits(lbuf, cursor, buflen, 2)) {
                    size_t inlen = 1;
                    len = 2;
                    unicode_latin1_to_utf8(cursor, &len, ctoken, &inlen);
                    cursor += len;
                    ctoken += inlen;
                }
                else {
                    /* No room left: drop the byte. wc and len are not valid
                     * after a failed decode, so we must not fall through. */
                    ++ctoken;
                }
                continue;
            }
        }
        if (escape) {
            copy = true;
            escape = false;
        }
        else if (iswspace(wc)) {
            if (quotechar == 0)
                break;
            copy = true;
        }
        else if (utf8_character == '"' || utf8_character == '\'') {
            if (utf8_character == quotechar) {
                /* closing quote: consume it and finish the token */
                ++ctoken;
                break;
            }
            else if (quotechar == 0 && cstart == ctoken) {
                /* opening quote is only recognized as the very first character */
                quotechar = utf8_character;
                ++ctoken;
            }
            else {
                /* A quote in the middle of a token is ordinary text. The
                 * input is consumed even when the buffer is full, otherwise
                 * the loop would never terminate. */
                if (token_fits(lbuf, cursor, buflen, len)) {
                    *cursor++ = *ctoken;
                }
                ++ctoken;
            }
        }
        else if (utf8_character == SPACE_REPLACEMENT) {
            if (token_fits(lbuf, cursor, buflen, len)) {
                *cursor++ = ' ';
            }
            ++ctoken;
        }
        else if (utf8_character == ESCAPE_CHAR) {
            escape = true;
            ++ctoken;
        }
        else {
            copy = true;
        }
        if (copy) {
            if (token_fits(lbuf, cursor, buflen, len)) {
                memcpy(cursor, ctoken, len);
                cursor += len;
            }
            ctoken += len;
        }
    }

    if (buflen > 0) {
        /* token_fits() always reserves one byte, so this stays in bounds */
        *cursor = '\0';
        unicode_utf8_trim(lbuf);
    }
    *str = ctoken;
    return lbuf;
}

/* Scratch buffer shared by the token functions that return a pointer without
 * taking a caller-supplied buffer. Its contents are overwritten by the next
 * such call. */
static char pbuf[MAXTOKENSIZE];       /* STATIC_RESULT: used for return, not across calls */

/*
 * Deprecated variant of parse_token() that stores the token in the shared
 * static buffer. The returned pointer (NULL when there is no token) is only
 * valid until the next call that uses that buffer.
 */
const char *parse_token_depr(const char **str)
{
    const char *token = parse_token(str, pbuf, sizeof pbuf);

    return token;
}

/*
 * Reads the next token of the current parser state into the shared static
 * buffer. Returns that buffer, or NULL when no token is left. The result is
 * overwritten by the next call that uses the static buffer.
 */
char *getstrtoken(void)
{
    const char **position = &states->current_token;

    return parse_token(position, pbuf, MAXTOKENSIZE);
}

/*
 * Reads the next token of the current parser state into the caller's buffer.
 *
 * lbuf:    destination buffer.
 * bufsize: size of lbuf in bytes.
 *
 * Returns lbuf, or NULL when no token is left.
 */
char *gettoken(char *lbuf, size_t bufsize)
{
    const char **position = &states->current_token;

    return parse_token(position, lbuf, bufsize);
}

/*
 * Reads the next token of the current parser state and converts it to an
 * int (base 10, same leading-whitespace/sign/digit syntax as atoi).
 *
 * Returns 0 when there is no token or it does not start with a number.
 * Values outside the range of int are clamped to INT_MIN / INT_MAX instead
 * of invoking the undefined behaviour atoi() has on overflow.
 */
int getint(void)
{
    char token[16];
    const char *s = gettoken(token, sizeof(token));
    long value;

    if (!s) {
        return 0;
    }
    /* strtol saturates at LONG_MIN/LONG_MAX on overflow; narrow it further */
    value = strtol(s, NULL, 10);
    if (value > INT_MAX) {
        return INT_MAX;
    }
    if (value < INT_MIN) {
        return INT_MIN;
    }
    return (int)value;
}

/*
 * Reads the next token as an integer via getint() and maps negative results
 * to 0, so the return value is never negative.
 */
int getuint(void)
{
    int value = getint();

    if (value < 0) {
        return 0;
    }
    return value;
}

/*
 * Reads the next token and converts it with atoi36().
 *
 * Returns 0 when there is no token, -1 when atoi36() yields a negative
 * value, and the converted value otherwise.
 */
int getid(void)
{
    char buffer[8];
    const char *text = gettoken(buffer, sizeof buffer);
    int id;

    if (text == NULL) {
        return 0;
    }
    id = atoi36(text);
    return (id < 0) ? -1 : id;
}

/*
 * Converts the leading decimal digits of `s` to a non-negative number.
 *
 * s: NUL-terminated string; must not be NULL (asserted).
 *
 * Returns 0 unless the very first character is a digit, so leading
 * whitespace or a sign yields 0. Values larger than INT_MAX are clamped to
 * INT_MAX instead of invoking the undefined behaviour atoi() has on
 * overflow.
 */
unsigned int atoip(const char *s)
{
    long value;

    assert(s);
    /* compare the char directly rather than calling isdigit(), which must
     * not be handed a negative char value */
    if (s[0] < '0' || s[0] > '9') {
        return 0;
    }
    /* first character is a digit, so the result cannot be negative */
    value = strtol(s, NULL, 10);
    if (value > INT_MAX) {
        value = INT_MAX;
    }
    return (unsigned int)value;
}
move keyword.[hc] to util 2018-09-29 18:13:32 +02:00			`#ifdef _MSC_VER`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`#include <platform.h>`
move keyword.[hc] to util 2018-09-29 18:13:32 +02:00			`#endif`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`#include "parser.h"`
			`#include "unicode.h"`
ongoing config.c cleanup: getid() 2014-12-18 07:09:22 +01:00			`#include "base36.h"`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`#include "log.h"`

			`#include <assert.h>`
use cmake for autoconf, slim down platform.h 2014-03-15 19:29:11 +01:00			`#include <stdlib.h>`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`#include <wctype.h>`
			`#include <memory.h>`

			`#define SPACE_REPLACEMENT '~'`
			`#define ESCAPE_CHAR '\\'`
			`#define MAXTOKENSIZE 8192`

MSVC debugger gets confused when two structs have the same name 2019-01-18 22:26:55 +01:00			`typedef struct parse_state {`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`const char *current_token;`
MSVC debugger gets confused when two structs have the same name 2019-01-18 22:26:55 +01:00			`struct parse_state *next;`
fix parser to keep a reference to the order it is parsing. make push/popstate not crash. pass unit tests. 2017-11-10 07:56:56 +01:00			`void *data;`
			`void(dtor)(void );`
MSVC debugger gets confused when two structs have the same name 2019-01-18 22:26:55 +01:00			`} parse_state;`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00
MSVC debugger gets confused when two structs have the same name 2019-01-18 22:26:55 +01:00			`static parse_state *states;`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00
indentation rules, strictly applied 2011-03-07 08:02:35 +01:00			`static int eatwhitespace_c(const char **str_p)`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`{`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`int ret = 0;`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`wint_t wc;`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`size_t len;`
			`const char str = str_p;`

			`/* skip over potential whitespace */`
			`for (;;) {`
			`unsigned char utf8_character = (unsigned char)*str;`
			`if (~utf8_character & 0x80) {`
continue fixing compilation (gcc/clang) 2017-01-10 18:05:48 +01:00			`if (!iswspace(utf8_character))`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`break;`
			`++str;`
			`}`
			`else {`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`ret = unicode_utf8_decode(&wc, str, &len);`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`if (ret != 0) {`
			`log_warning("illegal character sequence in UTF8 string: %s\n", str);`
			`break;`
			`}`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`if (!iswspace(wc))`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`break;`
			`str += len;`
			`}`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`}`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`*str_p = str;`
			`return ret;`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`}`

fix parser to keep a reference to the order it is parsing. make push/popstate not crash. pass unit tests. 2017-11-10 07:56:56 +01:00			`void init_tokens_ex(const char initstr, void data, void (dtor)(void ))`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`{`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`if (states == NULL) {`
MSVC debugger gets confused when two structs have the same name 2019-01-18 22:26:55 +01:00			`states = calloc(1, sizeof(parse_state));`
reduce big arrays on the stack, report allies with new pump_paragraph function (WIP) 2018-11-26 22:01:18 +01:00			`if (!states) abort();`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`}`
fix parser to keep a reference to the order it is parsing. make push/popstate not crash. pass unit tests. 2017-11-10 07:56:56 +01:00			`else if (states->dtor) {`
			`states->dtor(states->data);`
			`}`
			`states->dtor = dtor;`
			`states->data = data;`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`states->current_token = initstr;`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`}`

fix parser to keep a reference to the order it is parsing. make push/popstate not crash. pass unit tests. 2017-11-10 07:56:56 +01:00			`void init_tokens_str(const char *initstr) {`
			`init_tokens_ex(initstr, NULL, NULL);`
			`}`

indentation rules, strictly applied 2011-03-07 08:02:35 +01:00			`void parser_pushstate(void)`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`{`
MSVC debugger gets confused when two structs have the same name 2019-01-18 22:26:55 +01:00			`parse_state *new_state = calloc(1, sizeof(parse_state));`
reduce big arrays on the stack, report allies with new pump_paragraph function (WIP) 2018-11-26 22:01:18 +01:00			`if (!new_state) abort();`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`new_state->current_token = NULL;`
			`new_state->next = states;`
			`states = new_state;`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`}`

indentation rules, strictly applied 2011-03-07 08:02:35 +01:00			`void parser_popstate(void)`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`{`
MSVC debugger gets confused when two structs have the same name 2019-01-18 22:26:55 +01:00			`parse_state *new_state = states->next;`
fix parser to keep a reference to the order it is parsing. make push/popstate not crash. pass unit tests. 2017-11-10 07:56:56 +01:00			`if (states->dtor) {`
			`states->dtor(states->data);`
			`}`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`free(states);`
			`states = new_state;`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`}`

remove custom boolean type use bool when we have C99, or our own typedef for bool 2012-06-24 07:41:07 +02:00			`bool parser_end(void)`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`{`
make getstrtoken() return null at EOL, kill init_tokens. init_order all the things! added a bunch of new assertions to cover for oversights. added some new tests for order parsing. 2014-08-23 09:17:58 +02:00			`if (states->current_token) {`
			`eatwhitespace_c(&states->current_token);`
			`return *states->current_token == 0;`
			`}`
			`return true;`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`}`

indentation rules, strictly applied 2011-03-07 08:02:35 +01:00			`void skip_token(void)`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`{`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`char quotechar = 0;`
			`eatwhitespace_c(&states->current_token);`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`while (*states->current_token) {`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`wint_t wc;`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`size_t len;`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`unsigned char utf8_character = (unsigned char)states->current_token[0];`
			`if (~utf8_character & 0x80) {`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`wc = utf8_character;`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`++states->current_token;`
			`}`
			`else {`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`int ret = unicode_utf8_decode(&wc, states->current_token, &len);`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`if (ret == 0) {`
			`states->current_token += len;`
			`}`
			`else {`
			`log_warning("illegal character sequence in UTF8 string: %s\n", states->current_token);`
			`}`
			`}`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`if (iswspace(wc) && quotechar == 0) {`
indentation rules, strictly applied 2011-03-07 08:02:35 +01:00			`return;`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`}`
			`else {`
			`switch (utf8_character) {`
			`case '"':`
			`case '\'':`
			`if (utf8_character == quotechar)`
			`return;`
			`quotechar = utf8_character;`
			`break;`
			`case ESCAPE_CHAR:`
			`++states->current_token;`
			`break;`
			`}`
			`}`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`}`
			`}`

parsing tokens when buffer is too small - skip the entire token. now with tests. 2014-12-24 15:55:55 +01:00			`char parse_token(const char str, char lbuf, size_t buflen)`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`{`
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`char *cursor = lbuf;`
			`char quotechar = 0;`
			`bool escape = false;`
fix parser crash from turn 1179 2020-07-26 12:59:49 +02:00			`const char ctoken = str, *cstart;`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`if (!ctoken) {`
			`return 0;`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`}`
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`eatwhitespace_c(&ctoken);`
			`if (!*ctoken) {`
parsing tokens when buffer is too small - skip the entire token. now with tests. 2014-12-24 15:55:55 +01:00			`if (buflen > 0) {`
rename to gettoken, use more widely, add a basic test. 2014-12-22 16:28:17 +01:00			`*cursor = 0;`
			`}`
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`return 0;`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`}`
fix parser crash from turn 1179 2020-07-26 12:59:49 +02:00			`cstart = ctoken;`
parsing tokens when buffer is too small - skip the entire token. now with tests. 2014-12-24 15:55:55 +01:00			`while (*ctoken) {`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`wint_t wc;`
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`size_t len;`
			`bool copy = false;`

			`unsigned char utf8_character = (unsigned char )ctoken;`
			`if (~utf8_character & 0x80) {`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`wc = utf8_character;`
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`len = 1;`
			`}`
			`else {`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`int ret = unicode_utf8_decode(&wc, ctoken, &len);`
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`if (ret != 0) {`
Parser fallback to latin1 when detecting invalid utf-8 2020-08-09 20:56:43 +02:00			`log_info("falling back to ISO-8859-1: %s\n", cstart);`
			`if (cursor - buflen < lbuf - 2) {`
			`size_t inlen = 1;`
			`len = 2;`
			`unicode_latin1_to_utf8(cursor, &len, ctoken, &inlen);`
			`cursor += len;`
			`ctoken += inlen;`
			`continue;`
			`}`
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`}`
			`}`
			`if (escape) {`
			`copy = true;`
			`escape = false;`
			`}`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`else if (iswspace(wc)) {`
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`if (quotechar == 0)`
			`break;`
			`copy = true;`
			`}`
			`else if (utf8_character == '"' \|\| utf8_character == '\'') {`
			`if (utf8_character == quotechar) {`
			`++ctoken;`
			`break;`
			`}`
fix parser crash from turn 1179 2020-07-26 12:59:49 +02:00			`else if (quotechar == 0 && cstart == ctoken) {`
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`quotechar = utf8_character;`
			`++ctoken;`
			`}`
			`else {`
BUG 2381: parse_token overrun. 2017-10-29 18:03:44 +01:00			`if (cursor - buflen < lbuf - len) {`
			`cursor++ = ctoken++;`
			`}`
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`}`
			`}`
			`else if (utf8_character == SPACE_REPLACEMENT) {`
BUG 2381: parse_token overrun. 2017-10-29 18:03:44 +01:00			`if (cursor - buflen < lbuf - len) {`
			`*cursor++ = ' ';`
			`}`
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`++ctoken;`
			`}`
			`else if (utf8_character == ESCAPE_CHAR) {`
			`escape = true;`
			`++ctoken;`
			`}`
			`else {`
			`copy = true;`
			`}`
			`if (copy) {`
fix parse_token buffer overrun. missing tests for parse_token. this fixes http://bugs.eressea.de/view.php?id=2206 2016-06-07 21:47:09 +02:00			`if (cursor - buflen < lbuf - len) {`
parsing tokens when buffer is too small - skip the entire token. now with tests. 2014-12-24 15:55:55 +01:00			`memcpy(cursor, ctoken, len);`
			`cursor += len;`
			`}`
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`ctoken += len;`
			`}`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`}`

start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`*cursor = '\0';`
make parse_token trim ignored characters like zero-width spaces. 2020-03-14 11:57:29 +01:00			`unicode_utf8_trim(lbuf);`
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`*str = ctoken;`
			`return lbuf;`
			`}`

parsing needs to return a static buffer if it has no argument 2014-12-29 07:44:00 +01:00			`static char pbuf[MAXTOKENSIZE]; /* STATIC_RESULT: used for return, not across calls */`
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`const char parse_token_depr(const char *str)`
			`{`
fix indentation in every file fix copyright date remove vi ts=2 code remove a couple of superfluous extern declarations 2015-01-30 20:37:14 +01:00			`return parse_token(str, pbuf, MAXTOKENSIZE);`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`}`

Leerzeichen aus Beschreibungen trimmen. 2019-04-24 12:55:41 +02:00			`char *getstrtoken(void)`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`{`
parsing needs to return a static buffer if it has no argument 2014-12-29 07:44:00 +01:00			`return parse_token((const char **)&states->current_token, pbuf, MAXTOKENSIZE);`
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`}`

Leerzeichen aus Beschreibungen trimmen. 2019-04-24 12:55:41 +02:00			`char gettoken(char lbuf, size_t bufsize)`
start to get rid of getstrtoken(), which uses an internal static buffer and causes horrible bugs when called multiple times. 2014-12-22 14:21:24 +01:00			`{`
			`return parse_token((const char **)&states->current_token, lbuf, bufsize);`
undo more CRLF screwups. 2010-08-08 10:06:34 +02:00			`}`
ongoing config.c cleanup: getid() 2014-12-18 07:09:22 +01:00
additional tests for the parser. move more parsing code out of config.c 2014-12-22 16:31:10 +01:00			`int getint(void)`
			`{`
			`char token[16];`
			`const char * s = gettoken(token, sizeof(token));`
			`return s ? atoi(s) : 0;`
			`}`

do not use MIN and MAX. 2018-01-01 08:23:52 +01:00			`int getuint(void)`
additional tests for the parser. move more parsing code out of config.c 2014-12-22 16:31:10 +01:00			`{`
			`int n = getint();`
			`return (n < 0) ? 0 : n;`
			`}`

ongoing config.c cleanup: getid() 2014-12-18 07:09:22 +01:00			`int getid(void)`
			`{`
parsing tokens when buffer is too small - skip the entire token. now with tests. 2014-12-24 15:55:55 +01:00			`char token[8];`
rename to gettoken, use more widely, add a basic test. 2014-12-22 16:28:17 +01:00			`const char *str = gettoken(token, sizeof(token));`
ongoing config.c cleanup: getid() 2014-12-18 07:09:22 +01:00			`int i = str ? atoi36(str) : 0;`
			`if (i < 0) {`
			`return -1;`
			`}`
			`return i;`
			`}`
move atoip out of config (small helper) and test it. remove some unnecessary variables from laws.c 2014-12-23 09:23:37 +01:00
			`unsigned int atoip(const char *s)`
			`{`
			`int n;`

			`assert(s);`
fix parser to keep a reference to the order it is parsing. make push/popstate not crash. pass unit tests. 2017-11-10 07:56:56 +01:00			`n = (s[0] >= '0' && s[0] <= '9');`
do not call isdigit with a negative value. http://bugs.eressea.de/view.php?id=1987#c6941 2017-02-03 21:19:39 +01:00			`n = n ? atoi(s) : 0;`
move atoip out of config (small helper) and test it. remove some unnecessary variables from laws.c 2014-12-23 09:23:37 +01:00
			`if (n < 0)`
			`n = 0;`

			`return n;`
			`}`