2018-09-29 18:13:32 +02:00
|
|
|
#ifdef _MSC_VER
|
|
|
|
#include <platform.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#include "order_parser.h"
|
|
|
|
|
2018-09-30 19:47:34 +02:00
|
|
|
#include <assert.h>
|
2018-10-02 21:40:14 +02:00
|
|
|
#include <wctype.h>
|
2018-09-29 18:13:32 +02:00
|
|
|
#include <stdlib.h>
|
2018-09-30 19:47:34 +02:00
|
|
|
#include <string.h>
|
2018-09-29 18:13:32 +02:00
|
|
|
|
|
|
|
struct OrderParserStruct {
|
|
|
|
void *m_userData;
|
|
|
|
char *m_buffer;
|
|
|
|
char *m_bufferPtr;
|
|
|
|
const char *m_bufferEnd;
|
|
|
|
OP_OrderHandler m_orderHandler;
|
2018-09-30 13:45:19 +02:00
|
|
|
enum OP_Error m_errorCode;
|
2018-09-29 18:13:32 +02:00
|
|
|
int m_lineNumber;
|
|
|
|
};
|
|
|
|
|
2018-10-02 21:40:14 +02:00
|
|
|
/*
 * Returns the error code currently stored in the parser. The parser
 * stores a code whenever a parse call reports OP_STATUS_ERROR.
 */
enum OP_Error OP_GetErrorCode(OP_Parser parser)
{
    const enum OP_Error lastError = parser->m_errorCode;

    return lastError;
}
|
|
|
|
|
2018-09-30 19:47:34 +02:00
|
|
|
/*
 * Installs the callback that receives each non-empty line found by the
 * parser. Passing NULL disables the callback; lines are then consumed
 * silently.
 */
void OP_SetOrderHandler(OP_Parser parser, OP_OrderHandler handler)
{
    (*parser).m_orderHandler = handler;
}
|
|
|
|
|
2018-09-30 19:47:34 +02:00
|
|
|
/*
 * Stores an opaque pointer in the parser. The parser never looks at it;
 * it is simply passed back as the first argument of the order handler.
 */
void OP_SetUserData(OP_Parser parser, void *userData)
{
    (*parser).m_userData = userData;
}
|
|
|
|
|
2018-09-30 19:47:34 +02:00
|
|
|
/*
 * Releases the parser's input buffer and clears all three buffer
 * pointers so that the parser is back in the "nothing buffered" state.
 */
static void buffer_free(OP_Parser parser)
{
    /* TODO: recycle buffers, reduce mallocs. */
    free(parser->m_buffer);

    parser->m_buffer = NULL;
    parser->m_bufferPtr = NULL;
    parser->m_bufferEnd = NULL;
}
|
|
|
|
|
|
|
|
/*
 * Returns the parser to its initial parsing state so it can be reused
 * for a new input: the line counter restarts at 1, any buffered input is
 * discarded, and a stale error code left over from a previous failed
 * parse is cleared. The registered handler and user data are kept.
 */
void OP_ParserReset(OP_Parser parser)
{
    parser->m_lineNumber = 1;
    /* do not let an old failure leak into the next parse */
    parser->m_errorCode = OP_ERROR_NONE;
    buffer_free(parser);
}
|
|
|
|
|
|
|
|
|
2018-09-29 18:13:32 +02:00
|
|
|
OP_Parser OP_ParserCreate(void)
|
|
|
|
{
|
2018-09-29 21:19:24 +02:00
|
|
|
OP_Parser parser = calloc(1, sizeof(struct OrderParserStruct));
|
2018-09-30 19:47:34 +02:00
|
|
|
OP_ParserReset(parser);
|
2018-09-29 21:19:24 +02:00
|
|
|
return parser;
|
2018-09-29 18:13:32 +02:00
|
|
|
}
|
|
|
|
|
2018-09-30 19:47:34 +02:00
|
|
|
/*
 * Destroys a parser together with its input buffer. Passing NULL is a
 * no-op, mirroring free(), so the result of a failed OP_ParserCreate()
 * can be handed in safely.
 */
void OP_ParserFree(OP_Parser parser)
{
    if (parser == NULL) {
        return;
    }
    free(parser->m_buffer);
    free(parser);
}
|
|
|
|
|
2018-09-30 19:47:34 +02:00
|
|
|
/*
 * Appends `len` bytes from `s` to the parser's pending input.
 *
 * A fresh NUL-terminated buffer is allocated that holds whatever is still
 * unconsumed (m_bufferPtr .. m_bufferEnd) followed by the new bytes; the
 * old buffer is released and the buffer pointers are re-based onto the
 * new one.
 *
 * parser: the parser whose buffer is extended.
 * s:      bytes to append; may be NULL only when len is 0.
 * len:    number of bytes in s; must not be negative.
 *
 * Returns OP_ERROR_NONE on success. Returns OP_ERROR_NO_MEMORY if the
 * allocation fails, in which case the parser's existing buffer is left
 * completely untouched.
 */
static enum OP_Error buffer_append(OP_Parser parser, const char *s, int len)
{
    size_t pending = 0;
    size_t added;
    size_t total;
    char *buffer;

    assert(len >= 0);
    added = (size_t)len;

    if (parser->m_buffer != NULL) {
        /* unconsumed tail of the previous input that must be kept */
        pending = (size_t)(parser->m_bufferEnd - parser->m_bufferPtr);
    }
    total = pending + added;

    /* TODO: recycle buffers, reduce mallocs. */
    buffer = malloc(total + 1);
    if (buffer == NULL) {
        /* check before touching anything: the old buffer stays valid */
        return OP_ERROR_NO_MEMORY;
    }

    /* memcpy with a NULL source is undefined even for zero bytes */
    if (pending > 0) {
        memcpy(buffer, parser->m_bufferPtr, pending);
    }
    if (added > 0) {
        memcpy(buffer + pending, s, added);
    }
    buffer[total] = '\0';

    free(parser->m_buffer);
    parser->m_buffer = buffer;
    parser->m_bufferPtr = buffer;
    parser->m_bufferEnd = buffer + total;

    return OP_ERROR_NONE;
}
|
|
|
|
|
|
|
|
/*
 * Advances over whitespace on the current line.
 *
 * Returns a pointer to the first byte at or after `pos` that is either
 * not whitespace, a line feed, or the terminating NUL. A line feed is
 * never skipped, even though it counts as whitespace.
 */
static char *skip_spaces(char *pos)
{
    char *cursor = pos;

    while (*cursor != '\0' && *cursor != '\n') {
        /* go through unsigned char so bytes >= 0x80 are not negative */
        wint_t wide = *(unsigned char *)cursor;

        /* TODO: handle unicode whitespace */
        if (!iswspace(wide)) {
            return cursor;
        }
        ++cursor;
    }
    return cursor;
}
|
|
|
|
|
2018-10-01 21:32:59 +02:00
|
|
|
/*
 * Delivers the NUL-terminated line that starts at m_bufferPtr to the
 * order handler. Leading whitespace is stripped first, and lines that are
 * empty after stripping are not reported. Without a registered handler
 * nothing happens.
 *
 * Always returns OP_ERROR_NONE.
 */
static enum OP_Error handle_line(OP_Parser parser)
{
    char *text;

    if (!parser->m_orderHandler) {
        return OP_ERROR_NONE;
    }

    text = skip_spaces(parser->m_bufferPtr);
    if (*text != '\0') {
        parser->m_orderHandler(parser->m_userData, text);
    }
    return OP_ERROR_NONE;
}
|
|
|
|
|
2018-09-30 19:47:34 +02:00
|
|
|
/*
 * Scans the body of a comment, i.e. the text following a ';'.
 *
 * A comment ends at the next line feed, unless the last non-space
 * character before that line feed is a backslash; in that case the
 * comment continues on the following line.
 *
 * parser:   used only to keep m_lineNumber up to date.
 * pos:      first byte after the ';'.
 * dangling: set to NULL, or - when the buffer ends right after a
 *           backslash (optionally followed by spaces) so that it cannot
 *           be decided yet whether the comment continues - to the
 *           address of that backslash.
 *
 * Returns a pointer to the first byte after the line feed that closes
 * the comment, or NULL if the buffer was exhausted first.
 */
static char *skip_comment(OP_Parser parser, char *pos, char **dangling)
{
    *dangling = NULL;

    for (;;) {
        char *tail;
        char *hit = strpbrk(pos, "\\\n");

        if (hit == NULL) {
            /* neither a line feed nor a backslash left in the buffer */
            return NULL;
        }
        if (*hit == '\n') {
            /* no more lines in this comment, we're done */
            ++parser->m_lineNumber;
            return hit + 1;
        }

        /* a backslash: is it the last non-space before the line break? */
        tail = skip_spaces(hit + 1);
        if (*tail == '\n') {
            /* we have a multi-line comment */
            ++parser->m_lineNumber;
            pos = tail + 1;
        }
        else if (*tail == '\0') {
            /* cannot tell without more input */
            *dangling = hit;
            return NULL;
        }
        else {
            /* ordinary backslash inside the comment, keep looking */
            pos = tail;
        }
    }
}

/*
 * Parses as many complete lines as the buffer currently holds.
 *
 * Lines are split at '\n' and reported through handle_line(). A ';'
 * starts a comment that runs to the end of the line; the text in front
 * of it is reported as a line of its own. A backslash that is the last
 * non-space character of a line joins that line with the next one (for
 * comments as well as for regular text).
 *
 * Input that does not yet form a complete line stays in the buffer
 * (m_bufferPtr is left pointing at it) so that the next OP_Parse() call
 * can append to it. An unfinished comment is kept as a single ';' marker
 * (plus a trailing backslash that may still turn out to be a line
 * continuation), which makes the following chunk start out as a comment.
 *
 * parser:  the parser; its buffer must be non-NULL and NUL-terminated.
 * isFinal: non-zero if no more input will follow; a last line without a
 *          line feed is then reported as well.
 *
 * Returns OP_STATUS_OK, or OP_STATUS_ERROR with m_errorCode set if
 * handle_line() reported a failure.
 */
static enum OP_Status parse_buffer(OP_Parser parser, int isFinal)
{
    static const char delimiters[] = "\\;\n";
    char *pos = strpbrk(parser->m_bufferPtr, delimiters);

    while (pos) {
        enum OP_Error code;
        char *next;

        switch (*pos) {
        case '\n':
            /* a complete line: terminate it and hand it over */
            *pos = '\0';
            code = handle_line(parser);
            ++parser->m_lineNumber;
            if (code != OP_ERROR_NONE) {
                parser->m_errorCode = code;
                return OP_STATUS_ERROR;
            }
            parser->m_bufferPtr = pos + 1;
            pos = strpbrk(parser->m_bufferPtr, delimiters);
            break;

        case '\\':
            /* if this is the last non-space before the line break,
             * then lines need to be joined */
            next = skip_spaces(pos + 1);
            if (*next == '\n') {
                /* slide the text in front of the backslash forward so
                 * that it directly precedes the next line, swallowing
                 * the backslash, the spaces and the line feed */
                size_t len = (size_t)(pos - parser->m_bufferPtr);
                ptrdiff_t shift = (next + 1 - pos);

                assert(shift > 0);
                memmove(parser->m_bufferPtr + shift, parser->m_bufferPtr, len);
                parser->m_bufferPtr += shift;
                pos = strpbrk(next + 1, delimiters);
                ++parser->m_lineNumber;
            }
            else if (pos[1] == '\0') {
                /* end of available input */
                if (isFinal) {
                    /* input ends on a pointless backslash, kill it */
                    pos[0] = '\0';
                }
                /* otherwise the backslash is followed by data that we
                 * do not know yet; either way stop scanning */
                pos = NULL;
            }
            else {
                /* this is not multi-line input, so do nothing */
                pos = strpbrk(pos + 1, delimiters);
            }
            break;

        case ';': {
            char *dangling = NULL;

            /* the current line ends in a comment */
            *pos++ = '\0';
            code = handle_line(parser);
            if (code != OP_ERROR_NONE) {
                parser->m_errorCode = code;
                return OP_STATUS_ERROR;
            }

            /* find the end of the comment so we can skip it.
             * obs: multi-line comments are possible with a backslash. */
            next = skip_comment(parser, pos, &dangling);
            if (next == NULL) {
                /* we exhausted the buffer before we finished the line */
                ptrdiff_t rest;

                if (isFinal) {
                    /* this comment was at the end of the file, it just
                     * has no newline. done! */
                    return OP_STATUS_OK;
                }

                /* there is more of this line in the next buffer: keep a
                 * semicolon so that it is parsed as a comment again */
                rest = parser->m_bufferEnd - parser->m_bufferPtr;
                if (dangling != NULL) {
                    /* also keep the undecided backslash; the byte in
                     * front of it is part of the comment (or the old
                     * semicolon) and can safely hold the marker */
                    parser->m_bufferPtr = dangling - 1;
                    parser->m_bufferPtr[0] = ';';
                }
                else if (rest > 0) {
                    /* should always be true */
                    parser->m_bufferPtr += (rest - 1);
                    parser->m_bufferPtr[0] = ';';
                }
                return OP_STATUS_OK;
            }

            /* end comment parsing, begin parsing a new line */
            parser->m_bufferPtr = next;
            pos = strpbrk(next, delimiters);
            break;
        }

        default:
            /* strpbrk() only returns the delimiters handled above */
            parser->m_errorCode = OP_ERROR_SYNTAX;
            return OP_STATUS_ERROR;
        }
    }

    if (isFinal && parser->m_bufferPtr < parser->m_bufferEnd) {
        /* this line ends without a line break */
        enum OP_Error code = handle_line(parser);

        if (code != OP_ERROR_NONE) {
            parser->m_errorCode = code;
            return OP_STATUS_ERROR;
        }
    }
    return OP_STATUS_OK;
}
|
2018-09-30 19:47:34 +02:00
|
|
|
|
|
|
|
/*
 * Feeds a chunk of input to the parser.
 *
 * The chunk is appended to whatever was left unparsed by earlier calls,
 * then every complete line in the buffer is parsed.
 *
 * parser:  the parser to feed.
 * s:       the input bytes.
 * len:     number of bytes in s.
 * isFinal: non-zero for the last chunk of the input.
 *
 * Returns the status of parsing, or OP_STATUS_ERROR with the error code
 * stored in the parser if the input could not be buffered.
 */
enum OP_Status OP_Parse(OP_Parser parser, const char *s, int len, int isFinal)
{
    enum OP_Error appendResult;
    const int exhausted = !(parser->m_bufferPtr < parser->m_bufferEnd);

    /* everything buffered so far has been consumed: start from scratch */
    if (exhausted) {
        buffer_free(parser);
    }

    appendResult = buffer_append(parser, s, len);
    if (appendResult == OP_ERROR_NONE) {
        return parse_buffer(parser, isFinal);
    }

    parser->m_errorCode = appendResult;
    return OP_STATUS_ERROR;
}
|