322 lines
6.4 KiB
C
322 lines
6.4 KiB
C
/******************************************************************************
|
|
Copyright (c) 2013 by Hugh Bailey <obs.jim@gmail.com>
|
|
|
|
This software is provided 'as-is', without any express or implied
|
|
warranty. In no event will the authors be held liable for any damages
|
|
arising from the use of this software.
|
|
|
|
Permission is granted to anyone to use this software for any purpose,
|
|
including commercial applications, and to alter it and redistribute it
|
|
freely, subject to the following restrictions:
|
|
|
|
1. The origin of this software must not be misrepresented; you must not
|
|
claim that you wrote the original software. If you use this software
|
|
in a product, an acknowledgment in the product documentation would be
|
|
appreciated but is not required.
|
|
|
|
2. Altered source versions must be plainly marked as such, and must not be
|
|
misrepresented as being the original software.
|
|
|
|
3. This notice may not be removed or altered from any source
|
|
distribution.
|
|
******************************************************************************/
|
|
|
|
#include <ctype.h>
|
|
#include "lexer.h"
|
|
|
|
static const char *astrblank = "";
|
|
|
|
static inline bool strref_is_empty(const struct strref *str)
|
|
{
|
|
return !str || !str->array || !str->len || !*str->array;
|
|
}
|
|
|
|
int strref_cmp(const struct strref *str1, const char *str2)
|
|
{
|
|
size_t i = 0;
|
|
|
|
if (strref_is_empty(str1))
|
|
return (!str2 || !*str2) ? 0 : -1;
|
|
if (!str2)
|
|
str2 = astrblank;
|
|
|
|
do {
|
|
char ch1, ch2;
|
|
|
|
ch1 = (i < str1->len) ? str1->array[i] : 0;
|
|
ch2 = *str2;
|
|
|
|
if (ch1 < ch2)
|
|
return -1;
|
|
else if (ch1 > ch2)
|
|
return 1;
|
|
} while (i++ < str1->len && *str2++);
|
|
|
|
return 0;
|
|
}
|
|
|
|
int strref_cmpi(const struct strref *str1, const char *str2)
|
|
{
|
|
size_t i = 0;
|
|
|
|
if (strref_is_empty(str1))
|
|
return (!str2 || !*str2) ? 0 : -1;
|
|
if (!str2)
|
|
str2 = astrblank;
|
|
|
|
do {
|
|
char ch1, ch2;
|
|
|
|
ch1 = (i < str1->len) ? toupper(str1->array[i]) : 0;
|
|
ch2 = toupper(*str2);
|
|
|
|
if (ch1 < ch2)
|
|
return -1;
|
|
else if (ch1 > ch2)
|
|
return 1;
|
|
} while (i++ < str1->len && *str2++);
|
|
|
|
return 0;
|
|
}
|
|
|
|
int strref_cmp_strref(const struct strref *str1, const struct strref *str2)
|
|
{
|
|
size_t i = 0;
|
|
|
|
if (strref_is_empty(str1))
|
|
return strref_is_empty(str2) ? 0 : -1;
|
|
if (strref_is_empty(str2))
|
|
return -1;
|
|
|
|
do {
|
|
char ch1, ch2;
|
|
|
|
ch1 = (i < str1->len) ? str1->array[i] : 0;
|
|
ch2 = (i < str2->len) ? str2->array[i] : 0;
|
|
|
|
if (ch1 < ch2)
|
|
return -1;
|
|
else if (ch1 > ch2)
|
|
return 1;
|
|
|
|
i++;
|
|
} while (i <= str1->len && i <= str2->len);
|
|
|
|
return 0;
|
|
}
|
|
|
|
int strref_cmpi_strref(const struct strref *str1, const struct strref *str2)
|
|
{
|
|
size_t i = 0;
|
|
|
|
if (strref_is_empty(str1))
|
|
return strref_is_empty(str2) ? 0 : -1;
|
|
if (strref_is_empty(str2))
|
|
return -1;
|
|
|
|
do {
|
|
char ch1, ch2;
|
|
|
|
ch1 = (i < str1->len) ? toupper(str1->array[i]) : 0;
|
|
ch2 = (i < str2->len) ? toupper(str2->array[i]) : 0;
|
|
|
|
if (ch1 < ch2)
|
|
return -1;
|
|
else if (ch1 > ch2)
|
|
return 1;
|
|
|
|
i++;
|
|
} while (i <= str1->len && i <= str2->len);
|
|
|
|
return 0;
|
|
}
|
|
/* ------------------------------------------------------------------------- */
|
|
|
|
bool valid_int_str(const char *str, size_t n)
|
|
{
|
|
bool found_num = false;
|
|
|
|
if (!str)
|
|
return false;
|
|
if (!*str)
|
|
return false;
|
|
|
|
if (!n)
|
|
n = strlen(str);
|
|
if (*str == '-' || *str == '+')
|
|
++str;
|
|
|
|
do {
|
|
if (*str > '9' || *str < '0')
|
|
return false;
|
|
|
|
found_num = true;
|
|
} while(*++str && --n);
|
|
|
|
return found_num;
|
|
}
|
|
|
|
bool valid_float_str(const char *str, size_t n)
|
|
{
|
|
bool found_num = false;
|
|
bool found_exp = false;
|
|
bool found_dec = false;
|
|
|
|
if (!str)
|
|
return false;
|
|
if (!*str)
|
|
return false;
|
|
|
|
if (!n)
|
|
n = strlen(str);
|
|
if (*str == '-' || *str == '+')
|
|
++str;
|
|
|
|
do {
|
|
if (*str == '.') {
|
|
if (found_dec || found_exp || !found_num)
|
|
return false;
|
|
|
|
found_dec = true;
|
|
|
|
} else if (*str == 'e') {
|
|
if (found_exp || !found_num)
|
|
return false;
|
|
|
|
found_exp = true;
|
|
found_num = false;
|
|
|
|
} else if (*str == '-' || *str == '+') {
|
|
if (!found_exp || !found_num)
|
|
return false;
|
|
|
|
} else if (*str > '9' || *str < '0') {
|
|
return false;
|
|
} else {
|
|
found_num = true;
|
|
}
|
|
} while(*++str && --n);
|
|
|
|
return found_num;
|
|
}
|
|
|
|
/* ------------------------------------------------------------------------- */
|
|
|
|
void error_data_add(struct error_data *data, const char *file,
|
|
uint32_t row, uint32_t column, const char *msg, int level)
|
|
{
|
|
struct error_item item;
|
|
|
|
if (!data)
|
|
return;
|
|
|
|
item.file = file;
|
|
item.row = row;
|
|
item.column = column;
|
|
item.level = level;
|
|
item.error = bstrdup(msg);
|
|
|
|
da_push_back(data->errors, &item);
|
|
}
|
|
|
|
char *error_data_buildstring(struct error_data *ed)
|
|
{
|
|
struct dstr str;
|
|
struct error_item *items = ed->errors.array;
|
|
size_t i;
|
|
|
|
dstr_init(&str);
|
|
for (i = 0; i < ed->errors.num; i++) {
|
|
struct error_item *item = items+i;
|
|
dstr_catf(&str, "%s (%u, %u): %s\n", item->file, item->row,
|
|
item->column, item->error);
|
|
}
|
|
|
|
return str.array;
|
|
}
|
|
|
|
/* ------------------------------------------------------------------------- */
|
|
|
|
static inline enum base_token_type get_char_token_type(const char ch)
|
|
{
|
|
if (is_whitespace(ch))
|
|
return BASETOKEN_WHITESPACE;
|
|
else if (isdigit(ch))
|
|
return BASETOKEN_DIGIT;
|
|
else if (isalpha(ch))
|
|
return BASETOKEN_ALPHA;
|
|
|
|
return BASETOKEN_OTHER;
|
|
}
|
|
|
|
bool lexer_getbasetoken(struct lexer *lex, struct base_token *token,
|
|
bool ignore_whitespace)
|
|
{
|
|
const char *offset = lex->offset;
|
|
const char *token_start = NULL;
|
|
enum base_token_type type = BASETOKEN_NONE;
|
|
|
|
if (!offset)
|
|
return false;
|
|
|
|
while (*offset != 0) {
|
|
char ch = *(offset++);
|
|
enum base_token_type new_type = get_char_token_type(ch);
|
|
|
|
if (type == BASETOKEN_NONE) {
|
|
if (new_type == BASETOKEN_WHITESPACE &&
|
|
ignore_whitespace)
|
|
continue;
|
|
|
|
token_start = offset-1;
|
|
type = new_type;
|
|
|
|
if (type != BASETOKEN_DIGIT ||
|
|
type != BASETOKEN_ALPHA) {
|
|
if (is_newline(ch) &&
|
|
is_newline_pair(ch, *offset)) {
|
|
offset++;
|
|
}
|
|
break;
|
|
}
|
|
} else if (type != new_type) {
|
|
break;
|
|
}
|
|
}
|
|
|
|
lex->offset = offset;
|
|
|
|
if (token_start && offset > token_start) {
|
|
strref_set(&token->text, token_start, offset-token_start);
|
|
token->type = type;
|
|
return true;
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
void lexer_getstroffset(const struct lexer *lex, const char *str,
|
|
uint32_t *row, uint32_t *col)
|
|
{
|
|
uint32_t cur_col = 1, cur_row = 1;
|
|
const char *text = lex->text;
|
|
|
|
if (!str)
|
|
return;
|
|
|
|
while (text < str) {
|
|
if (is_newline(*text)) {
|
|
text += newline_size(text)-1;
|
|
cur_col = 1;
|
|
cur_row++;
|
|
} else {
|
|
cur_col++;
|
|
}
|
|
|
|
text++;
|
|
}
|
|
|
|
*row = cur_row;
|
|
*col = cur_col;
|
|
}
|