123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280 |
- /*
- * Copyright (c) 2013 Hugh Bailey <[email protected]>
- *
- * Permission to use, copy, modify, and distribute this software for any
- * purpose with or without fee is hereby granted, provided that the above
- * copyright notice and this permission notice appear in all copies.
- *
- * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
- * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
- * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
- * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
- * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
- * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
- * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
- */
- #pragma once
- #include "c99defs.h"
- #include "dstr.h"
- #include "darray.h"
- #ifdef __cplusplus
- extern "C" {
- #endif
- /* ------------------------------------------------------------------------- */
- /* string reference (string segment within an already existing array) */
/*
 * Reference to a run of characters that lives inside some other buffer.
 * Only a pointer and a length are stored here.
 */
struct strref {
    const char *array; /* first character of the referenced segment */
    size_t len;        /* number of characters in the segment */
};
- static inline void strref_clear(struct strref *dst)
- {
- dst->array = NULL;
- dst->len = 0;
- }
- static inline void strref_set(struct strref *dst, const char *array, size_t len)
- {
- dst->array = array;
- dst->len = len;
- }
- static inline void strref_copy(struct strref *dst, const struct strref *src)
- {
- dst->array = src->array;
- dst->len = src->len;
- }
- static inline void strref_add(struct strref *dst, const struct strref *t)
- {
- if (!dst->array)
- strref_copy(dst, t);
- else
- dst->len += t->len;
- }
- static inline bool strref_is_empty(const struct strref *str)
- {
- return !str || !str->array || !str->len || !*str->array;
- }
- EXPORT int strref_cmp(const struct strref *str1, const char *str2);
- EXPORT int strref_cmpi(const struct strref *str1, const char *str2);
- EXPORT int strref_cmp_strref(const struct strref *str1,
- const struct strref *str2);
- EXPORT int strref_cmpi_strref(const struct strref *str1,
- const struct strref *str2);
- /* ------------------------------------------------------------------------- */
- EXPORT bool valid_int_str(const char *str, size_t n);
- EXPORT bool valid_float_str(const char *str, size_t n);
- static inline bool valid_int_strref(const struct strref *str)
- {
- return valid_int_str(str->array, str->len);
- }
- static inline bool valid_float_strref(const struct strref *str)
- {
- return valid_float_str(str->array, str->len);
- }
/*
 * Returns true for space, tab, carriage return and line feed.
 * Other characters (including '\v' and '\f') are not treated as whitespace.
 */
static inline bool is_whitespace(char ch)
{
    switch (ch) {
    case ' ':
    case '\t':
    case '\r':
    case '\n':
        return true;
    default:
        return false;
    }
}
/* Returns true when ch is a carriage return or a line feed. */
static inline bool is_newline(char ch)
{
    if (ch == '\n')
        return true;

    return ch == '\r';
}
/* Returns true when ch is a space or a horizontal tab. */
static inline bool is_space_or_tab(const char ch)
{
    switch (ch) {
    case ' ':
    case '\t':
        return true;
    default:
        return false;
    }
}
/*
 * Returns true when ch1 followed by ch2 is a two-character newline,
 * i.e. "\r\n" or "\n\r".  Two identical newline characters do not count.
 */
static inline bool is_newline_pair(char ch1, char ch2)
{
    if (ch1 == '\r')
        return ch2 == '\n';
    if (ch1 == '\n')
        return ch2 == '\r';

    return false;
}
/*
 * Returns the length of the newline sequence at the start of array:
 *   2 for "\r\n" or "\n\r",
 *   1 for a lone '\r' or '\n',
 *   0 when array does not start with a newline character.
 *
 * Expects a NUL-terminated string: the second character is only read when
 * the first one is a newline character.
 */
static inline int newline_size(const char *array)
{
    const char first = array[0];
    char partner;

    if (first == '\r')
        partner = '\n';
    else if (first == '\n')
        partner = '\r';
    else
        return 0;

    return (array[1] == partner) ? 2 : 1;
}
- /* ------------------------------------------------------------------------- */
- /*
- * A "base" token is one of four things:
- * 1.) A sequence of alpha characters
- * 2.) A sequence of numeric characters
- * 3.) A single whitespace character if whitespace is not ignored
- * 4.) A single character that does not fall into the above 3 categories
- */
/* Category of a base token. */
enum base_token_type {
    BASETOKEN_NONE = 0,       /* zero value; what a cleared token holds */
    BASETOKEN_ALPHA = 1,      /* a sequence of alpha characters */
    BASETOKEN_DIGIT = 2,      /* a sequence of numeric characters */
    BASETOKEN_WHITESPACE = 3, /* a single whitespace character */
    BASETOKEN_OTHER = 4,      /* any other single character */
};
- struct base_token {
- struct strref text;
- enum base_token_type type;
- bool passed_whitespace;
- };
- static inline void base_token_clear(struct base_token *t)
- {
- memset(t, 0, sizeof(struct base_token));
- }
- static inline void base_token_copy(struct base_token *dst,
- struct base_token *src)
- {
- memcpy(dst, src, sizeof(struct base_token));
- }
- /* ------------------------------------------------------------------------- */
/* Severity levels, as stored in error_item.level. */
#define LEX_ERROR 0   /* the level error_data_has_errors() looks for */
#define LEX_WARNING 1
/* A single diagnostic entry. */
struct error_item {
    char *error;      /* message text; released with bfree() by error_item_free() */
    const char *file; /* file name; not released by error_item_free() */
    uint32_t row;     /* row of the diagnostic */
    uint32_t column;  /* column of the diagnostic */
    int level;        /* severity, e.g. LEX_ERROR or LEX_WARNING */
};
- static inline void error_item_init(struct error_item *ei)
- {
- memset(ei, 0, sizeof(struct error_item));
- }
- static inline void error_item_free(struct error_item *ei)
- {
- bfree(ei->error);
- error_item_init(ei);
- }
- static inline void error_item_array_free(struct error_item *array, size_t num)
- {
- size_t i;
- for (i = 0; i < num; i++)
- error_item_free(array + i);
- }
- /* ------------------------------------------------------------------------- */
- struct error_data {
- DARRAY(struct error_item) errors;
- };
- static inline void error_data_init(struct error_data *data)
- {
- da_init(data->errors);
- }
- static inline void error_data_free(struct error_data *data)
- {
- error_item_array_free(data->errors.array, data->errors.num);
- da_free(data->errors);
- }
- static inline const struct error_item *error_data_item(struct error_data *ed,
- size_t idx)
- {
- return ed->errors.array + idx;
- }
- EXPORT char *error_data_buildstring(struct error_data *ed);
- EXPORT void error_data_add(struct error_data *ed, const char *file,
- uint32_t row, uint32_t column, const char *msg,
- int level);
- static inline size_t error_data_type_count(struct error_data *ed, int type)
- {
- size_t count = 0, i;
- for (i = 0; i < ed->errors.num; i++) {
- if (ed->errors.array[i].level == type)
- count++;
- }
- return count;
- }
- static inline bool error_data_has_errors(struct error_data *ed)
- {
- size_t i;
- for (i = 0; i < ed->errors.num; i++)
- if (ed->errors.array[i].level == LEX_ERROR)
- return true;
- return false;
- }
- /* ------------------------------------------------------------------------- */
/* Lexer state: the text buffer and a cursor into it. */
struct lexer {
    char *text;         /* buffer being lexed; released with bfree() by lexer_free() */
    const char *offset; /* cursor into text; lexer_reset() points it at text */
};
- static inline void lexer_init(struct lexer *lex)
- {
- memset(lex, 0, sizeof(struct lexer));
- }
- static inline void lexer_free(struct lexer *lex)
- {
- bfree(lex->text);
- lexer_init(lex);
- }
- static inline void lexer_start(struct lexer *lex, const char *text)
- {
- lexer_free(lex);
- lex->text = bstrdup(text);
- lex->offset = lex->text;
- }
- static inline void lexer_start_move(struct lexer *lex, char *text)
- {
- lexer_free(lex);
- lex->text = text;
- lex->offset = lex->text;
- }
- static inline void lexer_reset(struct lexer *lex)
- {
- lex->offset = lex->text;
- }
/*
 * Whitespace mode passed to lexer_getbasetoken().
 * NOTE(review): presumably PARSE_WHITESPACE yields whitespace as tokens
 * and IGNORE_WHITESPACE skips it - confirm against the implementation.
 */
enum ignore_whitespace {
    PARSE_WHITESPACE = 0,
    IGNORE_WHITESPACE = 1
};
- EXPORT bool lexer_getbasetoken(struct lexer *lex, struct base_token *t,
- enum ignore_whitespace iws);
- EXPORT void lexer_getstroffset(const struct lexer *lex, const char *str,
- uint32_t *row, uint32_t *col);
- #ifdef __cplusplus
- }
- #endif
|