| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280 | 
							- /*
 
-  * Copyright (c) 2013 Hugh Bailey <[email protected]>
 
-  *
 
-  * Permission to use, copy, modify, and distribute this software for any
 
-  * purpose with or without fee is hereby granted, provided that the above
 
-  * copyright notice and this permission notice appear in all copies.
 
-  *
 
-  * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
 
-  * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
 
-  * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
 
-  * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
 
-  * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
 
-  * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
 
-  * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
 
-  */
 
- #pragma once
 
- #include "c99defs.h"
 
- #include "dstr.h"
 
- #include "darray.h"
 
- #ifdef __cplusplus
 
- extern "C" {
 
- #endif
 
- /* ------------------------------------------------------------------------- */
 
- /* string reference (string segment within an already existing array) */
 
/*
 * Non-owning view of a run of characters inside an existing character
 * array.  None of the inline helpers in this header allocate or free the
 * memory that `array` points at.
 */
struct strref {
	const char *array; /* first character of the segment */
	size_t len;        /* number of characters in the segment */
};
 
- static inline void strref_clear(struct strref *dst)
 
- {
 
- 	dst->array = NULL;
 
- 	dst->len = 0;
 
- }
 
- static inline void strref_set(struct strref *dst, const char *array, size_t len)
 
- {
 
- 	dst->array = array;
 
- 	dst->len = len;
 
- }
 
- static inline void strref_copy(struct strref *dst, const struct strref *src)
 
- {
 
- 	dst->array = src->array;
 
- 	dst->len = src->len;
 
- }
 
- static inline void strref_add(struct strref *dst, const struct strref *t)
 
- {
 
- 	if (!dst->array)
 
- 		strref_copy(dst, t);
 
- 	else
 
- 		dst->len += t->len;
 
- }
 
- static inline bool strref_is_empty(const struct strref *str)
 
- {
 
- 	return !str || !str->array || !str->len || !*str->array;
 
- }
 
- EXPORT int strref_cmp(const struct strref *str1, const char *str2);
 
- EXPORT int strref_cmpi(const struct strref *str1, const char *str2);
 
- EXPORT int strref_cmp_strref(const struct strref *str1,
 
- 			     const struct strref *str2);
 
- EXPORT int strref_cmpi_strref(const struct strref *str1,
 
- 			      const struct strref *str2);
 
- /* ------------------------------------------------------------------------- */
 
- EXPORT bool valid_int_str(const char *str, size_t n);
 
- EXPORT bool valid_float_str(const char *str, size_t n);
 
- static inline bool valid_int_strref(const struct strref *str)
 
- {
 
- 	return valid_int_str(str->array, str->len);
 
- }
 
- static inline bool valid_float_strref(const struct strref *str)
 
- {
 
- 	return valid_float_str(str->array, str->len);
 
- }
 
/* Returns true for space, tab, carriage return and line feed only. */
static inline bool is_whitespace(char ch)
{
	switch (ch) {
	case ' ':
	case '\t':
	case '\r':
	case '\n':
		return true;
	default:
		return false;
	}
}
 
/* Returns true when `ch` is a carriage return or a line feed. */
static inline bool is_newline(char ch)
{
	switch (ch) {
	case '\r':
	case '\n':
		return true;
	default:
		return false;
	}
}
 
/* Returns true for horizontal blanks only: a space or a tab. */
static inline bool is_space_or_tab(const char ch)
{
	return !(ch != ' ' && ch != '\t');
}
 
/*
 * Returns true when the two characters form a two-character line ending,
 * i.e. "\r\n" or "\n\r".  Two identical newline characters do not count.
 */
static inline bool is_newline_pair(char ch1, char ch2)
{
	if (ch1 == '\r')
		return ch2 == '\n';
	if (ch1 == '\n')
		return ch2 == '\r';

	return false;
}
 
/*
 * Measures the line ending at the start of the NUL-terminated string
 * `array`.
 *
 * Returns 2 for "\r\n" or "\n\r", 1 for a lone '\r' or '\n', and 0 when the
 * string does not begin with a newline character.
 */
static inline int newline_size(const char *array)
{
	char partner;

	if (*array == '\r')
		partner = '\n';
	else if (*array == '\n')
		partner = '\r';
	else
		return 0;

	/* array[0] is not the terminator here, so array[1] is readable */
	return (array[1] == partner) ? 2 : 1;
}
 
- /* ------------------------------------------------------------------------- */
 
- /* 
 
-  * A "base" token is one of four things:
 
-  *   1.) A sequence of alpha characters
 
-  *   2.) A sequence of numeric characters
 
-  *   3.) A single whitespace character if whitespace is not ignored
 
-  *   4.) A single character that does not fall into the above 3 categories
 
-  */
 
/* Classification of a base token. */
enum base_token_type {
	BASETOKEN_NONE = 0,   /* zero value; no category assigned */
	BASETOKEN_ALPHA,      /* a sequence of alpha characters */
	BASETOKEN_DIGIT,      /* a sequence of numeric characters */
	BASETOKEN_WHITESPACE, /* a single whitespace character */
	BASETOKEN_OTHER,      /* any other single character */
};
 
- struct base_token {
 
- 	struct strref text;
 
- 	enum base_token_type type;
 
- 	bool passed_whitespace;
 
- };
 
- static inline void base_token_clear(struct base_token *t)
 
- {
 
- 	memset(t, 0, sizeof(struct base_token));
 
- }
 
- static inline void base_token_copy(struct base_token *dst,
 
- 				   struct base_token *src)
 
- {
 
- 	memcpy(dst, src, sizeof(struct base_token));
 
- }
 
- /* ------------------------------------------------------------------------- */
 
/* Severity values stored in error_item.level. */
#define LEX_ERROR   0 /* the level error_data_has_errors() looks for */
#define LEX_WARNING 1
 
/* One diagnostic entry: a message plus the location it refers to. */
struct error_item {
	char *error;      /* message text; released with bfree() on free */
	const char *file; /* file name; never freed by this header */
	uint32_t row;     /* row of the reported location */
	uint32_t column;  /* column of the reported location */
	int level;        /* severity, compared against LEX_ERROR */
};
 
- static inline void error_item_init(struct error_item *ei)
 
- {
 
- 	memset(ei, 0, sizeof(struct error_item));
 
- }
 
- static inline void error_item_free(struct error_item *ei)
 
- {
 
- 	bfree(ei->error);
 
- 	error_item_init(ei);
 
- }
 
- static inline void error_item_array_free(struct error_item *array, size_t num)
 
- {
 
- 	size_t i;
 
- 	for (i = 0; i < num; i++)
 
- 		error_item_free(array + i);
 
- }
 
- /* ------------------------------------------------------------------------- */
 
- struct error_data {
 
- 	DARRAY(struct error_item) errors;
 
- };
 
- static inline void error_data_init(struct error_data *data)
 
- {
 
- 	da_init(data->errors);
 
- }
 
- static inline void error_data_free(struct error_data *data)
 
- {
 
- 	error_item_array_free(data->errors.array, data->errors.num);
 
- 	da_free(data->errors);
 
- }
 
- static inline const struct error_item *error_data_item(struct error_data *ed,
 
- 						       size_t idx)
 
- {
 
- 	return ed->errors.array + idx;
 
- }
 
- EXPORT char *error_data_buildstring(struct error_data *ed);
 
- EXPORT void error_data_add(struct error_data *ed, const char *file,
 
- 			   uint32_t row, uint32_t column, const char *msg,
 
- 			   int level);
 
- static inline size_t error_data_type_count(struct error_data *ed, int type)
 
- {
 
- 	size_t count = 0, i;
 
- 	for (i = 0; i < ed->errors.num; i++) {
 
- 		if (ed->errors.array[i].level == type)
 
- 			count++;
 
- 	}
 
- 	return count;
 
- }
 
- static inline bool error_data_has_errors(struct error_data *ed)
 
- {
 
- 	size_t i;
 
- 	for (i = 0; i < ed->errors.num; i++)
 
- 		if (ed->errors.array[i].level == LEX_ERROR)
 
- 			return true;
 
- 	return false;
 
- }
 
- /* ------------------------------------------------------------------------- */
 
/* Lexer state: the text being scanned and the current read position. */
struct lexer {
	char *text;         /* buffer owned by the lexer; bfree()d on free */
	const char *offset; /* current position; starts at `text` */
};
 
- static inline void lexer_init(struct lexer *lex)
 
- {
 
- 	memset(lex, 0, sizeof(struct lexer));
 
- }
 
- static inline void lexer_free(struct lexer *lex)
 
- {
 
- 	bfree(lex->text);
 
- 	lexer_init(lex);
 
- }
 
- static inline void lexer_start(struct lexer *lex, const char *text)
 
- {
 
- 	lexer_free(lex);
 
- 	lex->text = bstrdup(text);
 
- 	lex->offset = lex->text;
 
- }
 
- static inline void lexer_start_move(struct lexer *lex, char *text)
 
- {
 
- 	lexer_free(lex);
 
- 	lex->text = text;
 
- 	lex->offset = lex->text;
 
- }
 
- static inline void lexer_reset(struct lexer *lex)
 
- {
 
- 	lex->offset = lex->text;
 
- }
 
/* Whitespace mode passed to lexer_getbasetoken(). */
enum ignore_whitespace {
	PARSE_WHITESPACE = 0, /* whitespace is not ignored */
	IGNORE_WHITESPACE,    /* whitespace is ignored */
};
 
- EXPORT bool lexer_getbasetoken(struct lexer *lex, struct base_token *t,
 
- 			       enum ignore_whitespace iws);
 
- EXPORT void lexer_getstroffset(const struct lexer *lex, const char *str,
 
- 			       uint32_t *row, uint32_t *col);
 
- #ifdef __cplusplus
 
- }
 
- #endif
 
 
  |