2024-10-16 17:35:38 -06:00
|
|
|
#ifndef ARC_STD_PARSER_H_
|
|
|
|
|
#define ARC_STD_PARSER_H_
|
|
|
|
|
|
|
|
|
|
#ifdef __cplusplus
|
|
|
|
|
extern "C" {
|
|
|
|
|
#endif
|
|
|
|
|
|
2024-10-16 05:14:53 -06:00
|
|
|
#include "arc/std/array.h"
|
2024-10-16 23:46:16 -06:00
|
|
|
#include "arc/std/lexer.h"
|
2024-11-23 19:27:30 -07:00
|
|
|
#include "arc/std/vector.h"
|
2024-10-16 05:14:53 -06:00
|
|
|
#include <stdint.h>
|
2024-10-16 17:35:38 -06:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* @brief a parser type
|
|
|
|
|
*/
|
|
|
|
|
typedef struct ARC_Parser ARC_Parser;
|
|
|
|
|
|
|
|
|
|
/**
|
2024-10-16 18:00:52 -06:00
|
|
|
* @brief a langue tag type for the parser //TODO: explain this better
|
2024-10-16 17:35:38 -06:00
|
|
|
*/
|
2024-11-23 19:27:30 -07:00
|
|
|
typedef struct ARC_ParserTag {
|
2024-10-16 05:14:53 -06:00
|
|
|
uint32_t tagId;
|
|
|
|
|
|
|
|
|
|
uint32_t **tokensOrTags;
|
2024-11-29 13:38:32 -07:00
|
|
|
uint32_t tokensOrTagsSize;
|
2024-11-23 19:27:30 -07:00
|
|
|
} ARC_ParserTag;
|
2024-10-16 05:14:53 -06:00
|
|
|
|
2024-11-29 13:38:32 -07:00
|
|
|
/*
|
2024-11-30 01:14:55 -07:00
|
|
|
* @brief a parser type used inside of the parser data create function
|
|
|
|
|
*
|
|
|
|
|
* @note there are no public creation and destruction functions for this type as it is only ment to be used within the creation callback
|
|
|
|
|
* @note if the parser tag token is a token then tagTokens will be NULL
|
|
|
|
|
* @note if the parser tag token is a tag then token will be NULL
|
2024-11-29 13:38:32 -07:00
|
|
|
*/
|
|
|
|
|
typedef struct ARC_ParserTagToken {
|
|
|
|
|
uint32_t id;
|
|
|
|
|
|
|
|
|
|
ARC_LexerToken *token;
|
|
|
|
|
ARC_Vector *tagTokens;
|
|
|
|
|
} ARC_ParserTagToken;
|
|
|
|
|
|
2024-10-16 18:00:52 -06:00
|
|
|
/**
|
|
|
|
|
* @brief a callback function to initialize the lexer the parser uses with rules
|
|
|
|
|
*
|
|
|
|
|
* @param lexer the lexer used by the parser that rules should be added to
|
|
|
|
|
*/
|
|
|
|
|
typedef void (* ARC_Parser_InitLexerRulesFn)(ARC_Lexer *lexer);
|
2024-10-16 17:35:38 -06:00
|
|
|
|
2024-11-30 01:14:55 -07:00
|
|
|
/**
|
|
|
|
|
* @brief TODO: write this
|
|
|
|
|
*/
|
|
|
|
|
typedef void (* ARC_ParserData_CreateFn)(void **data, ARC_ParserTagToken *parsedData, void *userData);
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* @brief TODO: write this
|
|
|
|
|
*/
|
|
|
|
|
typedef void (* ARC_ParserData_DestroyFn)(void *data);
|
|
|
|
|
|
2024-10-16 17:35:38 -06:00
|
|
|
/**
|
|
|
|
|
* @brief creates an ARC_Parser type
|
|
|
|
|
*
|
2024-11-20 10:27:17 -07:00
|
|
|
* @TODO: fix this documentation to reflect changes
|
|
|
|
|
*
|
2024-10-16 05:14:53 -06:00
|
|
|
* @TODO: probs want to move the note to another file
|
|
|
|
|
* @note array of tokens for langauge? like
|
|
|
|
|
* ARC_ParserTag tag = {
|
|
|
|
|
* VARIABLE_NAME, //tagId
|
|
|
|
|
* {
|
|
|
|
|
* { 2, CHAR_OR_NUM, VARIABLE_NAME },
|
|
|
|
|
* { 1, LAMBDA },
|
|
|
|
|
* }, //components
|
|
|
|
|
* 2 //componentsSize
|
|
|
|
|
* };
|
|
|
|
|
*
|
2024-10-16 18:00:52 -06:00
|
|
|
* @param[out] parser ARC_Parser to create
|
|
|
|
|
* @param[in] language an arry of ARC_ParserLanguageTags defining a langauge
|
|
|
|
|
* @param[in] initLexerRulesFn a callback used to initalize the token rules the lexer within the parser will use
|
2024-10-16 17:35:38 -06:00
|
|
|
*/
|
2024-11-30 01:14:55 -07:00
|
|
|
void ARC_Parser_Create(ARC_Parser **parser, ARC_Array *language, ARC_Parser_InitLexerRulesFn initLexerRulesFn, ARC_ParserData_CreateFn *createDataFn, void *createUserData, ARC_ParserData_DestroyFn *destroyDataFn);
|
2024-10-16 17:35:38 -06:00
|
|
|
|
2024-11-23 19:27:30 -07:00
|
|
|
/**
|
|
|
|
|
* @brief creates an ARC_Parser type from an arc vector
|
|
|
|
|
*
|
|
|
|
|
* @param[out] parser ARC_Parser to create
|
|
|
|
|
* @param[in] language an vector of ARC_ParserLanguageTags defining a langauge
|
|
|
|
|
* @param[in] initLexerRulesFn a callback used to initalize the token rules the lexer within the parser will use
|
|
|
|
|
*/
|
2024-11-30 01:14:55 -07:00
|
|
|
void ARC_Parser_CreateFromVector(ARC_Parser **parser, ARC_Vector *language, ARC_Parser_InitLexerRulesFn initLexerRulesFn, ARC_ParserData_CreateFn *createDataFn, void *createUserData, ARC_ParserData_DestroyFn *destroyDataFn);
|
2024-11-23 19:27:30 -07:00
|
|
|
|
2024-10-16 17:35:38 -06:00
|
|
|
/**
|
2024-10-16 18:00:52 -06:00
|
|
|
* @brief creates an ARC_Parser type from a string
|
2024-10-16 17:35:38 -06:00
|
|
|
*
|
2024-10-16 18:00:52 -06:00
|
|
|
* @TODO: probs want to move the note to another file
|
|
|
|
|
* @note the syntax looks like:
|
|
|
|
|
* <variable> -> CHAR <variableName> EOF
|
|
|
|
|
* <variableName> -> <charOrNum> <variableName> | LAMBDA
|
|
|
|
|
* <charOrNum> -> CHAR | NUM
|
|
|
|
|
*
|
|
|
|
|
* @param[out] parser ARC_Parser to create
|
|
|
|
|
* @param[in] language an arry of ARC_ParserLanguageTags defining a langauge
|
|
|
|
|
* @param[in] initLexerRulesFn a callback used to initalize the token rules the lexer within the parser will use
|
2024-10-16 17:35:38 -06:00
|
|
|
*/
|
2024-10-16 18:00:52 -06:00
|
|
|
void ARC_Parser_CreateFromString(ARC_Parser **parser, ARC_String *languageString, ARC_Parser_InitLexerRulesFn initLexerRulesFn);
|
2024-10-16 17:35:38 -06:00
|
|
|
|
|
|
|
|
/**
|
2024-10-16 05:14:53 -06:00
|
|
|
* @brief destroys an ARC_Parser type
|
2024-10-16 17:35:38 -06:00
|
|
|
*
|
2024-10-16 05:14:53 -06:00
|
|
|
* @param[in] parser ARC_Parser to free
|
2024-10-16 17:35:38 -06:00
|
|
|
*/
|
2024-10-16 05:14:53 -06:00
|
|
|
void ARC_Parser_Destroy(ARC_Parser *parser);
|
2024-10-16 17:35:38 -06:00
|
|
|
|
|
|
|
|
/**
|
2024-10-16 18:00:52 -06:00
|
|
|
* @brief
|
2024-10-16 17:35:38 -06:00
|
|
|
*
|
2024-10-24 19:56:26 -06:00
|
|
|
* @param[in] parser
|
|
|
|
|
* @param[in/out] data the string to parse, will be freed and set to NULL by the end of this function
|
2024-10-16 17:35:38 -06:00
|
|
|
*/
|
2024-10-24 19:56:26 -06:00
|
|
|
void ARC_Parser_Parse(ARC_Parser *parser, ARC_String **data);
|
2024-10-16 17:35:38 -06:00
|
|
|
|
|
|
|
|
/**
|
2024-10-16 18:00:52 -06:00
|
|
|
* @brief
|
2024-10-16 17:35:38 -06:00
|
|
|
*
|
2024-10-16 18:00:52 -06:00
|
|
|
* @param[in] parser
|
|
|
|
|
* @param[in] language
|
2024-10-16 17:35:38 -06:00
|
|
|
*/
|
|
|
|
|
void ARC_Parser_ParseFile(ARC_Parser *parser, ARC_String *path);
|
|
|
|
|
|
2024-11-20 10:27:17 -07:00
|
|
|
/**
|
|
|
|
|
* @brief
|
|
|
|
|
*
|
|
|
|
|
* @param[in] parser
|
|
|
|
|
*/
|
|
|
|
|
void ARC_Parser_ClearData(ARC_Parser *parser);
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* @brief
|
|
|
|
|
*
|
|
|
|
|
* @param[in] parser
|
|
|
|
|
*/
|
|
|
|
|
void *ARC_Parser_GetData(ARC_Parser *parser);
|
|
|
|
|
|
2024-11-01 04:39:45 -06:00
|
|
|
/**
|
|
|
|
|
* @brief basic tag for letting the parser know it is ok to end
|
|
|
|
|
*/
|
|
|
|
|
#define ARC_PARSER_TAG_LAMBDA 0
|
|
|
|
|
|
2024-10-16 17:35:38 -06:00
|
|
|
#ifdef __cplusplus
|
|
|
|
|
}
|
|
|
|
|
#endif
|
|
|
|
|
|
2024-10-16 05:14:53 -06:00
|
|
|
#endif // !ARC_STD_PARSER_H_
|