Write a general header file and a header file for regular expressions.
This commit is contained in:
parent
41d4d98678
commit
e86518b716
24
include/liblex.h
Normal file
24
include/liblex.h
Normal file
|
@ -0,0 +1,24 @@
|
||||||
|
#ifndef LIBLEX_H
|
||||||
|
#define LIBLEX_H
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Represents a result of a liblex operation.
|
||||||
|
*/
|
||||||
|
enum liblex_result_e {
|
||||||
|
/**
|
||||||
|
* Represents a succesful operation.
|
||||||
|
*/
|
||||||
|
LIBLEX_SUCCESS,
|
||||||
|
/**
|
||||||
|
* Represents a memory allocation failure.
|
||||||
|
*/
|
||||||
|
LIBLEX_MALLOC,
|
||||||
|
/**
|
||||||
|
* Represents an invalid pattern.
|
||||||
|
*/
|
||||||
|
LIBLEX_INVALID
|
||||||
|
};
|
||||||
|
|
||||||
|
typedef enum liblex_result_e liblex_result;
|
||||||
|
|
||||||
|
#endif
|
169
include/pattern.h
Normal file
169
include/pattern.h
Normal file
|
@ -0,0 +1,169 @@
|
||||||
|
#ifndef LIBLEX_PATTERN_H
|
||||||
|
#define LIBLEX_PATTERN_H
|
||||||
|
|
||||||
|
#include "liblex.h"
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Enum that represents the type
|
||||||
|
* of a NFA node / state.
|
||||||
|
*/
|
||||||
|
enum pattern_node_type_e {
|
||||||
|
/**
|
||||||
|
* Represents a clear, un-configured node.
|
||||||
|
*/
|
||||||
|
PNODE_CLEAR,
|
||||||
|
/**
|
||||||
|
* Represents a single value to be matched.
|
||||||
|
*/
|
||||||
|
PNODE_VALUE,
|
||||||
|
/**
|
||||||
|
* Represents a range of values, inclusive.
|
||||||
|
*/
|
||||||
|
PNODE_RANGE,
|
||||||
|
/**
|
||||||
|
* Represents any character other than the NULL terminator.
|
||||||
|
*/
|
||||||
|
PNODE_ANY,
|
||||||
|
/**
|
||||||
|
* Represents a "connection" between nodes, does not
|
||||||
|
* match any value.
|
||||||
|
* */
|
||||||
|
PNODE_CONNECT,
|
||||||
|
/**
|
||||||
|
* Represents a fork / divide in possible "next" states.
|
||||||
|
*/
|
||||||
|
PNODE_FORK,
|
||||||
|
/**
|
||||||
|
* Represents a succesfully matched pattern.
|
||||||
|
*/
|
||||||
|
PNODE_END
|
||||||
|
};
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Struct representing a single NFA node / state.
|
||||||
|
*/
|
||||||
|
struct pattern_node_s {
|
||||||
|
/**
|
||||||
|
* The type of this node.
|
||||||
|
*/
|
||||||
|
enum pattern_node_type_e type;
|
||||||
|
/**
|
||||||
|
* The id of this node.
|
||||||
|
* The id is unique within the pattern.
|
||||||
|
*/
|
||||||
|
int id;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* The node's data that varies based on type.
|
||||||
|
*/
|
||||||
|
union {
|
||||||
|
/**
|
||||||
|
* Data for a "value" node.
|
||||||
|
*/
|
||||||
|
struct {
|
||||||
|
/**
|
||||||
|
* The value this node matches.
|
||||||
|
*/
|
||||||
|
char value;
|
||||||
|
/**
|
||||||
|
* The next state in the pattern.
|
||||||
|
*/
|
||||||
|
struct pattern_node_s* next;
|
||||||
|
} value_s;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Data for a "range" node.
|
||||||
|
*/
|
||||||
|
struct {
|
||||||
|
/**
|
||||||
|
* The beginning of the range, inclusive, of matched values.
|
||||||
|
*/
|
||||||
|
char from;
|
||||||
|
/**
|
||||||
|
* The end of the range, inclusive, of matched values.
|
||||||
|
*/
|
||||||
|
char to;
|
||||||
|
/**
|
||||||
|
* The next state in the pattern.
|
||||||
|
*/
|
||||||
|
struct pattern_node_s* next;
|
||||||
|
} range_s;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Data for an "any" node.
|
||||||
|
*/
|
||||||
|
struct {
|
||||||
|
/**
|
||||||
|
* The next state in the pattern.
|
||||||
|
*/
|
||||||
|
struct pattern_node_s* next;
|
||||||
|
} any_s;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Data for a "connect" node.
|
||||||
|
*/
|
||||||
|
struct {
|
||||||
|
/**
|
||||||
|
* The next node in the pattern.
|
||||||
|
*/
|
||||||
|
struct pattern_node_s* next;
|
||||||
|
} connect_s;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Data for a "fork" node.
|
||||||
|
*/
|
||||||
|
struct {
|
||||||
|
/**
|
||||||
|
* The left node in the fork.
|
||||||
|
*/
|
||||||
|
struct pattern_node_s* left;
|
||||||
|
/**
|
||||||
|
* The right node in the fork.
|
||||||
|
*/
|
||||||
|
struct pattern_node_s* right;
|
||||||
|
} fork_s;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Data for an "end" node.
|
||||||
|
*/
|
||||||
|
struct {
|
||||||
|
/**
|
||||||
|
* The ID of the pattern that just finished matching.
|
||||||
|
*/
|
||||||
|
int pattern_id;
|
||||||
|
} end_s;
|
||||||
|
} data_u;
|
||||||
|
};
|
||||||
|
|
||||||
|
/**
|
||||||
|
* A chain of pattern nodes.
|
||||||
|
*/
|
||||||
|
struct pattern_chain_s {
|
||||||
|
/**
|
||||||
|
* The beginning of the chain, its first state.
|
||||||
|
*/
|
||||||
|
struct pattern_node_s* head;
|
||||||
|
/**
|
||||||
|
* The end of the chain, its last state.
|
||||||
|
*/
|
||||||
|
struct pattern_node_s* tail;
|
||||||
|
};
|
||||||
|
|
||||||
|
typedef enum pattern_node_type_e pattern_node_type;
|
||||||
|
typedef struct pattern_node_s pattern_node;
|
||||||
|
typedef struct pattern_chain_s pattern_chain;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Compiles a string representation of a pattern into a pattern NFA,
|
||||||
|
* and stores the first node of the new NFA in root.
|
||||||
|
* @param root the node to store the resulting pattern into.
|
||||||
|
* @param expression the pattern represented as a string.
|
||||||
|
* @return LIBLEX_SUCCESS if all goes well, otherwise some other liblex_result.
|
||||||
|
*/
|
||||||
|
liblex_result pattern_compile(pattern_node** root, char* expression);
|
||||||
|
/**
|
||||||
|
* Frees a pattern NFA allocated by pattern_compile.
|
||||||
|
*/
|
||||||
|
void pattern_free(pattern_node* root);
|
||||||
|
|
||||||
|
#endif
|
Loading…
Reference in New Issue
Block a user