1 #ifndef SRC_REGEX_H_
2 #define SRC_REGEX_H_
3 
4 #include <stdbool.h>
5 #include <stdio.h>
6 
7 #ifdef USE_PCRE2
8 #include <pcre2.h>
9 #else
10 #include <pcre.h>
11 #endif
12 
13 #include "dso.h"
14 
15 enum { REGEX_MATCH,
16        REGEX_MATCH_PARTIAL,
17        REGEX_NO_MATCH,
18        REGEX_ERROR = -1,
19 };
20 
21 struct regex_data;
22 
23 #ifdef USE_PCRE2
24 struct regex_error_data {
25 	int error_code;
26 	PCRE2_SIZE error_offset;
27 };
28 #else
29 struct regex_error_data {
30 	char const *error_buffer;
31 	int error_offset;
32 };
33 #endif
34 
35 struct mmap_area;
36 
37 /**
38  * regex_arch_string return a string that represents the pointer width, the
39  * width of what the backend considers a size type, and the endianness of the
40  * system that this library was build for. (e.g. for x86_64: "8-8-el").
41  * This is required when loading stored regular espressions. PCRE2 regular
42  * expressions are not portable across architectures that do not have a
43  * matching arch-string.
44  */
45 char const *regex_arch_string(void) hidden;
46 
47 /**
48  * regex_verison returns the version string of the underlying regular
49  * regular expressions library. In the case of PCRE it just returns the
50  * result of pcre_version(). In the case of PCRE2, the very first time this
51  * function is called it allocates a buffer large enough to hold the version
52  * string and reads the PCRE2_CONFIG_VERSION option to fill the buffer.
53  * The allocated buffer will linger in memory until the calling process is being
54  * reaped.
55  *
56  * It may return NULL on error.
57  */
58 char const *regex_version(void) hidden;
59 /**
60  * This constructor function allocates a buffer for a regex_data structure.
61  * The buffer is being initialized with zeroes.
62  */
63 struct regex_data *regex_data_create(void) hidden;
64 /**
65  * This complementary destructor function frees the a given regex_data buffer.
66  * It also frees any non NULL member pointers with the appropriate pcreX_X_free
67  * function. For PCRE this function respects the extra_owned field and frees
68  * the pcre_extra data conditionally. Calling this function on a NULL pointer is
69  * save.
70  */
71 void regex_data_free(struct regex_data *regex) hidden;
72 /**
73  * This function compiles the regular expression. Additionally, it prepares
74  * data structures required by the different underlying engines. For PCRE
75  * it calls pcre_study to generate optional data required for optimized
76  * execution of the compiled pattern. In the case of PCRE2, it allocates
77  * a pcre2_match_data structure of appropriate size to hold all possible
78  * matches created by the pattern.
79  *
80  * @arg regex If successful, the structure returned through *regex was allocated
81  *            with regex_data_create and must be freed with regex_data_free.
82  * @arg pattern_string The pattern string that is to be compiled.
83  * @arg errordata A pointer to a regex_error_data structure must be passed
84  *                to this function. This structure depends on the underlying
85  *                implementation. It can be passed to regex_format_error
86  *                to generate a human readable error message.
87  * @retval 0 on success
88  * @retval -1 on error
89  */
90 int regex_prepare_data(struct regex_data **regex, char const *pattern_string,
91 		       struct regex_error_data *errordata) hidden;
92 /**
93  * This function loads a serialized precompiled pattern from a contiguous
94  * data region given by map_area.
95  *
96  * @arg map_area Description of the memory region holding a serialized
97  *               representation of the precompiled pattern.
98  * @arg regex If successful, the structure returned through *regex was allocated
99  *            with regex_data_create and must be freed with regex_data_free.
100  * @arg do_load_precompregex If non-zero precompiled patterns get loaded from
101  *			     the mmap region (ignored by PCRE1 back-end).
102  * @arg regex_compiled Set to true if a precompiled pattern was loaded
103  * 		       into regex, otherwise set to false to indicate later
104  *		       compilation must occur
105  *
106  * @retval 0 on success
107  * @retval -1 on error
108  */
109 int regex_load_mmap(struct mmap_area *map_area,
110 		    struct regex_data **regex,
111 		    int do_load_precompregex,
112 		    bool *regex_compiled) hidden;
113 /**
114  * This function stores a precompiled regular expression to a file.
115  * In the case of PCRE, it just dumps the binary representation of the
116  * precomplied pattern into a file. In the case of PCRE2, it uses the
117  * serialization function provided by the library.
118  *
119  * @arg regex The precomplied regular expression data.
120  * @arg fp A file stream specifying the output file.
121  * @arg do_write_precompregex If non-zero precompiled patterns are written to
122  *			      the output file (ignored by PCRE1 back-end).
123  */
124 int regex_writef(struct regex_data *regex, FILE *fp,
125 		 int do_write_precompregex) hidden;
126 /**
127  * This function applies a precompiled pattern to a subject string and
128  * returns whether or not a match was found.
129  *
130  * @arg regex The precompiled pattern.
131  * @arg subject The subject string.
132  * @arg partial Boolean indicating if partial matches are wanted. A nonzero
133  *              value is equivalent to specifying PCRE[2]_PARTIAL_SOFT as
134  *              option to pcre_exec of pcre2_match.
135  * @retval REGEX_MATCH if a match was found
136  * @retval REGEX_MATCH_PARTIAL if a partial match was found
137  * @retval REGEX_NO_MATCH if no match was found
138  * @retval REGEX_ERROR if an error was encountered during the execution of the
139  *                     regular expression
140  */
141 int regex_match(struct regex_data *regex, char const *subject,
142 		int partial) hidden;
143 /**
144  * This function compares two compiled regular expressions (regex1 and regex2).
145  * It compares the binary representations of the compiled patterns. It is a very
146  * crude approximation because the binary representation holds data like
147  * reference counters, that has nothing to do with the actual state machine.
148  *
149  * @retval SELABEL_EQUAL if the pattern's binary representations are exactly
150  *                       the same
151  * @retval SELABEL_INCOMPARABLE otherwise
152  */
153 int regex_cmp(struct regex_data *regex1, struct regex_data *regex2) hidden;
154 /**
155  * This function takes the error data returned by regex_prepare_data and turns
156  * it in to a human readable error message.
157  * If the buffer given to hold the error message is to small it truncates the
158  * message and indicates the truncation with an ellipsis ("...") at the end of
159  * the buffer.
160  *
161  * @arg error_data Error data as returned by regex_prepare_data.
162  * @arg buffer String buffer to hold the formatted error string.
163  * @arg buf_size Total size of the given buffer in bytes.
164  */
165 void regex_format_error(struct regex_error_data const *error_data, char *buffer,
166 			size_t buf_size) hidden;
167 #endif /* SRC_REGEX_H_ */
168