8 #include <ecoli_malloc.h>
10 #include <ecoli_test.h>
11 #include <ecoli_strvec.h>
12 #include <ecoli_node.h>
13 #include <ecoli_node_many.h>
14 #include <ecoli_node_or.h>
15 #include <ecoli_node_str.h>
16 #include <ecoli_node_int.h>
17 #include <ecoli_node_re_lex.h>
/*
 * One entry of the lexer's pattern table.
 * The member declarations are not visible in this excerpt; elsewhere in
 * this file the entries are accessed through .pattern (released with
 * ec_free), .r (handed to regcomp/regexec/regfree) and .keep (tested
 * against 0 in tokenize).
 */
19 struct regexp_pattern {
/*
 * Private data of a re_lex node.
 * NOTE(review): further members (for instance the `len` that other code
 * in this file uses as the number of table entries) are declared on lines
 * not visible in this excerpt.
 */
25 struct ec_node_re_lex {
/* node that parses the token vector built from the input string */
27 struct ec_node *child;
/* array of regexp patterns; reallocated when a pattern is added */
28 struct regexp_pattern *table;
/*
 * Split str into tokens with the regexps of table (table_len entries) and
 * collect the tokens in a newly created string vector.
 *
 * NOTE(review): the declarations of dup, off, pos, c, ret and i, the code
 * that advances through the string and the error/return paths are on
 * lines not visible in this excerpt; the comments below only describe
 * the statements that are shown.
 */
32 static struct ec_strvec *
33 tokenize(struct regexp_pattern *table, size_t table_len, const char *str)
35 struct ec_strvec *strvec = NULL;
47 strvec = ec_strvec_new();
/* try each pattern of the table at the current offset */
53 for (i = 0; i < table_len; i++) {
/* a single match slot is requested: pos receives the overall match */
54 ret = regexec(&table[i].r, &dup[off], 1, &pos, 0);
/*
 * Tests for a match that does not start at the current offset
 * (rm_so != 0) or that is empty (rm_eo == 0). The branch body is not
 * visible; presumably such a match is ignored -- confirm.
 */
57 if (pos.rm_so != 0 || pos.rm_eo == 0) {
/*
 * Patterns registered with keep == 0 take a separate branch (body not
 * visible); presumably their match is consumed without being added to
 * the vector -- confirm.
 */
62 if (table[i].keep == 0)
/*
 * Temporarily write a NUL right after the match so that &dup[off] is a
 * C string holding exactly the token; the overwritten character is saved
 * in c and put back once the token has been logged and added.
 */
65 c = dup[pos.rm_eo + off];
66 dup[pos.rm_eo + off] = '\0';
67 ec_log(EC_LOG_DEBUG, "re_lex match <%s>\n", &dup[off]);
68 if (ec_strvec_add(strvec, &dup[off]) < 0)
71 dup[pos.rm_eo + off] = c;
/* releases the token vector; presumably the failure path (label not visible) */
86 ec_strvec_free(strvec);
/*
 * Parse callback of the re_lex node type (installed as .parse in
 * ec_node_re_lex_type).
 *
 * Tokenizes the first string of strvec with the node's pattern table and
 * submits the resulting token vector to the child node.
 *
 * NOTE(review): the branch bodies, labels and return statements are on
 * lines not visible in this excerpt.
 */
90 static struct ec_parsed *ec_node_re_lex_parse(const struct ec_node *gen_node,
91 const struct ec_strvec *strvec)
93 struct ec_node_re_lex *node = (struct ec_node_re_lex *)gen_node;
94 struct ec_strvec *new_vec = NULL, *match_strvec;
95 struct ec_parsed *parsed = NULL, *child_parsed;
98 parsed = ec_parsed_new();
/* an empty input vector is handled by a separate branch (body not visible) */
102 if (ec_strvec_len(strvec) == 0)
/* only element 0 of the input vector is tokenized */
105 str = ec_strvec_val(strvec, 0);
106 new_vec = tokenize(node->table, node->len, str);
/*
 * NOTE(review): the separator and the token vector are written to stdout
 * unconditionally; this looks like leftover debugging output -- confirm
 * whether it should go through ec_log instead.
 */
110 printf("--------\n");
111 ec_strvec_dump(stdout, new_vec);
112 child_parsed = ec_node_parse_strvec(node->child, new_vec);
113 if (child_parsed == NULL)
/*
 * The child has to match and the length of its result has to equal the
 * number of tokens; otherwise the token vector and the child result are
 * released.
 */
116 if (!ec_parsed_matches(child_parsed) ||
117 ec_parsed_len(child_parsed) !=
118 ec_strvec_len(new_vec)) {
119 ec_strvec_free(new_vec);
120 ec_parsed_free(child_parsed);
/*
 * NOTE(review): new_vec is also passed to ec_strvec_free() at the end of
 * the function; confirm that the pointer is reset after this call (not
 * visible in this excerpt).
 */
123 ec_strvec_free(new_vec);
/*
 * Attach the child result, then record the match from
 * ec_strvec_ndup(strvec, 0, 1) -- presumably a copy of one element
 * starting at index 0 of the original input vector; confirm.
 */
126 ec_parsed_add_child(parsed, child_parsed);
127 match_strvec = ec_strvec_ndup(strvec, 0, 1);
128 if (match_strvec == NULL)
130 ec_parsed_set_match(parsed, gen_node, match_strvec);
/* releases the token vector and the result; presumably the failure path */
135 ec_strvec_free(new_vec);
136 ec_parsed_free(parsed);
/*
 * free_priv callback of the re_lex node type: releases, for every table
 * entry, the stored pattern string and the compiled regexp, then the
 * table itself and the child node.
 */
141 static void ec_node_re_lex_free_priv(struct ec_node *gen_node)
143 struct ec_node_re_lex *node = (struct ec_node_re_lex *)gen_node;
146 for (i = 0; i < node->len; i++) {
147 ec_free(node->table[i].pattern);
148 regfree(&node->table[i].r);
151 ec_free(node->table);
152 ec_node_free(node->child);
/*
 * Descriptor of the re_lex node type: parse callback, size of the private
 * data and the callback releasing it. The completion callback is
 * commented out (marked XXX), so none is set here.
 */
155 static struct ec_node_type ec_node_re_lex_type = {
157 .parse = ec_node_re_lex_parse,
158 //.complete = ec_node_re_lex_complete, //XXX
159 .size = sizeof(struct ec_node_re_lex),
160 .free_priv = ec_node_re_lex_free_priv,
/* registers the node type through the EC_NODE_TYPE_REGISTER macro */
163 EC_NODE_TYPE_REGISTER(ec_node_re_lex_type);
/*
 * Add a regexp to the pattern table of a re_lex node.
 *
 * gen_node: the re_lex node (cast to struct ec_node_re_lex).
 * pattern:  regexp source; compiled with REG_EXTENDED, and a duplicate of
 *           the string is stored in the new table entry.
 * keep:     stored as-is in the new table entry.
 *
 * NOTE(review): the error handling, the update of node->table/node->len
 * and the return statements are on lines not visible in this excerpt.
 */
165 int ec_node_re_lex_add(struct ec_node *gen_node, const char *pattern, int keep)
167 struct ec_node_re_lex *node = (struct ec_node_re_lex *)gen_node;
168 struct regexp_pattern *table;
170 char *pat_dup = NULL;
173 pat_dup = ec_strdup(pattern);
/* room for one more entry; the result goes to a local, not to node->table */
178 table = ec_realloc(node->table, sizeof(*table) * (node->len + 1));
/* compile directly into the new last slot */
182 ret = regcomp(&table[node->len].r, pattern, REG_EXTENDED);
185 "Regular expression <%s> compilation failed: %d\n",
/* REG_ESPACE (regcomp ran out of memory) is singled out; body not visible */
187 if (ret == REG_ESPACE)
195 table[node->len].pattern = pat_dup;
196 table[node->len].keep = keep;
/*
 * Create a re_lex node with the given id, using the ec_node_re_lex_type
 * descriptor.
 * NOTE(review): the handling of child and of allocation failure, and the
 * return statement, are on lines not visible in this excerpt.
 */
207 struct ec_node *ec_node_re_lex(const char *id, struct ec_node *child)
209 struct ec_node_re_lex *node = NULL;
214 node = (struct ec_node_re_lex *)__ec_node_new(&ec_node_re_lex_type, id);
/*
 * Unit test of the re_lex node: builds a node, registers a set of
 * regexps and checks the parse result on several input strings.
 * NOTE(review): parts of the child expression, the error branches and
 * the return statement are on lines not visible in this excerpt.
 */
226 static int ec_node_re_lex_testcase(void)
228 struct ec_node *node;
/*
 * The child is built from the string nodes "foo" and "bar" and an
 * integer node created with (0, 1000, 0); how they are combined is not
 * visible here.
 */
231 node = ec_node_re_lex(NULL,
234 ec_node_str(NULL, "foo"),
235 ec_node_str(NULL, "bar"),
236 ec_node_int(NULL, 0, 1000, 0)
241 ec_log(EC_LOG_ERR, "cannot create node\n");
/*
 * Letters, digits, "=", "-" and "+" are registered with keep = 1, runs of
 * spaces with keep = 0. The patterns carry no leading '^'.
 */
245 /* XXX add ^ automatically ? */
246 ret |= ec_node_re_lex_add(node, "[a-zA-Z]+", 1);
247 ret |= ec_node_re_lex_add(node, "[0-9]+", 1);
248 ret |= ec_node_re_lex_add(node, "=", 1);
249 ret |= ec_node_re_lex_add(node, "-", 1);
250 ret |= ec_node_re_lex_add(node, "\\+", 1);
251 ret |= ec_node_re_lex_add(node, "[ ]+", 0);
253 ec_log(EC_LOG_ERR, "cannot add regexp to node\n");
/*
 * The second argument is the expected parse result; presumably the number
 * of matched input strings, with -1 meaning no match -- confirm against
 * the definition of EC_TEST_CHECK_PARSE.
 */
258 ret |= EC_TEST_CHECK_PARSE(node, 1, " foo bar 324 bar234");
259 ret |= EC_TEST_CHECK_PARSE(node, 1, "foo bar324");
260 ret |= EC_TEST_CHECK_PARSE(node, 1, "");
261 ret |= EC_TEST_CHECK_PARSE(node, -1, "foobar");
/* Test descriptor: runs ec_node_re_lex_testcase under the name "node_re_lex". */
268 static struct ec_test ec_node_re_lex_test = {
269 .name = "node_re_lex",
270 .test = ec_node_re_lex_testcase,
/* registers the test through the EC_TEST_REGISTER macro */
273 EC_TEST_REGISTER(ec_node_re_lex_test);