/* compile_regexes.c -- forked from festvox/flite */
/*************************************************************************/
/* */
/* Language Technologies Institute */
/* Carnegie Mellon University */
/* Copyright (c) 2008 */
/* All Rights Reserved. */
/* */
/* Permission is hereby granted, free of charge, to use and distribute */
/* this software and its documentation without restriction, including */
/* without limitation the rights to use, copy, modify, merge, publish, */
/* distribute, sublicense, and/or sell copies of this work, and to */
/* permit persons to whom this work is furnished to do so, subject to */
/* the following conditions: */
/* 1. The code must retain the above copyright notice, this list of */
/* conditions and the following disclaimer. */
/* 2. Any modifications must be clearly marked as such. */
/* 3. Original authors' names are not deleted. */
/* 4. The authors' names are not used to endorse or promote products */
/* derived from this software without specific prior written */
/* permission. */
/* */
/* CARNEGIE MELLON UNIVERSITY AND THE CONTRIBUTORS TO THIS WORK */
/* DISCLAIM ALL WARRANTIES WITH REGARD TO THIS SOFTWARE, INCLUDING */
/* ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS, IN NO EVENT */
/* SHALL CARNEGIE MELLON UNIVERSITY NOR THE CONTRIBUTORS BE LIABLE */
/* FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES */
/* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN */
/* AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, */
/* ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF */
/* THIS SOFTWARE. */
/* */
/*************************************************************************/
/* Author: Alan W Black (awb@cs.cmu.edu) */
/* Date: May 2008 */
/*************************************************************************/
/* */
/* To avoid an initialization phase where regexes need to be set up we */
/* precompile them into statics that can be used directly -- */
/* (dhd championed this technique, and this is a reimplementation of */
/* his compilation technique) */
/* */
/*************************************************************************/
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <sys/time.h>
#include <unistd.h>
#include "flite.h"
/*
 * Print the command-line synopsis and terminate the program.
 *
 * This is only called when the tool was invoked with the wrong number of
 * arguments, so the text goes to stderr and the exit status is a failure:
 * stdout carries the generated C code and is normally redirected into a
 * source file, which must not silently end up containing usage text.
 *
 * Does not return.
 */
static void compregex_usage(void)
{
    fprintf(stderr, "compregex: compile regexes into C structures\n");
    fprintf(stderr, "usage: compregex name regex\n"
            " Compiles regex into a C structure called name\n");
    exit(EXIT_FAILURE);
}
/*
 * Write C source to stdout that defines a precompiled copy of a regex.
 *
 * Three definitions are emitted:
 *   static const unsigned char NAME_rxprog[]  - the bytes of rgx->program
 *   static const cst_regex     NAME_rx        - the structure itself
 *   const cst_regex * const    NAME           - pointer to NAME_rx
 *
 * name: identifier prefix used for the generated symbols; it is pasted
 *       into the output verbatim, so it must be a valid C identifier.
 * rgx:  compiled regex to dump; must not be NULL.
 */
static void regex_to_C(const char *name, const cst_regex *rgx)
{
    int i;

    /* Program bytes as decimal initializers, 16 per output row. */
    printf("static const unsigned char %s_rxprog[] = {\n ",name);
    for (i=0; i<rgx->regsize; i++)
    {
        printf("%d, ", (unsigned char)rgx->program[i]);
        if (i%16 == 15)
            printf("\n ");
    }
    printf("\n};\n");

    /*
     * Positional initializer for the structure.
     * NOTE(review): the field order written here (regstart, reganch,
     * regmust, regmlen, regsize, program) presumably mirrors the
     * declaration of cst_regex -- confirm against the header.
     */
    printf("static const cst_regex %s_rx = {\n ",name);
    printf("%d, ",rgx->regstart);
    printf("%d, ",rgx->reganch);
    if (rgx->regmust == NULL)
        printf("NULL, ");
    else
    {
        /*
         * regmust is re-expressed as an offset into the emitted program
         * array (this assumes it points inside rgx->program).  The array
         * is const unsigned char, so cast it the same way the program
         * field below is cast; without the cast the generated initializer
         * has an incompatible pointer type.
         */
        printf("(char *)%s_rxprog + %ld, ", name,
               (long int)(rgx->regmust - rgx->program));
    }
    printf("%d, ",rgx->regmlen);
    printf("%d,\n ",rgx->regsize);
    printf("(char *)%s_rxprog\n",name);
    printf("};\n");

    /* Public handle that the rest of the library refers to. */
    printf("const cst_regex * const %s = &%s_rx;\n\n",name, name);
}
/*
 * Entry point: compregex NAME REGEX
 *
 * Compiles REGEX (argv[2]) with new_cst_regex() and writes its C
 * representation, using NAME (argv[1]) as the symbol prefix, to stdout.
 *
 * Returns 0 on success and 1 if the regex could not be compiled.  A wrong
 * argument count is handled by compregex_usage(), which exits the process.
 */
int main(int argc, char **argv)
{
    cst_regex *rgx;

    if (argc != 3)
        compregex_usage();      /* exits; does not return */

    rgx = new_cst_regex(argv[2]);
    if (rgx == NULL)
    {
        /*
         * NOTE(review): whether new_cst_regex() can return NULL is not
         * visible from this file; the guard is here because regex_to_C()
         * dereferences the pointer unconditionally.
         */
        fprintf(stderr, "compregex: failed to compile regex \"%s\"\n",
                argv[2]);
        return 1;
    }

    regex_to_C(argv[1],rgx);
    delete_cst_regex(rgx);

    return 0;
}