-
Notifications
You must be signed in to change notification settings - Fork 5
/
Copy pathregex.h
122 lines (101 loc) · 1.83 KB
/
regex.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
#ifndef REGEX_H
#define REGEX_H
#include <stdbool.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
/* MAXN: not referenced anywhere else in this header; presumably a size limit
 * used by the implementation file — TODO confirm against its users. */
#define MAXN 92
/* MAXCAP: number of slots in the captures[] array of struct Capture. */
#define MAXCAP 20
/*
 * swap(x, y): exchange the contents of two lvalues of equal size.
 *
 * The bytes are moved through a temporary buffer with memcpy (<string.h>),
 * so the macro is independent of the operand type. When
 * sizeof(x) != sizeof(y) the buffer is declared with size -1, which the
 * compiler rejects, turning a size mismatch into a build error.
 *
 * Each argument appears more than once in the expansion: pass plain
 * lvalues whose evaluation has no side effects.
 */
#define swap(x,y) \
    do { \
        unsigned char swap_temp[sizeof(x) == sizeof(y) ? (signed)sizeof(x) : -1]; \
        memcpy(swap_temp, &(y), sizeof(x)); \
        memcpy(&(y), &(x), sizeof(x)); \
        memcpy(&(x), swap_temp, sizeof(x)); \
    } while(0)
/*
 * Kinds of regex tokens / tree nodes (the type of Regex.type).
 *
 * Numbering starts at 256 and increases by one per enumerator, so every
 * value lies above the 0..255 range. The token_type table classifies
 * these values as non-operator, surround, unary or binary.
 */
enum Token {
    Lit = 256,      /* presumably a literal character — confirm in the parser */
    Dot,
    Sentinel,
    Paren,
    RParen,
    Optional,
    Star,
    Plus,
    NGOptional,     /* "NG" variants: presumably non-greedy forms — confirm */
    NGStar,
    NGPlus,
    Concat,
    Alternative,    /* last enumerator; token_type has Alternative + 1 entries */
};
/*
 * Opcodes of a compiled program (the type of Instruction.op).
 * Values are the default 0, 1, 2, ... in declaration order.
 */
enum Op {
    Char,   /* presumably compares against Instruction.ch — confirm */
    Any,
    Save,   /* presumably uses Instruction.save_id — confirm */
    Match,
    Split,
    Jmp,
};
/*
 * Classification of a Token; element type of the token_type lookup table.
 * NonOp is 0, so zero-initialized table entries read as NonOp.
 */
enum TokenType {
    NonOp,
    Surround,
    Unary,
    Binary,
};
static const enum TokenType token_type[Alternative + 1] = {
[Char] = NonOp,
[Dot] = NonOp,
[Optional] = Unary,
[Star] = Unary,
[Plus] = Unary,
[NGOptional] = Unary,
[NGStar] = Unary,
[NGPlus] = Unary,
[Concat] = Binary,
[Alternative] = Binary,
[Sentinel] = Surround,
[Paren] = Surround,
};
/*
 * Node of the regex tree, linked through left/right child pointers.
 */
typedef struct Regex
{
    enum Token type;        /* kind of this node */
    union {                 /* anonymous union: the two members share storage */
        char ch;
        int capture_id;
    };
    struct Regex *left;
    struct Regex *right;
} Regex;
/*
 * One instruction of a compiled program; instructions reference each
 * other through the left/right pointers.
 */
typedef struct Instruction
{
    enum Op op;             /* opcode */
    union {                 /* anonymous union: the two members share storage */
        char ch;
        int save_id;
    };
    int timestamp;          /* NOTE(review): purpose not visible in this header — confirm in the matcher */
    struct Instruction *left;
    struct Instruction *right;
} Instruction;
/*
 * A compiled program as returned by compile().
 */
typedef struct Program
{
    Instruction *start;     /* presumably the first instruction — confirm */
    size_t size;            /* presumably the instruction count — confirm */
} Program;
/*
 * Set of capture positions holding up to MAXCAP pointers into a string.
 */
typedef struct Capture
{
    size_t ref;                     /* presumably a reference count (see incRef/decRef) — confirm */
    size_t size;                    /* presumably the number of captures[] slots in use — confirm */
    const char *captures[MAXCAP];
} Capture;
/*
 * Public API. The implementations are not part of this header, so the notes
 * below describe only what the signatures show; anything further is marked
 * as an assumption to verify against the .c file.
 */

/* Regex tree: build from a string (presumably the pattern text — confirm),
 * print (the int argument is undocumented here; possibly an indent/depth —
 * confirm), and destroy. */
Regex *newRegex(const char*);
void printRegex(Regex *, int);
void destroyRegex(Regex *r);

/* Compilation: produce a Program from a Regex tree, and print a Program.
 * NOTE(review): no destroy function for Program is declared in this header —
 * check who owns the result of compile(). */
Program *compile(Regex *);
void printProgram(Program *);

/* Capture objects: creation from a size_t, incRef/decRef (presumably
 * reference counting on Capture.ref — confirm), and updateCapture taking an
 * int and a const char * (presumably slot index and position — confirm). */
Capture *newCapture(size_t);
Capture *incRef(Capture *);
Capture *decRef(Capture *);
Capture *updateCapture(Capture *, int, const char *);

/* Execute a Program against a string; returns bool (presumably whether a
 * match was found). The const char ** / size_t pair presumably is an output
 * array for capture pointers and its length — TODO confirm. */
bool run(Program *, const char *, const char **, size_t);
#endif /* end of include guard: REGEX_H */