annotate c/regexParser/main.cc @ 69:eecddded9b91

implement printTree
author Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
date Wed, 12 Aug 2015 15:10:50 +0900
parents d27b3af1fe75
children 87dff3a124ab
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
55
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 54
diff changeset
1 /*
56
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
2 * <literal> ::= [a-z][A-Z][0-9]
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
3 * <charClass> ::= '['<literal>'-'<literal>']'
58
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
4 * <group> ::= '('<regex>')'
66
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
5 * <regexAtom> ::= <literal>|<charClass>|<group>
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
6 * <regex> ::= <regexAtom>|<regexAtom>'*'|<regexAtom>'|'<regex>|<regexAtom><regex>
55
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 54
diff changeset
7 */
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 54
diff changeset
8
45
89a198fa6b23 add dfrTobin
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
9 #include <stdio.h>
56
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
10 #include <stdlib.h>
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
11 #include <string.h>
57
71b497d25273 fix literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 56
diff changeset
12
63
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
/*
 * Payload type for a character-class node: a 256-entry byte table together
 * with the head of a singly linked list of ranges.
 * NOTE(review): nothing in this file fills in or reads these fields yet, so
 * their exact meaning (e.g. table as per-byte membership flags) is presumed —
 * confirm once charClass() is finished.
 */
typedef struct charClass {
    unsigned char table[256];       /* 256 slots; presumably indexed by byte value */
    struct utf8Range {
        unsigned char *begin;       /* range start (pointer into some byte buffer) */
        unsigned char *end;         /* range end */
        struct utf8Range *next;     /* next range in the list */
    } *rangeList;                   /* head of the range list */
} CharClass, *CharClassPtr;
63
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
21
56
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
22 typedef struct node {
63
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
23 unsigned char type;
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
24 union value {
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
25 charClass *cc;
67
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
26 unsigned char character;
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
27 } Value, *ValuePtr;
58
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
28 struct node *self;
68
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
29 struct node *parent;
56
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
30 struct node *left;
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
31 struct node *right;
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
32 } Node, *NodePtr;
52
a2826bf4e80a remove magic number
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 51
diff changeset
33
64
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
34 unsigned char *ptr;
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
35 unsigned char tokenType;
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
36 int tokenValue;
58
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
37 NodePtr regexHeadNode;
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
38
56
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
39 NodePtr charClass();
58
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
40 NodePtr group();
63
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
41 NodePtr orexp();
56
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
42 NodePtr asterisk();
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
43 NodePtr regex();
67
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
44 NodePtr createNode(unsigned char,NodePtr,NodePtr);
64
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
45 extern void token();
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
46 extern NodePtr regexAtom();
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
47
55
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 54
diff changeset
48
62
a49b4a8b8c14 implement isLiteral
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 61
diff changeset
/*
 * Report whether the byte c is an ordinary (literal) character of a regex.
 *
 * c is examined as an unsigned byte so that bytes above 0x7f (e.g. the bytes
 * of a multi-byte UTF-8 sequence) are recognised even where plain char is
 * signed.
 *
 * Returns false for the metacharacters '(', '[', '|' and '*', true for every
 * other byte.
 *
 * The previous implementation ignored its argument and classified the byte
 * under the global cursor instead; the argument is now what gets classified.
 * NOTE(review): ')' is treated as a literal here although token() handles it
 * as a token of its own — confirm whether that is intended.
 */
bool isLiteral(char c) {
    const unsigned char byte = (unsigned char)c;

    if (byte > 0x7f) {
        return true;
    }
    switch (byte) {
    case '(':
    case '[':
    case '|':
    case '*':
        return false;
    default:
        return true;
    }
}
a49b4a8b8c14 implement isLiteral
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 61
diff changeset
57
60
8616a045a7f4 impl asterisk
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 59
diff changeset
58 void printNodeDate(NodePtr n) {
8616a045a7f4 impl asterisk
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 59
diff changeset
59 puts("---------------------");
67
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
60 printf("Self Node char : %c\n", n->Value.character);
60
8616a045a7f4 impl asterisk
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 59
diff changeset
61 printf("Self Node addr : %p\n", n->self);
8616a045a7f4 impl asterisk
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 59
diff changeset
62 printf("left Node addr : %p\n", n->left);
8616a045a7f4 impl asterisk
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 59
diff changeset
63 printf("right Node addr : %p\n", n->right);
8616a045a7f4 impl asterisk
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 59
diff changeset
64 puts("---------------------");
8616a045a7f4 impl asterisk
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 59
diff changeset
65 puts("");
8616a045a7f4 impl asterisk
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 59
diff changeset
66 }
8616a045a7f4 impl asterisk
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 59
diff changeset
67
67
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
68 NodePtr createNode(unsigned char character, NodePtr left, NodePtr right) {
57
71b497d25273 fix literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 56
diff changeset
69 NodePtr n = (NodePtr)malloc(sizeof(Node));
58
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
70 n->self = n;
67
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
71 n->Value.character = character;
56
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
72 n->left = left;
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
73 n->right = right;
58
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
74
60
8616a045a7f4 impl asterisk
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 59
diff changeset
75 printNodeDate(n);
56
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
76 return n;
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
77 }
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
78
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
79 // <charClass> ::= '['<literal>'-'<literal>']'
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
80 NodePtr charClass() {
62
a49b4a8b8c14 implement isLiteral
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 61
diff changeset
81 NodePtr n = (NodePtr)malloc(sizeof(Node));
67
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
82 unsigned char startChar = *ptr;
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
83 while (*ptr == '-') {
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
84 ptr++;
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
85 }
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
86 unsigned char endChar = *ptr;
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
87 unsigned char *charTable = (unsigned char*)malloc(sizeof(char)*256);
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
88
62
a49b4a8b8c14 implement isLiteral
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 61
diff changeset
89 return n;
56
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
90 }
55
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 54
diff changeset
91
56
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
92 // <literal> ::= [a-z][A-Z][0-9]
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
93 NodePtr literal() {
65
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 64
diff changeset
94 NodePtr n = createNode(*ptr,0,0);
57
71b497d25273 fix literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 56
diff changeset
95 ptr++;
71b497d25273 fix literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 56
diff changeset
96 return n;
56
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
97 }
55
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 54
diff changeset
98
63
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
99 // <group> ::= '('<regex>')'
58
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
100 NodePtr group() {
63
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
101 token();
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
102 NodePtr n = regex();
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
103 token();
58
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
104 if (*ptr == ')') {
63
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
105 n = createNode('(',n,0);
58
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
106 } else {
63
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
107 // ) reqiured
58
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
108 }
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
109 return n;
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
110 }
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
111
55
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 54
diff changeset
112
63
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
113 void token() {
58
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
114 while (*ptr != '\0') {
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
115 if ((*ptr == '(') || (*ptr == ')')) {
63
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
116 tokenType = *ptr++;
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
117 tokenValue = 0;
67
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
118 if (ptr[1] == ')') {
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
119 ptr++;
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
120 }
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
121 return;
58
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
122 } else if (*ptr == '[') {
63
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
123 tokenType = '[';
64
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
124 tokenValue = *ptr;
63
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
125 if (ptr[1] == ']') {
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
126 ptr++;
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
127 }
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
128 return;
58
4053c3e0fa7f implement group()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 57
diff changeset
129 } else if (*ptr == '|'){
63
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
130 tokenType = '|';
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
131 tokenValue = 0;
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
132 return;
60
8616a045a7f4 impl asterisk
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 59
diff changeset
133 } else if (*ptr == '*'){
63
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
134 tokenType = '*';
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
135 tokenValue = 0;
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
136 return;
56
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
137 }
63
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
138
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
139 tokenType = 'a';
64
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
140 tokenValue = *ptr;
65
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 64
diff changeset
141 return;
63
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
142
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
143 if (*ptr == '\\') ptr++; // need more proccesing
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
144 /*
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
145 \277
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
146 \0xa5
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
147 \[
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
148 \\
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
149 \utf-8 etc...
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
150 */
8fd3d35e9861 add token function
masa
parents: 62
diff changeset
151
55
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 54
diff changeset
152 }
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 54
diff changeset
153 }
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 54
diff changeset
154
64
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
155 // <regexAtom> ::= <literal>|<charClass>|<group>
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
156 NodePtr regexAtom() {
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
157
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
158 token();
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
159 NodePtr n = NULL;
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
160 if (tokenType == 'a') n = literal();
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
161 else if (tokenType == '[') n = charClass();
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
162 else if (tokenType == '(') n = group();
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
163
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
164 return n;
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
165 }
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
166
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
167 // <regex> ::= <regexAtom>|<regexAtom>'*'|<regexAtom>'|'<regex>|<regexAtom><regex>
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
168 NodePtr regex() {
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
169 NodePtr n = regexAtom();
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
170 while (*ptr) {
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
171 token();
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
172 if (tokenType == '*') {
66
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
173 n = createNode('*',n,0); ptr++;
64
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
174 } else if (tokenType == '|') {
66
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
175 ptr++;
64
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
176 NodePtr n1 = regex();
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
177 n = createNode('|',n,n1);
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
178 } else {
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
179 NodePtr n1 = regex();
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
180 n = createNode('+',n,n1);
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
181 }
67
4842ca2cf8ee print character
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 66
diff changeset
182 } return n;
68
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
183 }
66
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
184 /*
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
185 * e.g.
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
186 *
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
187 * % ./regexParser -regex abc
68
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
188 * c
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
189 * +
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
190 * b
66
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
191 * +
68
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
192 * a
66
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
193 *
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
194 * % ./regexParser -regex (a*|bc)d
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
195 *
68
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
196 * d
66
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
197 * +
68
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
198 * c
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
199 * +
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
200 * b
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
201 * |
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
202 * *
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
203 * a
66
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
204 */
68
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
205
69
eecddded9b91 implement printTree
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 68
diff changeset
206 void descendTree(NodePtr n) {
eecddded9b91 implement printTree
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 68
diff changeset
207 static int d = 0;
68
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
208 if (n->right != NULL) {
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
209 d++;
69
eecddded9b91 implement printTree
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 68
diff changeset
210 descendTree(n->right);
eecddded9b91 implement printTree
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 68
diff changeset
211 d--;
eecddded9b91 implement printTree
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 68
diff changeset
212 }
eecddded9b91 implement printTree
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 68
diff changeset
213 printf("%*c%c\n",d*4, ' ',n->Value.character);
eecddded9b91 implement printTree
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 68
diff changeset
214 if (n->left != NULL) {
68
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
215 d++;
69
eecddded9b91 implement printTree
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 68
diff changeset
216 descendTree(n->left);
eecddded9b91 implement printTree
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 68
diff changeset
217 d--;
68
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
218 }
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
219 }
d27b3af1fe75 remove string()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 67
diff changeset
220
66
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
221 void printTree(NodePtr n) {
69
eecddded9b91 implement printTree
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 68
diff changeset
222 descendTree(n);
66
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
223 }
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
224
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
225
62
a49b4a8b8c14 implement isLiteral
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 61
diff changeset
226 int main(int argc, char **argv)
55
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 54
diff changeset
227 {
56
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
228 for (int i = 1; i < argc; i++) {
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
229 if (strcmp(argv[i],"-regex") == 0) {
64
e0ad6c145f89 remove some errors
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 63
diff changeset
230 ptr = (unsigned char*)argv[i+1]; i++;
56
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
231 }
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
232 }
55
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 54
diff changeset
233
56
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
234 printf("regex : %s\n",ptr);
8901bc071d33 implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents: 55
diff changeset
235 NodePtr n = regex();
66
f8fb3b463f70 fix when '|' come procces
Masataka Kohagura <e085726@ie.u-ryukyu.ac.jp>
parents: 65
diff changeset
236 printTree(n);
45
89a198fa6b23 add dfrTobin
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
237 return 0;
89a198fa6b23 add dfrTobin
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
238 }