Mercurial > hg > Applications > Grep
annotate regexParser/CeriumGrep.cc @ 312:c9ac6f06e706
add loop
author | Shinji KONO <kono@ie.u-ryukyu.ac.jp> |
---|---|
date | Tue, 09 Feb 2016 10:59:22 +0900 |
parents | bdfe0a32c48f |
children | a4484c02cba5 |
rev | line source |
---|---|
45 | 1 #include <stdio.h> |
56
8901bc071d33
implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
55
diff
changeset
|
2 #include <stdlib.h> |
8901bc071d33
implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
55
diff
changeset
|
3 #include <string.h> |
235
4aab1e93a971
fix condition grepWalk.cc
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
232
diff
changeset
|
4 #include <unistd.h> |
266 | 5 #include "CeriumGrep.h" |
216 | 6 #include "subsetConstruction.h" |
190
3e8e5780ad4a
change node::State to State
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
189
diff
changeset
|
7 #include "node.h" |
231
d67649929e96
add grepWalk
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
228
diff
changeset
|
8 #include "grepWalk.h" |
232
1a34e702776a
add fileread.cc
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
231
diff
changeset
|
9 #include "fileread.h" |
260
3f3c9902bb6d
initialize node in allocateNode()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
259
diff
changeset
|
10 #include "threadedSearch.h" |
312 | 11 #include "generateSequentialSearch.h" |
76 | 12 |
266 | 13 Search grep(int argc,char **argv,bool parallel) |
55 | 14 { |
216 | 15 bool generate = true; |
16 bool subset = false; | |
312 | 17 void (*generateSequentialSearch)(TransitionGeneratorPtr) = NULL; |
260
3f3c9902bb6d
initialize node in allocateNode()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
259
diff
changeset
|
18 bool ts = false; |
269
3a95be4a5bb0
filename=NULL initialized
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
268
diff
changeset
|
19 char *filename = NULL; |
266 | 20 Search s; |
269
3a95be4a5bb0
filename=NULL initialized
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
268
diff
changeset
|
21 s.filename = 0; |
266 | 22 s.tg = NULL; |
216 | 23 |
178
5e8c6857934c
implement charClassMerge
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
167
diff
changeset
|
24 RegexInfo ri; |
5e8c6857934c
implement charClassMerge
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
167
diff
changeset
|
25 ri.stateNumber = 1; |
56
8901bc071d33
implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
55
diff
changeset
|
26 for (int i = 1; i < argc; i++) { |
8901bc071d33
implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
55
diff
changeset
|
27 if (strcmp(argv[i],"-regex") == 0) { |
178
5e8c6857934c
implement charClassMerge
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
167
diff
changeset
|
28 ri.ptr = (unsigned char*)argv[i+1]; i++; |
216 | 29 } else if (strcmp(argv[i],"-noGeneration") == 0) { |
30 generate = false; | |
31 } else if (strcmp(argv[i],"-subset") == 0) { | |
32 subset = true; | |
228
399380ad95b7
fix generateTransitionGenerator
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
222
diff
changeset
|
33 } else if (strcmp(argv[i],"-seq") == 0) { |
312 | 34 generateSequentialSearch = exportState; |
35 } else if (strcmp(argv[i],"-loop") == 0) { | |
36 generateSequentialSearch = exportStateLoop; | |
37 } else if (strcmp(argv[i],"-cbc") == 0) { | |
38 generateSequentialSearch = exportStateCbC; | |
232
1a34e702776a
add fileread.cc
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
231
diff
changeset
|
39 } else if (strcmp(argv[i],"-file") == 0) { |
266 | 40 s.filename = filename = argv[i+1]; i++; |
260
3f3c9902bb6d
initialize node in allocateNode()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
259
diff
changeset
|
41 } else if (strcmp(argv[i],"-ts") == 0) { |
3f3c9902bb6d
initialize node in allocateNode()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
259
diff
changeset
|
42 ts = true; |
56
8901bc071d33
implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
55
diff
changeset
|
43 } |
8901bc071d33
implement string() and literal()
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
55
diff
changeset
|
44 } |
266 | 45 if (!ri.ptr) return s; |
216 | 46 |
178
5e8c6857934c
implement charClassMerge
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
167
diff
changeset
|
47 printf("regex : %s\n",ri.ptr); |
216 | 48 NodePtr n = regex(&ri); // parse only |
214
a94f57af1600
remove allocateCCstate createCCState
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
195
diff
changeset
|
49 printTree(n); |
216 | 50 |
231
d67649929e96
add grepWalk
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
228
diff
changeset
|
51 TGValue tgv; |
219
a8e477f1352d
add an example for subset construction
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
217
diff
changeset
|
52 if (generate && !subset) { // NFA generation |
231
d67649929e96
add grepWalk
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
228
diff
changeset
|
53 tgv = generateTransitionList(n); |
217 | 54 printTree(n); |
216 | 55 printState(tgv.tg); |
228
399380ad95b7
fix generateTransitionGenerator
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
222
diff
changeset
|
56 if (generateSequentialSearch) { |
399380ad95b7
fix generateTransitionGenerator
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
222
diff
changeset
|
57 exportState(tgv.tg); |
399380ad95b7
fix generateTransitionGenerator
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
222
diff
changeset
|
58 } |
216 | 59 } else if (subset) { |
231
d67649929e96
add grepWalk
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
228
diff
changeset
|
60 tgv = generateTransitionList(n); |
249
9493800265a8
remove SCValue(not all remove)
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
235
diff
changeset
|
61 subsetConstruction(tgv.tg); // Determinization |
216 | 62 printState(tgv.tg); |
228
399380ad95b7
fix generateTransitionGenerator
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
222
diff
changeset
|
63 if (generateSequentialSearch) { |
312 | 64 generateSequentialSearch(tgv.tg); |
228
399380ad95b7
fix generateTransitionGenerator
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
222
diff
changeset
|
65 } |
216 | 66 } |
231
d67649929e96
add grepWalk
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
228
diff
changeset
|
67 |
266 | 68 if (filename != NULL && !parallel) { |
232
1a34e702776a
add fileread.cc
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
231
diff
changeset
|
69 int fd = 0; |
1a34e702776a
add fileread.cc
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
231
diff
changeset
|
70 st_mmap_t st_mmap = createSt_mmap(filename,fd); |
1a34e702776a
add fileread.cc
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
231
diff
changeset
|
71 Buffer buff = createBuffer(st_mmap); |
262
157f6886ba55
write driver of threadedSearch
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
260
diff
changeset
|
72 if (ts) threadedSearch(tgv.tg,buff); |
299 | 73 else grepWalk(tgv.tg,buff); |
235
4aab1e93a971
fix condition grepWalk.cc
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
232
diff
changeset
|
74 close(fd); |
232
1a34e702776a
add fileread.cc
Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
parents:
231
diff
changeset
|
75 } |
266 | 76 |
77 s.tg = tgv.tg; | |
78 return s; | |
45 | 79 } |