Applications/Grep: c/regexParser/regexParser.cc comparison

comparison c/regexParser/regexParser.cc @ 122:188d866227a4 pairPro

fix

author	Masataka Kohagura <kohagura@cr.ie.u-ryukyu.ac.jp>
date	Mon, 30 Nov 2015 23:43:53 +0900
parents	aa266a4db47c
children	c363a66dc1a7 4d6ac69801ad

comparison

equal deleted inserted replaced

-:aa266a4db47c
+:188d866227a4
 #include <stdlib.h>
 #include <stdio.h>
+#include <string.h>
+#include <ctype.h>
 #include "regexParser.h"
 #include "error.h"
 static NodePtr allocateNode();
 static NodePtr createNode(RegexInfoPtr,unsigned char*,NodePtr,NodePtr);
 ri->nodeNumber++;
 if (ri->tokenType == 'a') {
 ri->tokenType = 0;
 n->cc->cond->w = getWord(ri->tokenValue);
-ri->ptr += n->cc->cond->w->length-1;
 } else {
 WordPtr w = (WordPtr)malloc(sizeof(Word));
 w->word = character;
 w->length = 1;
 n->cc->cond->w = w;
 }
 // <charClass> ::= '['<literal>'-'<literal>']'
 //
 // Builds the node for a character class. On entry ri->ptr is used as the
 // start of the class text; the function scans forward to the closing ']',
 // records the characters on either side of each '-' as the range bounds,
 // stores a NUL-terminated copy of the class text in the node's word, and
 // leaves ri->ptr just past the ']'.
 //
 // Returns the newly allocated node.
 static
 NodePtr charClass(RegexInfoPtr ri) {
-NodePtr n = (NodePtr)malloc(sizeof(Node));
+NodePtr n = allocateNode();
 // NOTE(review): n is dereferenced below even when it is NULL, so this is
 // only safe if mallocFailedMessage() never returns -- confirm.
 if (n == NULL) {
 mallocFailedMessage();
 }
-while (ri->ptr[0] == '-') {
-ri->ptr++;
 // Stamp the node with the current token type and a unique node number.
+n->tokenType = ri->tokenType;
+n->nodeNumber = ri->nodeNumber;
+ri->nodeNumber++;
 // NOTE(review): the result of this malloc is not checked before use.
+n->cc->cond->w = (WordPtr)malloc(sizeof(Word));
+int i = 0;
 // Scan to the closing ']'; i ends up as the length of the class text.
 // NOTE(review): the loop stops only on ']', so a pattern without a closing
 // bracket reads past the string terminator.
+while (ri->ptr[i] != ']') {
+if (ri->ptr[i] == '-') {
 // NOTE(review): when '-' is the first character (i == 0) this reads
 // ri->ptr[-1]; with several '-' only the last range is kept.
+n->cc->begin = ri->ptr[i-1];
+n->cc->end = ri->ptr[i+1];
+}
+i++;
 }
 // Allocate i+1 bytes: the i characters of the class text plus a terminator.
+n->cc->cond->w->word = (unsigned char*)malloc(sizeof(unsigned char)*(i+1));
 // strncpy copies i+1 bytes (including the ']' when no NUL precedes it);
 // the byte at index i is then overwritten with the terminator.
+strncpy((char*)n->cc->cond->w->word, (char*)ri->ptr,i+1);
+n->cc->cond->w->word[i] = '\0';
 // NOTE(review): w->length is not assigned anywhere in this function.
 // Advance the input past the class text and its closing ']'.
+ri->ptr += i+1;
 return n;
 }
 // <literal> ::= [a-zA-Z0-9]+
 static
 ri->tokenType = ')';
 ri->tokenValue = ri->ptr;
 return;
 } else if (ri->ptr[0] == '[') {
 ri->ptr++;
-ri->tokenType = '[';
+ri->tokenType = 'c';
 ri->tokenValue = ri->ptr;
 if (ri->ptr[1] == ']') {
 ri->ptr++;
 }
 return;
 \utf-8 etc...
 */
 } else {
 ri->tokenType = 'a';
 ri->tokenValue = ri->ptr;
-ri->ptr++;
+while (isalnum(ri->ptr[0])) {
+ri->ptr++;
+}
 return;
 }
 }
 return;
 }
 // Parses one atom: reads the next token with token(ri) and dispatches on
 // ri->tokenType -- 'a' to literal(), 'c' (set by token() for '[') to
 // charClass(), '(' to group().
 // Returns the node built by the chosen parser, or NULL when the token type
 // matches none of these.
 NodePtr regexAtom(RegexInfoPtr ri) {
 token(ri);
 NodePtr n = NULL;
 if (ri->tokenType == 'a') n = literal(ri);
-else if (ri->tokenType == '[') n = charClass(ri);
+else if (ri->tokenType == 'c') n = charClass(ri);
 else if (ri->tokenType == '(') n = group(ri);
 return n;
 }
-// <regex> ::= <regexAtom>|<regexAtom>'*'|<regexAtom>'|'<regex>|<regexAtom><regex>
+// <regex> ::= <regexAtom> | <regexAtom><regex>'*' | <regexAtom>'*' | <regexAtom>'|'<regex> | <regexAtom><regex> | '('<regex>')'
 NodePtr regex(RegexInfoPtr ri) {
 NodePtr n = regexAtom(ri);
 while (ri->ptr[0]) {
 token(ri);
 if (ri->tokenType == '*') {

Mercurial > hg > Applications > Grep

comparison c/regexParser/regexParser.cc @ 122:188d866227a4 pairPro