WebSVN – spk – Diff – /libspk/src/x2bc/x2bc_common/bod_text_parser.cpp

 #include "bod_text_parser.h"
 #include "../common/strutils.h"
 #include <memory.h>
 //---------------------------------------------------------------------------------
+// ERROR
+const char* bod_text_parser::Error::m_messages[]={
+	"No error",
+	"Newline in constant"
+};
 // TOKEN
-const char* bod_text_parser::token::specialChars[]={ "{", "}", ";", ":", "/!", "!/" };
+const char* bod_text_parser::token::specialChars[]={ "{", "}", ";", ":", "=", "/!", "!/", "/#", "(", ")", "/", ".", "+" };
 char bod_text_parser::token::tabWidth;
 const char* bod_text_parser::token::getText() const
+{
 	if(type >= t_text)
 	else
 		return specialChars[(int)type];
+}
 //---------------------------------------------------------------------------------
 void bod_text_parser::preParseBuffer(char *pszBuffer, size_t size)
 {
-	//m_lineCount=parseLines(pszBuffer, size, &m_lines);
 	m_pszBuffer=pszBuffer;
 	m_buffLen=size;
+}
 //---------------------------------------------------------------------------------
 size_t bod_text_parser::parseBuffer(size_t limit)
+{
+	char *ln;
 	size_t old=tokens.size();
-	/*for(size_t i=m_newLineIdx; i < m_lineCount; i++){
+	while(ln=nextLine()){
-		parseLine(m_lines[i], (int)i + 1);
+		if(parseLine(ln, ++m_lineIdx)==false)
-		if(limit!=-1 && ((tokens.size() - old) >= limit)){
-			i++;
 			break;
-		}
-	}
-	m_newLineIdx=i;*/
-	char *ln;
-	while(ln=nextLine()){
-		parseLine(ln, ++m_lineIdx);
 		if(limit!=-1 && ((tokens.size() - old) >= limit)){
 			break;
+		}
+	}
 	return tokens.size() - old;
+}
 //---------------------------------------------------------------------------------
+#define PUSH_PREVIOUS_STRING() { t=new token(); \
+t->type=token::t_text; \
+t->line=idx; \
+t->text=old; \
+t->col=(int)(old - line + 1); \
+tokens.push_back(t); }
+#define PUSH_TOKEN(_type, _col, _text) { t=new token(); \
+t->type=_type; \
+t->line=idx; \
+t->col=(int)(_col); \
+t->text=_text; \
+tokens.push_back(t); }
-void bod_text_parser::parseLine(char *line, int idx)
+bool bod_text_parser::parseLine(char *line, int idx)
+{
 	char *old=line, *pos=line, ch;
 	token *t;
+	bool bInQuotedString=false;
 	while(*pos!=0){
 		ch=*pos;
+		if(bInQuotedString || (ch=='"' && testFlag(parseQuotedStrings))){
-		if(ch==';' || ch==':') {
+			if(ch=='"'){
+				bInQuotedString=!bInQuotedString;
+				*pos=0;
+				if(bInQuotedString){
+					if(*old!=0)
+						PUSH_PREVIOUS_STRING();
+				}
+				// got string
+				else
+					PUSH_TOKEN(token::t_quotedString, old - line, old);
+				old=pos + 1;
+			}
+			else{
+				++pos;
+				continue;
+			}
+		}
+		else if(ch==';' || ch==':' || (ch=='=' && testFlag(parseEqual)) ||
+		(testFlag(parseOperators) && (ch=='.' || ch=='+'))) {
 			*pos=0;
-			if(*old!=0){
+			if(*old!=0)
+				PUSH_PREVIOUS_STRING();
-				t=new token();
+			token::Type ty;
+			switch(ch){
+				case ';':
-				t->type=token::t_text;
+					ty=token::t_semicolon;
-				t->line=idx;
+					break;
-				t->text=old;
+				case ':':
-				t->col=(int)(old - line + 1);
+					ty=token::t_colon;
+					break;
+				case '=':
-				tokens.push_back(t);
+					ty=token::t_equal;
-			}
+					break;
-			t=new token();
+				case '.':
-			t->type=(ch==';' ? token::t_semicolon : token::t_colon);
+					ty=token::t_dot;
-			t->line=idx;
+					break;
-			t->col=(int)(pos - line + 1);
+				case '+':
-			tokens.push_back(t);
+					ty=token::t_plus;
+					break;
+			}
+			PUSH_TOKEN(ty, pos - line + 1, 0);
 			old=pos + 1;
+		}
 		// space or tabulator
 		else if(ch==' ' || ch==0x9){
 			*pos=0;
-			if(*old!=0){
+			if(*old!=0)
-				t=new token();
-				t->type=token::t_text;
-				t->line=idx;
-				t->text=old;
-				t->col=(int)(old - line + 1);
-				tokens.push_back(t);
+				PUSH_PREVIOUS_STRING();
-			}
 			old=pos + 1;
+		}
+		// brackets
-		else if(ch=='{' || ch=='}') {
+		else if(ch=='{' || ch=='}' || (testFlag(parseStdBrackets) && (ch=='(' || ch==')'))) {
 			*pos=0;
-			if(*old!=0){
+			if(*old!=0)
+				PUSH_PREVIOUS_STRING();
-				t=new token();
+			token::Type ty;
+			switch(ch){
+				case '{':
+					ty=token::t_openCrBracket;
-				t->text=old;
+					break;
-				t->line=idx;
+				case '}':
-				t->col=(int)(old - line) + 1;
+					ty=token::t_closeCrBracket;
+					break;
+				case '(':
-				t->type=token::t_text;
+					ty=token::t_openStdBracket;
+					break;
+				case ')':
-				tokens.push_back(t);
+					ty=token::t_closeStdBracket;
+					break;
+			}
-			t=new token();
+			PUSH_TOKEN(ty, pos - line + 1, 0);
-			t->type=(ch=='{' ? token::t_openBracket : token::t_closeBracket);
-			t->line=idx;
-			t->col=(int)(old - line + 1);
 			old=pos + 1;
-			tokens.push_back(t);
+		}
 		// either comment, header info or processing instruction
 		else if(ch=='/') {
 			if(pos[1]=='#'){
 				t=new token();
 					t->line=idx;
 					t->col=(int)(pos - line) + 1;
 					t->type=token::t_hdrinfo;
 					tokens.push_back(t);
+				}
 			}
 			// open proc instruction /!
 			if(pos[1]=='!') {
-				t=new token();
-				t->type=token::t_openInstrBlock;
+				PUSH_TOKEN(token::t_openInstrBlock, pos - line + 1, 0);
-				t->line=idx;
-				t->col=(int)(pos - line) + 1;
-				tokens.push_back(t);
 				old=pos + 2;
 				pos++;
 			}
-			// comment
+			// slash
+			else{
+				/* if ignore slash is on then do nothing
+				  else treat it as comment unless C comments are specified, in which case there must
+				  be // to make comment, otherwise / is treated as token
+				*/
-			else if(ignoreRemarks()==false){
+				if(testFlag(parseIgnoreSlash)==false){
+					if(testFlag(parseBODComments)) {
+						*pos=0;
+						pos--;
+					}
+					else if(testFlag(parseCComments) && pos[1]=='/') {
-				*pos=0;
+						*pos=0;
-				break;
+						pos--;
+					}
+					else {
+						*pos=0;
+						if(*old!=0)
+							PUSH_PREVIOUS_STRING();
+						PUSH_TOKEN(token::t_slash, pos - line + 1, 0);
+						old=pos + 1;
+					}
+				}
+			}
+		}
 		// close proc instruction !/
 		else if(ch=='!' && pos[1]=='/'){
 			*pos=0;
-			if(*old!=0){
+			if(*old!=0)
-				t=new token();
-				t->text=old;
-				t->line=idx;
-				t->col=(int)(old - line) + 1;
-				t->type=token::t_text;
-				tokens.push_back(t);
+				PUSH_PREVIOUS_STRING();
-			}
-			t=new token();
-			t->type=token::t_closeInstrBlock;
+			PUSH_TOKEN(token::t_closeInstrBlock, pos - line + 1, 0);
-			t->line=idx;
-			t->col=(int)(pos - line) + 1;
-			tokens.push_back(t);
 			old=pos + 2;
 			pos++;
+		}
 		pos++;
+	}
+	if(bInQuotedString){
+		error(idx, (int)strlen(line), Error::errNewLineInConstant);
+		return false;
+	}
 	// if there are some chars left after the last delimiter (usually ;) this will process them
 	if(old!=pos){
-		t=new token();
-		t->text=old;
-		t->line=idx;
-		t->col=(int)(old - line) + 1;
+		PUSH_TOKEN(token::t_text, old - line + 1, old);
-		t->type=token::t_text;
-		tokens.push_back(t);
 	}
+	return true;
+}
-//---------------------------------------------------------------------------------
-/*size_t bod_text_parser::parseLines(char *buffer, size_t size, char ***array_ptr)
-{
-	size_t lineCount=1;
-	size_t i;
-	for(i=0; i < size; i++){
-		if(buffer[i]==0xD){
-			buffer[i]=0;
-			lineCount++;
-			if(((i + 1) < size) && buffer[i+1]==0xA)
-				buffer[i+1]=1;
-		}
-		else if(buffer[i]==0xA){
-			buffer[i]=0;
-			lineCount++;
-		}
-	}
-	char **lines=new char*[lineCount];
-	char *ptr=buffer, *end=buffer + size;
-	i=0;
-	do{
-		if(ptr && *ptr==1)
-			ptr++;
-		lines[i]=ptr;
-		ptr=(char*)memchr(ptr, 0, end - ptr);
-		if(ptr) ptr++;
-		// this will protect us from binary files where are more zeroes than we expect
-		if(++i==lineCount)
-			break;
-	}
-	while(ptr);
-	*array_ptr=lines;
-	return lineCount;
-}*/
 //---------------------------------------------------------------------------------
 char * bod_text_parser::nextLine()
+{
-/*
-	size_t i, size=m_buffLen;
-	char *line=0, *buffer=(char*)m_pszBuffer;
-	for(i=m_lastCharPos; i < size; i++){
-		if(buffer[i]==0xD){
-			buffer[i]=0;
-			if(((i + 1) < size) && buffer[i+1]==0xA)
-				buffer[i+1]=1;
-			line=buffer + m_lastCharPos;
-			break;
-		}
-		else if(buffer[i]==0xA){
-			buffer[i]=0;
-			line=buffer + m_lastCharPos;
-			break;
-		}
-	}
-	if(line==0) line=buffer + m_lastCharPos;
-	if(*line==0) line++;
-	if(m_lastCharPos==size) return NULL;
-	m_lastCharPos=i;
-	if(line[0]==1)
-		line++;
-	return line;
-	*/
 	size_t i, size=m_buffLen;
 	char *line=0, *buffer=(char*)m_pszBuffer;
 	for(i=m_lastPos; i < size; i++){
 		if(buffer[i]==0xD){

Subversion Repositories spk

(root)/libspk/src/x2bc/x2bc_common/bod_text_parser.cpp – Rev 1 → 114