From ba22a750093f5b918aefd58ba698f38dff6a14e1 Mon Sep 17 00:00:00 2001
From: Jan Breuer <jan.breuer@jaybee.cz>
Date: Thu, 20 Jun 2013 22:03:49 +0800
Subject: [PATCH] Unexpected character handling

---
 libscpi/src/lexer.c |  337 ++++++++++++++++++++++++++++++-------------------------
 1 files changed, 184 insertions(+), 153 deletions(-)

diff --git a/libscpi/src/lexer.c b/libscpi/src/lexer.c
index 0b3bf09..65824df 100644
--- a/libscpi/src/lexer.c
+++ b/libscpi/src/lexer.c
@@ -40,23 +40,22 @@
 
 #include "scpi/lexer.h"
 
-
 /* identify character */
-static int isws ( int c ) {
+static int isws(int c) {
     if ((c == ' ') || (c == '\t')) {
         return 1;
     }
     return 0;
 }
 
-static int isbdigit ( int c ) {
+static int isbdigit(int c) {
     if ((c == '0') || (c == '1')) {
         return 1;
     }
     return 0;
 }
 
-static int isqdigit ( int c ) {
+static int isqdigit(int c) {
     if ((c == '0') || (c == '1') || (c == '2') || (c == '3') || (c == '4') || (c == '5') || (c == '6') || (c == '7')) {
         return 1;
     }
@@ -71,6 +70,10 @@
     }
 }
 
+int SCPI_LexIsEos(lex_state_t * state) {
+    return iseos(state);
+}
+
 static int ischr(lex_state_t * state, char chr) {
     return (state->pos[0] == chr);
 }
@@ -80,31 +83,36 @@
 }
 
 static int isH(int c) {
-    return c == 'h' || c == 'H';  
+    return c == 'h' || c == 'H';
 }
 
 static int isB(int c) {
-    return c == 'b' || c == 'B';  
+    return c == 'b' || c == 'B';
 }
 
 static int isQ(int c) {
-    return c == 'q' || c == 'Q';  
+    return c == 'q' || c == 'Q';
 }
 
 static int isE(int c) {
-    return c == 'e' || c == 'E';  
+    return c == 'e' || c == 'E';
 }
+
+#define SKIP_NONE       0
+#define SKIP_OK         1
+#define SKIP_INCOMPLETE -1
 
 /* skip characters */
 /* 7.4.1 <PROGRAM MESSAGE UNIT SEPARATOR>*/
 // TODO: static int skipProgramMessageUnitSeparator(lex_state_t * state)
+
 static int skipWs(lex_state_t * state) {
     int someSpace = 0;
-    while(!iseos(state) && isws(state->pos[0])) {
+    while (!iseos(state) && isws(state->pos[0])) {
         state->pos++;
         someSpace++;
     }
-    
+
     return someSpace;
 }
 
@@ -115,17 +123,17 @@
 // static int skipProgramMessageTerminator(lex_state_t * state)
 
 static int skipDigit(lex_state_t * state) {
-    if(!iseos(state) && isdigit(state->pos[0])) {
+    if (!iseos(state) && isdigit(state->pos[0])) {
         state->pos++;
-        return 1;
+        return SKIP_OK;
     } else {
-        return 0;
+        return SKIP_NONE;
     }
 }
 
 static int skipNumbers(lex_state_t * state) {
     int someNumbers = 0;
-    while(!iseos(state) && isdigit(state->pos[0])) {
+    while (!iseos(state) && isdigit(state->pos[0])) {
         state->pos++;
         someNumbers++;
     }
@@ -133,258 +141,283 @@
 }
 
 static int skipPlusmn(lex_state_t * state) {
-    if(!iseos(state) && isplusmn(state->pos[0])) {
+    if (!iseos(state) && isplusmn(state->pos[0])) {
         state->pos++;
-        return 1;
+        return SKIP_OK;
     } else {
-        return 0;
+        return SKIP_NONE;
     }
 }
 
 static int skipAlpha(lex_state_t * state) {
     int someLetters = 0;
-    while(!iseos(state) && isalpha(state->pos[0])) {
+    while (!iseos(state) && isalpha(state->pos[0])) {
         state->pos++;
         someLetters++;
     }
-    return someLetters;    
+    return someLetters;
 }
 
 static int skipChr(lex_state_t * state, int chr) {
-    if(!iseos(state) && ischr(state, chr)) {
+    if (!iseos(state) && ischr(state, chr)) {
         state->pos++;
-        return 1;
+        return SKIP_OK;
     } else {
-        return 0;
+        return SKIP_NONE;
     }
 }
 
 static int skipSlashDot(lex_state_t * state) {
-    if(!iseos(state) && (ischr(state, '/') | ischr(state, '.'))) {
+    if (!iseos(state) && (ischr(state, '/') | ischr(state, '.'))) {
         state->pos++;
-        return 1;
+        return SKIP_OK;
     } else {
-        return 0;
-    }    
+        return SKIP_NONE;
+    }
 }
 
 static int skipStar(lex_state_t * state) {
-    if(!iseos(state) && ischr(state, '*')) {
+    if (!iseos(state) && ischr(state, '*')) {
         state->pos++;
-        return 1;
+        return SKIP_OK;
     } else {
-        return 0;
-    }    
+        return SKIP_NONE;
+    }
 }
 
 static int skipColon(lex_state_t * state) {
-    if(!iseos(state) && ischr(state, ':')) {
+    if (!iseos(state) && ischr(state, ':')) {
         state->pos++;
-        return 1;
+        return SKIP_OK;
     } else {
-        return 0;
-    }    
+        return SKIP_NONE;
+    }
 }
 
 /* 7.6.1.2 <COMMAND PROGRAM HEADER> */
 static int skipProgramMnemonic(lex_state_t * state) {
     const char * startPos = state->pos;
-    if(!iseos(state) && isalpha(state->pos[0])) {
+    if (!iseos(state) && isalpha(state->pos[0])) {
         state->pos++;
-        while(!iseos(state) && (isalnum(state->pos[0]) || ischr(state, '_'))) {
+        while (!iseos(state) && (isalnum(state->pos[0]) || ischr(state, '_'))) {
             state->pos++;
         }
     }
-    
-    return state->pos - startPos;
+
+    if (iseos(state)) {
+        return (state->pos - startPos) * SKIP_INCOMPLETE;
+    } else {
+        return (state->pos - startPos) * SKIP_OK;
+    }
 }
 
 /* tokens */
 int SCPI_LexWhiteSpace(lex_state_t * state, token_t * token) {
     token->ptr = state->pos;
-    
+
     skipWs(state);
-    
-    token->len = state->pos - token->ptr;  
-    
+
+    token->len = state->pos - token->ptr;
+
     if (token->len > 0) {
         token->type = TokWhiteSpace;
     } else {
         token->type = TokUnknown;
-    }        
-    
+    }
+
     return token->len;
 }
 
 /* 7.6.1 <COMMAND PROGRAM HEADER> */
 static int skipCommonProgramHeader(lex_state_t * state) {
+    int res;
     if (skipStar(state)) {
-        if(!skipProgramMnemonic(state)) {
-            state->pos--;
+        res = skipProgramMnemonic(state);
+        if (res == SKIP_NONE && iseos(state)) {
+            return SKIP_INCOMPLETE;
+        } else if (res <= SKIP_INCOMPLETE) {
+            return SKIP_OK;
+        } else if (res >= SKIP_OK) {
+            return SKIP_OK;
         } else {
-            return 1;
+            return SKIP_INCOMPLETE;
         }
     }
-    return 0;
+    return SKIP_NONE;
 }
 
 static int skipCompoundProgramHeader(lex_state_t * state) {
-    const char * rollback = state->pos;
-    
-    skipColon(state);
-    
-    if(skipProgramMnemonic(state)) {
-        while(skipColon(state)) {
-            if(!skipProgramMnemonic(state)) {
-                state->pos = rollback;
-                return 0;
+    int res;
+    int firstColon = skipColon(state);
+
+    res = skipProgramMnemonic(state);
+    if (res >= SKIP_OK) {
+        while (skipColon(state)) {
+            res = skipProgramMnemonic(state);
+            if (res <= SKIP_INCOMPLETE) {
+                return SKIP_OK;
+            } else if (res == SKIP_NONE) {
+                return SKIP_INCOMPLETE;
             }
         }
-        return 1;
+        return SKIP_OK;
+    } else if (res <= SKIP_INCOMPLETE) {
+        return SKIP_OK;
+    } else if (firstColon) {
+        return SKIP_INCOMPLETE;
     } else {
-        state->pos = rollback;        
-        return 0;
+        return SKIP_NONE;
     }
 }
 
-int SCPI_LexProgramHeader(lex_state_t * state,  token_t * token) {
+int SCPI_LexProgramHeader(lex_state_t * state, token_t * token) {
+    int res;
     token->ptr = state->pos;
     token->type = TokUnknown;
-    
-    if(skipCommonProgramHeader(state)) {
-        if (skipChr(state, '?')) {
+
+    res = skipCommonProgramHeader(state);
+    if (res >= SKIP_OK) {
+        if (skipChr(state, '?') >= SKIP_OK) {
             token->type = TokCommonQueryProgramHeader;
         } else {
             token->type = TokCommonProgramHeader;
         }
-    } else if(skipCompoundProgramHeader(state)) {
-        if (skipChr(state, '?')) {
-            token->type = TokCompoundQueryProgramHeader;
-        } else {
-            token->type = TokCompoundProgramHeader;
-        }
+    } else if (res <= SKIP_INCOMPLETE) {
+        token->type = TokIncompleteCommonProgramHeader;
+    } else if (res == SKIP_NONE) {
+        res = skipCompoundProgramHeader(state);
+
+        if (res >= SKIP_OK) {
+            if (skipChr(state, '?') >= SKIP_OK) {
+                token->type = TokCompoundQueryProgramHeader;
+            } else {
+                token->type = TokCompoundProgramHeader;
+            }
+        } else if (res <= SKIP_INCOMPLETE) {
+            token->type = TokIncompleteCompoundProgramHeader;
+        } 
     }
-    
+
     if (token->type != TokUnknown) {
         token->len = state->pos - token->ptr;
     } else {
         token->len = 0;
         state->pos = token->ptr;
     }
-    
-    return token->len;    
+
+    return token->len;
 }
 
 /* 7.7.1 <CHARACTER PROGRAM DATA> */
 int SCPI_LexCharacterProgramData(lex_state_t * state, token_t * token) {
     token->ptr = state->pos;
-    
-    if(!iseos(state) && isalpha(state->pos[0])) {
+
+    if (!iseos(state) && isalpha(state->pos[0])) {
         state->pos++;
-        while(!iseos(state) && (isalnum(state->pos[0]) || ischr(state, '_'))) {
+        while (!iseos(state) && (isalnum(state->pos[0]) || ischr(state, '_'))) {
             state->pos++;
         }
     }
-    
+
     token->len = state->pos - token->ptr;
-    if(token->len > 0) {
+    if (token->len > 0) {
         token->type = TokProgramMnemonic;
     } else {
         token->type = TokUnknown;
     }
-    
+
     return token->len;
 }
 
 /* 7.7.2 <DECIMAL NUMERIC PROGRAM DATA> */
 static int skipMantisa(lex_state_t * state) {
     int someNumbers = 0;
-    
+
     skipPlusmn(state);
-    
+
     someNumbers += skipNumbers(state);
-    
-    if(skipChr(state, '.')) {
+
+    if (skipChr(state, '.')) {
         someNumbers += skipNumbers(state);
     }
-    
+
     return someNumbers;
 }
 
 static int skipExponent(lex_state_t * state) {
     int someNumbers = 0;
-    
-    if(!iseos(state) && isE(state->pos[0])) {
+
+    if (!iseos(state) && isE(state->pos[0])) {
         state->pos++;
-        
+
         skipWs(state);
-        
+
         skipPlusmn(state);
-        
+
         someNumbers = skipNumbers(state);
     }
-    
+
     return someNumbers;
 }
 
 int SCPI_LexDecimalNumericProgramData(lex_state_t * state, token_t * token) {
     const char * rollback;
     token->ptr = state->pos;
-    
+
     if (skipMantisa(state)) {
         rollback = state->pos;
         skipWs(state);
-        if(!skipExponent(state)) {
+        if (!skipExponent(state)) {
             state->pos = rollback;
         }
     } else {
         state->pos = token->ptr;
     }
-    
+
     token->len = state->pos - token->ptr;
-    if(token->len > 0) {
+    if (token->len > 0) {
         token->type = TokDecimalNumericProgramData;
     } else {
         token->type = TokUnknown;
     }
-    
+
     return token->len;
 }
 
 /* 7.7.3 <SUFFIX PROGRAM DATA> */
 int SCPI_LexSuffixProgramData(lex_state_t * state, token_t * token) {
     token->ptr = state->pos;
-    
+
     skipChr(state, '/');
-    
+
     // TODO: strict parsing  : SLASH? (ALPHA+ (MINUS? DIGIT)?) ((SLASH | DOT) (ALPHA+ (MINUS? DIGIT)?))*
     if (skipAlpha(state)) {
         skipChr(state, '-');
         skipDigit(state);
-        
+
         while (skipSlashDot(state)) {
             skipAlpha(state);
             skipChr(state, '-');
-            skipDigit(state);            
+            skipDigit(state);
         }
     }
-    
+
     token->len = state->pos - token->ptr;
-    if((token->len > 0)) {
+    if ((token->len > 0)) {
         token->type = TokSuffixProgramData;
     } else {
         token->type = TokUnknown;
         state->pos = token->ptr;
         token->len = 0;
     }
-    
+
     return token->len;
 }
 
 /* 7.7.4 <NONDECIMAL NUMERIC PROGRAM DATA> */
 static int skipHexNum(lex_state_t * state) {
     int someNumbers = 0;
-    while(!iseos(state) && isxdigit(state->pos[0])) {
+    while (!iseos(state) && isxdigit(state->pos[0])) {
         state->pos++;
         someNumbers++;
     }
@@ -393,7 +426,7 @@
 
 static int skipOctNum(lex_state_t * state) {
     int someNumbers = 0;
-    while(!iseos(state) && isqdigit(state->pos[0])) {
+    while (!iseos(state) && isqdigit(state->pos[0])) {
         state->pos++;
         someNumbers++;
     }
@@ -402,35 +435,34 @@
 
 static int skipBinNum(lex_state_t * state) {
     int someNumbers = 0;
-    while(!iseos(state) && isbdigit(state->pos[0])) {
+    while (!iseos(state) && isbdigit(state->pos[0])) {
         state->pos++;
         someNumbers++;
     }
     return someNumbers;
 }
 
-
 int SCPI_LexNondecimalNumericData(lex_state_t * state, token_t * token) {
     token->ptr = state->pos;
     int someNumbers = 0;
-    if(skipChr(state, '#')) {
-        if(!iseos(state)) {
-            if(isH(state->pos[0])) {
+    if (skipChr(state, '#')) {
+        if (!iseos(state)) {
+            if (isH(state->pos[0])) {
                 state->pos++;
                 someNumbers = skipHexNum(state);
                 token->type = TokHexnum;
-            } else if(isQ(state->pos[0])) {
+            } else if (isQ(state->pos[0])) {
                 state->pos++;
                 someNumbers = skipOctNum(state);
                 token->type = TokOctnum;
-            } else if(isB(state->pos[0])) {
+            } else if (isB(state->pos[0])) {
                 state->pos++;
                 someNumbers = skipBinNum(state);
                 token->type = TokBinnum;
             }
         }
     }
-    
+
     if (someNumbers) {
         token->ptr += 2; // ignore number prefix
         token->len = state->pos - token->ptr;
@@ -442,15 +474,13 @@
     return token->len > 0 ? token->len + 2 : 0;
 }
 
-
 /* 7.7.5 <STRING PROGRAM DATA> */
 static int isascii7bit(int c) {
     return (c >= 0) && (c <= 0x7f);
 }
 
-
 static int skipQuoteProgramData(lex_state_t * state, int quote) {
-    while(!iseos(state)) {
+    while (!iseos(state)) {
         if (isascii7bit(state->pos[0]) && !ischr(state, quote)) {
             state->pos++;
         } else if (ischr(state, quote)) {
@@ -464,7 +494,7 @@
         }
     }
 }
-    
+
 static int skipDoubleQuoteProgramData(lex_state_t * state) {
     skipQuoteProgramData(state, '"');
 }
@@ -473,9 +503,9 @@
     skipQuoteProgramData(state, '\'');
 }
 
-int SCPI_LexStringProgramData(lex_state_t * state,  token_t * token) {
+int SCPI_LexStringProgramData(lex_state_t * state, token_t * token) {
     token->ptr = state->pos;
-    
+
     if (!iseos(state)) {
         if (ischr(state, '"')) {
             state->pos++;
@@ -499,10 +529,10 @@
             }
         }
     }
-    
+
     token->len = state->pos - token->ptr;
-    
-    if((token->len > 0)) {
+
+    if ((token->len > 0)) {
         token->ptr++;
         token->len -= 2;
     } else {
@@ -510,7 +540,7 @@
         state->pos = token->ptr;
         token->len = 0;
     }
-    
+
     return token->len > 0 ? token->len + 2 : 0;
 }
 
@@ -530,8 +560,8 @@
             /* Get number of digits */
             i = state->pos[0] - '0';
             state->pos++;
-            
-            for(; i > 0; i--) {
+
+            for (; i > 0; i--) {
                 if (!iseos(state) && isdigit(state->pos[0])) {
                     j *= 10;
                     j += (state->pos[0] - '0');
@@ -540,8 +570,8 @@
                     break;
                 }
             }
-            
-            if(i == 0) {
+
+            if (i == 0) {
                 state->pos += j;
                 if ((state->buffer + state->len) < (state->pos)) {
                     token->len = 0;
@@ -557,47 +587,48 @@
         }
     }
 
-    if((token->len > 0)) {
+    if ((token->len > 0)) {
         token->type = TokArbitraryBlockProgramData;
     } else {
         token->type = TokUnknown;
         state->pos = token->ptr;
         token->len = 0;
     }
-    
+
     return token->len + (token->ptr - ptr);
 }
 
 /* 7.7.7 <EXPRESSION PROGRAM DATA> */
 static int isProgramExpression(int c) {
-    if ((c >= 0x20) && (c<=0x7e)) {
-        if ((c!= 0x22)
-            && (c!= 0x23) 
-            && (c!= 0x27) 
-            && (c!= 0x28) 
-            && (c!= 0x29) 
-            && (c!= 0x3B)) {
+    if ((c >= 0x20) && (c <= 0x7e)) {
+        if ((c != 0x22)
+                && (c != 0x23)
+                && (c != 0x27)
+                && (c != 0x28)
+                && (c != 0x29)
+                && (c != 0x3B)) {
             return 1;
         }
     }
-    
+
     return 0;
 }
 
 static void skipProgramExpression(lex_state_t * state) {
-    while(!iseos(state) && isProgramExpression(state->pos[0])) {
+    while (!iseos(state) && isProgramExpression(state->pos[0])) {
         state->pos++;
     }
 }
 
 // TODO: 7.7.7.2-2 recursive - any program data
-int SCPI_LexProgramExpression(lex_state_t * state,  token_t * token) {
+
+int SCPI_LexProgramExpression(lex_state_t * state, token_t * token) {
     token->ptr = state->pos;
-    
+
     if (!iseos(state) && ischr(state, '(')) {
         state->pos++;
         skipProgramExpression(state);
-        
+
         if (!iseos(state) && ischr(state, ')')) {
             state->pos++;
             token->len = state->pos - token->ptr;
@@ -605,21 +636,21 @@
             token->len = 0;
         }
     }
-    
-    if((token->len > 0)) {
+
+    if ((token->len > 0)) {
         token->type = TokProgramExpression;
     } else {
         token->type = TokUnknown;
         state->pos = token->ptr;
         token->len = 0;
     }
-    
+
     return token->len;
 }
 
 int SCPI_LexComma(lex_state_t * state, token_t * token) {
     token->ptr = state->pos;
-    
+
     if (skipChr(state, ',')) {
         token->len = 1;
         token->type = TokComma;
@@ -627,13 +658,13 @@
         token->len = 0;
         token->type = TokUnknown;
     }
-    
+
     return token->len;
 }
 
 int SCPI_LexSemicolon(lex_state_t * state, token_t * token) {
     token->ptr = state->pos;
-    
+
     if (skipChr(state, ';')) {
         token->len = 1;
         token->type = TokSemicolon;
@@ -641,26 +672,26 @@
         token->len = 0;
         token->type = TokUnknown;
     }
-    
+
     return token->len;
 }
 
-int SCPI_LexNewLine(lex_state_t * state,  token_t * token) {
+int SCPI_LexNewLine(lex_state_t * state, token_t * token) {
     token->ptr = state->pos;
-    
+
     skipChr(state, '\r');
     skipChr(state, '\n');
-    
+
     token->len = state->pos - token->ptr;
-    
-    if((token->len > 0)) {
+
+    if ((token->len > 0)) {
         token->type = TokNewLine;
     } else {
         token->type = TokUnknown;
         state->pos = token->ptr;
         token->len = 0;
     }
-    
+
     return token->len;
 }
 

--
Gitblit v1.9.1