scanner.c

// TEAM

// First team member name  : Robert Valladares

// Second team member name : Danish Waheed

/**
 *  scanner.c
 *  Lexical Analizer
 *
 *  Created by Robert Valladares and Danish Waheed on 06/01/15.
 *  Copyright (c) 2015 ROBERT VALLADARES and DANISH WAHEED. All rights reserved.
 *  UPDATED CharType functions 6/19/2015 to binary search --DEPRECATED
 *  UPDATED CharType functions 6/29/2015 to O(1) search with int arrays of 1's, 0's
 */

// Library declarations
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include "globals.h"

int OTC = 0;
int LineNumber = 0;
int TokenCount = 1;
int lexemeLine[1000] = {0};
char *FILECLEANUP[] = {"lexemelist.txt", "lexemeline.txt", "lexemetable.txt"};


//------------------ global constants and given constants by assigment -------

//------------------- Read ahead function prototypes--------------
void    createFilePointers();
int     charCount(FILE *fp);
void    readInput(FILE *fp, char foo[]);
void    fileReadError(char fileName[], int reading);
void    cleanInput(FILE *fp, char src[], int count, char cleanSrc[]);
int     charType(char c);
void    splitInputTokens(char cleanSrc[], char *caCleanInputTokens[]);
int     isSpecialChar(char c);
char    *cleanInputTokenCalloc(int tknSize);
void    freeInputTokenCalloc(char *caCleanInputTokens[]);
int     isReserverdWord(char *str);
void    IdentifyInputToken(char *caCleanInputTokens[], namerecord_t *record_table);
int     stringIsNumber(char *str);
int     isValidVariableAndNotReserved(char *str);
int     validSymbolPair(char c1, char c2);
void    initializeNamerecord_table(namerecord_t *record_table);
void    insertNamerecord_table(int RecordIndex, namerecord_t *record_table, int tknKind, int ComboChars, char c1, char c2, char *lexeme, int tknType);
void    printNamerecord_table(namerecord_t *record_table);

//--- Replacement functions for <ctype.h> Name changed slightly to avoid conflicting names -----// Added 6/12/2015
int isNewLine(char c); // added 7/29/15
int isAlpha(char c);
int isDigit(char c);
int isPunct(char c);
int binarySearch (int *Array, int top, int target);
int strsAreEqual(char * stt1, char *str2);


// -----------------Initial call to program  -----------------
int main(int argc, char *argv[]) {
    // ---------deprecated for #3 ----------
    // if a file name for input is passed
    // use that name instead of the default in
    // FNS[0] = input.txt
    // ---------deprecated for #3 ----------
    
    int i = 0;
    
    // -------must redo this section to take -l -a -v user input from console
    // ---------deprecated for #3 ----------
    if(argc > 1) {
        OTC = strsAreEqual(argv[1], "-l");
        
    }
    
    // initialize global ctype int arrays
    gInitGlobalintIsCharArrays();
    // create file pointers for input output
    // createFilePointers handles null pointer exception
    createFilePointers();
    // copy input file pointer
    FILE *ifp = m_FPS[input_txt];
    // copy clean input file pointer
    FILE *cifp = m_FPS[cleaninput_txt];
    
    
    // how many characters in file
    int count = charCount(ifp);
    if (count < 0) {
        printError(err27, FNS[input_txt]);
        //fileReadError(FNS[input_txt], input_txt);
        // this is fatal error
        exit(EXIT_FAILURE);
    }
    
    char code[count];
    // cleanCode will have input without comments
    char cleanCode[count];
    // initialize code arrays
    for (i = 0; i < count; i++) {
        code[i] = ' ';
        cleanCode[i] = ' ';
    }
    
    // read input file into array code[]
    readInput(ifp, code);
    // close the input file
    fclose(ifp);
    
    // remove comments from input
    //cleanCode[] will contain -comments free- input
    cleanInput(cifp, code, count, cleanCode);
    // close the -clean input- file
    fclose(cifp);
    
    // there will be at most m_nCleanCount separate string tokens
    char *caCleanInputTokens[m_nCleanCount];
    // separate cleanCode into tokens, allocate space as needed with calloc
    // need to free each caCleanInputTokens[] array index that calloc was done to
    // if caCleanInputTokens[] is not null, free it before exiting program
    // or after printing it to file
    splitInputTokens(cleanCode, caCleanInputTokens);
    
    // there will be at most m_nCleanCount separate namerecord_t tokens
    namerecord_t namerecord_table[m_nCleanCount];
    initializeNamerecord_table(namerecord_table);
    
    // identify what kind of lexeme each token is
    IdentifyInputToken(caCleanInputTokens, namerecord_table);
    
    // print each record to both lexemelist.txt and lexemetable.txt
    printNamerecord_table(namerecord_table);
    
    // call freeInputTokenCalloc after finishing the use of the array
    freeInputTokenCalloc(caCleanInputTokens);
    // print how many tokens are per line
    FILE *lexLine = NULL;
    lexLine = fopen("lexemeline.txt", "w");
    for (i = 0; i < 1000; i++) {
        
        if(lexemeLine[i]) {
            fprintf( lexLine, "%d ", lexemeLine[i] );
        }
        else {
            continue;
        }
    }
    fclose(lexLine);
    
    // program finished, if no error were found, it will reach this point
    
    
    return 0;
}

/*
 * "createFilePointers()"
 * create all the file pointers and initialize them
 * file pointers are stored in an array for global use
 * handle null pointer exeptions immediatly
 */
void createFilePointers(){
    
    char *mode = "r";
    int i = 0;
    for (i = 0; i < MAX_FILES; i++) {
        // initialize the file pointer array index
        m_FPS[i] = NULL;
        
        if (i) {
            mode = "w";
        }
        // if file pointer fails to open filename
        // then a null is stored into array
        FILE *fp = NULL;
        fp = fopen(FNS[i], mode);
        if (fp == NULL) {
            fileReadError(FNS[i], i);
        }
        m_FPS[i] = fp;
    }
}

/**
 * "int charCount(FILE *fp)"
 * count the amount of characters in input file
 * without reading the file
 * return an integer , count of characters
 *
 */
int charCount(FILE *fp){
    
    long off_end;
    int rc;
    size_t fSize;
    int c;
    char lett;
    int i = 0;
    
    // if the file pointer is null return error
    if (fp != NULL) {
        
        // go to end of file
        rc = fseek(fp, 0L, SEEK_END);
        if (rc != 0) {
            // error ocurred
            return -1;
        }
        // Byte offset to the end of the file (size)
        if (0 > ( off_end = ftell(fp) ) ){
            return -1;
        }
        
        fSize = (size_t)off_end;
        // reset the file reader pointer to the begining of the file
        rc = 0;
        rc = fseek(fp, 0L, SEEK_SET);
        if (rc != 0) {
            // error ocurred
            return -1;
        }
        // return the count of characters in the input file
        return (int)fSize;
    }
    
    return -1;
    
}

/**
 * "readInput(FILE *fp, char src[])"
 * read each individual character into array passed from main
 * input file will be then store for use by other functions
 *
 */
void readInput(FILE *fp, char src[]){
    
    int i = 0;
    int c;
    int rc = 0;
    
    if (fp == NULL || src == NULL) {
        //if the file pointer or the char array is null, return error
        return;
    }
    
    // declare char array to store file input
    
    // return to the begining of file reader pointer
    rc = fseek(fp, 0L, SEEK_SET);
    if (rc != 0) {
        // error ocurred
        fileReadError(FNS[input_txt], input_txt);
        // this is a fatal error
        printError(err27, FNS[input_txt]);
        exit(EXIT_FAILURE);
    }
    // store each character into -array passed- from main
    while ( (c = fgetc(fp)) != EOF ){
        src[i++] = c;
    }
    
    return;
}

/**
 * "cleanInput(FILE *fp, char src[], int count, char cleanSrc[])"
 * remove the comments from the input code
 * print valid
 *
 */
void cleanInput(FILE *fp, char src[], int count, char cleanSrc[]){
    
    int p = 1;
    int i = 0;
    
    while (i < count) {
        // check if this is the begining of a comment block
        if (src[i] == '/' && p == 1) {
            if (src[i + 1] == '*') {
                // set print to false and skip the initial comment "/*" signal
                p = 0;
                i += 2;
            }
        }
        // check if this is the end of a comment block
        if (src[i] == '*' && p == 0) {
            if (src[i + 1] == '/') {
                // set print to true and skip the ending comment "*/" signal
                p = 1;
                i += 2;
                // continue, dont print immediatly, check if there are
                // adjacent comment blocks
                continue;
            }
        }
        
        if (p) {
            // print character to file
            fprintf( fp, "%c", src[i] );
            // copy input code without comments into new array
            cleanSrc[ m_nCleanCount++] = src[i];
            
        }
        
        i++;
        
    }
    // check if file only contains a comment opening statement
    if (p == 0){
        printError(err29, "/*");
        //printf("ERROR, input file contains a open ended comment line\n");
        exit(EXIT_FAILURE);
    }
    // reset the end of file for clean code array
    cleanSrc[m_nCleanCount] = EOF;
    
}

/**
 * "fileReadError(char fileName[], int reading)"
 * prints a standard file read-open-write error message
 * if int reading = 1, then print reading, else reading = 0 = writing
 *  -----------DEPRECATED, NO LONGER NEEDED, WILL DELETE AT A LATER TIME -------------
 *
 */
void fileReadError(char fileName[], int writing ){
    
    int i = 1;
    if (writing) {
        i = 0;
    }
    char *str[] = {"writing", "reading"};
    printf("Warning!, Could not open the file %s for %s\n", fileName, str[i]);
    return;
    
}

/*
 *  "int charType(char c)"
 *  return 0, 1, 2, 3 for the character type
 *  0 for neither, 1 for numerical, 2 for letter, 3 for punctuation
 */
int charType(char c){
    
    int result =0;
    int target = (int)c;
    
    if (target > 9) {
        if ( (result = isDigit( c )) || (result = isPunct( c ) ) || ( result = isAlpha( c ) ) ){
            // if any is true, then result will have the corresponding value already
            // result = 1 for numerical, result = 2 for letter, result = 3 for punctuation
            return (result);
        }
    }
    
    // else default, return 0, is neither of the three types
    return 0;
}

/*
 *   "void splitInputTokens(char cleanSrc[])"
 *   split clean source code into tokens
 */
void splitInputTokens(char cleanSrc[], char *caCleanInputTokens[]){
    
    int curCharIsSpecial = 0;
    int i = 0;
    int j = 0;
    char tkn[MAX_STR] = " ";
    
    while (i <= m_nCleanCount ) {
        
        // if this is a non empty character, store it into local token array
        if (charType(cleanSrc[i])) {
            // increase both token index and cleanSrc index
            
            // check if this character is a special character, if it is
            //mark a flag and print it, reset token in next code block
            curCharIsSpecial = isSpecialChar(cleanSrc[i]);
            
            tkn[j++] = cleanSrc[i++];
            
        }
        
        // check if this is a new line or space (empty character)
        if ( isSpecialChar(cleanSrc[i]) ||(charType(cleanSrc[i]) == 0 ) || curCharIsSpecial ) {
            // if at least one chacter is in local token array, print it and reset token
            //printf("clean source %c\n", cleanSrc[i] );
            if(j) {
                // allocate space for token, store token, increase token count
                //printf("tkn %s\n",tkn);
                caCleanInputTokens[m_nCleanInputTokens] = cleanInputTokenCalloc(j);
                strcpy(caCleanInputTokens[m_nCleanInputTokens], tkn);
                m_nCleanInputTokens++;
                lexemeLine[LineNumber] = TokenCount++; // store the number of tokens in this line
                
            }
            
            // reset local token array
            memset(tkn, 0, sizeof(tkn));
            j = 0;
            
            // count how many new line char are in code
            if ( isNewLine(cleanSrc[i]) ){
                LineNumber++;
                TokenCount = 1;
            }
            
            // check if this is a new line or space (empty character)
            if  (charType(cleanSrc[i]) == 0 ){
                // increase cleanSrc index
                i++;
                // skip code beyond here and continue to next character
                continue;
            }
        }
        // check next character in the loop after all 3 if cases
        
    }
    
}

/*
 *   "isSpecialChar(char c)"
 *   check if character passed is a special Symbol punctuation
 */
int isSpecialChar(char c){
    // if char c is a special char it will have a non 0 return with offset of 1
    // that will be handled by caller
    return g_naIsSpecialChar[ (int)c ];
    
}

/*
 *   "char *cleanInputTokenCalloc(int tknSize)"
 *   allocate memory for caCleanInputTokens[index] strings
 */
char *cleanInputTokenCalloc(int tknSize){
    char *temp = calloc(tknSize + 1, sizeof(char));
    if (temp == NULL) {
        printError(err30, "scanner calloc");
        //printf("Error using calloc to create space for token string\n");
        exit(EXIT_FAILURE);
    }
    return temp;
}

/*
 *   "void freeInputTokenCalloc(char *caCleanInputTokens[])"
 *   free memory allocated for clean tokens
 */
void freeInputTokenCalloc(char *caCleanInputTokens[]){
    
    int i = 0;
    // check each array index for non null strings
    for (i = 0; i < m_nCleanInputTokens ; i++) {
        if (caCleanInputTokens[i] != NULL) {
            // free the memory allocated to avoid seg fault
            free(caCleanInputTokens[i] );
        }
        
    }
    
}

/*
 * "int isReserverdWord(char *str)"
 * check is a string passed is a reserved word from the *word[] array
 * if its reserved, it will return the index i + 1, else it will return 0
 */
int isReserverdWord(char *str){
    
    int i = 0;
    for (i = 0; i < MAX_WORDS; i++) {
        if(strcmp(str, word[i]) == 0){
            // i+1 will be used to identify enum value later
            return (i + 1);
        }
    }
    return 0;
    
}

/*
 *   "long stringIsNumber(char *str);"
 *   check if string is numerical, it will not check if its of 5 digits
 *   we need to know if it is a number regardless of legth
 *   a false (false return) would interfere with other checks, i.e. variable check
 */
int stringIsNumber(char *str){
    
    int i = 0;
    // base case check for null
    if (str == NULL) {
        return 0;
    }
    // get the string length
    int len = strlen(str);
    // if any of the string characters is not a numerical, then string is not numerical
    // return a defined invalid int value
    for (i = 0; i < len; i++) {
        if (charType(str[i]) != 1) {
            return 0;
        }
    }
    
    // if string is numerical, but has more than 5 digits, exit error
    if (len > 5) {
        printError(err25, str);
        //printf("Error, string: %s is numerical, but it has more than 5 digits\n", str);
        exit(EXIT_FAILURE);
    }
    
    // if the string is numerical, then return 1
    //strtol(str, (char **)NULL, 10)
    return 1;
    
}

/*
 *   "int isValidVariable(char *str)"
 *   check if string of valid length, does not start with number or symbol
 *   does not contain symbols in the middle, special symbols have been check by now
 */
int isValidVariableAndNotReserved(char *str){
    
    // base case check for null or is a reserved word or is numerical
    if (str == NULL || isReserverdWord(str) || stringIsNumber(str)) {
        return 0;
    }
    
    // get the string length
    int len = strlen(str);
    
    // is token a punctuation or symbol
    if (len == 1) {
        if (charType(str[0]) == 3){
            return 0;
        }
    }
    
    // does variable start with a letter, or is of legal size
    if ((charType(str[0]) != 2) || len > MAX_VAR_LEN ) {
        printError(err31, str);
        //printf("Error, variable %s is invalid\n", str);
        exit(EXIT_FAILURE);
    }
    
    // at this point, isnumber, is symbol, is reserved word, is special char have all been checked
    
    return 1;
}

/*
 *  IdentifyInputToken(char *caCleanInputTokens[])
 *  take each token and check if its a reserved word, numerical or symbol pail, or variable
 *  if token is an illegal lexeme, print out error and exit program
 *
 */
void IdentifyInputToken(char *caCleanInputTokens[], namerecord_t *record_table){
    
    int ssNext = 0;
    int ss = 0;
    int rw = 0;
    int tknlen = 0;
    int tknLenNext = 0;
    int i = 0;
    int vs = 0;
    int LexRecordIndex = 0; // keep track of the lexeme table records
    
    for (i = 0; i < m_nCleanInputTokens ; i++) {
        
        char *str = caCleanInputTokens[i];
        tknlen = strlen(str);
        // typedef enum {lexConstant = 1, lexVar, lexProc} eLexemeKind;
        // [integer = constant = 1], [variable = var = 2], [reserved word = proc = 3]
        
        // check if it is a reserved word
        if ( ( rw = isReserverdWord(str) ) && tknlen > 1 ){
            // insert token record in record_table
            insertNamerecord_table(LexRecordIndex++, record_table, lexProc, 0, ' ', ' ', str, m_naWsym[(rw - 1)] );
            
            continue;
        }
        
        // check if token is number
        if  (stringIsNumber(str)){
            // if is invalid length or illegal number, it will fail at check
            
            // insert token record in record_table
            insertNamerecord_table(LexRecordIndex++, record_table, lexConstant, 0, ' ', ' ', str, 3 );
            
            continue;
        }
        
        // check if token is variable
        if  (isValidVariableAndNotReserved(str)){
            // if is invalid length or illegal variable, it will fail at check
            
            // insert token record in record_table
            insertNamerecord_table(LexRecordIndex++, record_table, lexVar, 0, ' ', ' ', str, 2 );
            
            continue;
        }
        
        // check if token special symbol
        if  ( ( ss = isSpecialChar(str[0]) ) && tknlen == 1 ){
            
            // current token is a symbol, check if next token is symbol
            // do not increase index counter, just look ahead
            if (i < m_nCleanInputTokens -1){
                char *strNext = caCleanInputTokens[i + 1];
                tknLenNext = strlen(str);
                // isSpecialChar(strNext[0]) == 7
                if ( strlen(strNext) == 1 && (isSpecialChar(strNext[0]) == 12 || isSpecialChar(strNext[0]) == 13  ) ) {
                    // next token is of length 1, is a symbol
                    // check if they are a legal symbol pair : >=, <=, < >, :=
                    if ((vs = validSymbolPair(str[0], strNext[0])) ) {
                        i++;
                        
                        // insert token record in record_table
                        insertNamerecord_table(LexRecordIndex++, record_table, lexProc, 1, str[0], strNext[0], " ", vs );
                        
                        continue;
                    }
                }
            }
            
            // insert token record in record_table
            insertNamerecord_table(LexRecordIndex++, record_table, lexProc, 0, ' ', ' ', str, m_naSpecialSymbols[(ss - 1)]  );
            
            continue;
        }
    }
    
}

/*
 *  "validSymbolPair(char c1, char c2)"
 *  it will take current character c1, and next char c2
 *  check if the combo of both is a legal lexime >=, <=, :=, < >
 *  it it is legal lexeme, it returns the lexeme value for the combo
 *  if it is illegal, is a fatal error and exit program
 */
int validSymbolPair(char c1, char c2){
    // c1, is current symbol, c2 is next symbol
    // check if they are a legal symbol pair : >=, <=, :=, < >
    
    int r = 0;
    char symbolPair[3];
    
    switch (c2) {
        case '=':
            if (r += ( (c1 == '>') ? geqsym : 0 )) { break; }
            if (r += ( (c1 == '<') ? leqsym : 0 )) { break; }
            if (r += ( (c1 == ':') ? becomessym : 0 )) { break; }
            break;
            
        case '>':
            if (r += ( (c1 == '<') ? neqsym : 0 )) { break; }
            break;
            
        default:
            //char symbolPair[3];
            symbolPair[0] = c1; symbolPair[1] = c2; symbolPair[2] = '\0';
            printError(err32, symbolPair);
            exit(EXIT_FAILURE);
            break;
    }
    
    return r;
    
}

//----------------------ctype functions ---- 1 for numerical, 2 for letter, 3 for punctuation

/*
 *  binarySearch (int *Array, int top, int target)
 *  search for a char c ascii value, if it is in list of values in Array passed
 *  return 1, else is not found return 0;
 *  -----------DEPRECATED, NO LONGER NEEDED, WILL DELETE AT A LATER TIME -------------
 */
int binarySearch (int *Array, int top, int target) {
    // Given a ascending sorted Array[0..top],
    // Return 1 such that Array[i] = target.
    // Return 0 if target is not in Array.
    
    int lower, middle, upper;
    lower = 0;
    upper = top;
    
    while ( upper >= lower  ) {
        middle = ( upper + lower ) / 2;
        if  (Array[middle] == target){
            return( middle + 1 );
        }
        if (Array[middle] < target){
            lower = middle + 1;
        }
        else { upper = middle - 1;}
    };
    
    // not found.
    return( 0 );
}


/*
 *  isDigit(char c)
 *  return 1 if char is a digit, 0 if not
 */
int isDigit(char c){
    // if char c is a number, it will return a 1, else 0 as found in global array
    return g_naIsNumerical[ (int)c ];
    
}

/*
 *  isAlpha(char c)
 *  return 2 if char is an alpha, 0 if not
 */
int isAlpha(char c){
    // if char c is a letter, it will return a 1, else 0 as found in global array
    return g_naIsAlphaChar[ (int)c ] * 2;
    
}

/*
 *  isPunct(char c)
 *  return 3 if char is an punctuation, 0 if not
 */
int isPunct(char c){
    // if char c is a punctuation, it will return a 1, else 0 as found in global array
    return g_naIsPunctChar[ (int)c ] * 3;
    
}

int isNewLine(char c){
    return (int)c == 13 || (int)c == 10 ? 1 : 0;
}

/*
 *  initializeNamerecord_table(namerecord_t *record_table)
 *  set the default values for the namerecord_t record_table
 *  check that strcpy was valid for the char arrray
 */
void initializeNamerecord_table(namerecord_t *record_table){
    // initialize tokens record table
    int i = 0;
    for (i = 0; i < m_nCleanCount ; i++) {
        
        record_table[i].kind = 0;           // constant = 1; var = 2, proc = 3
        if ( strcpy(record_table[i].name, "") == NULL) {
            printError(err33, "Namerecord_table");
            exit(EXIT_FAILURE);
        };                                  // name up to 11 characters long, 11 + 1 for \0
        record_table[i].val = 0;            // number (ASCII value)
        record_table[i].level = 0;          // L level
        record_table[i].adr = 0;            // M address
    }
    return;
    
}

/*
 *  insertNamerecord_table(.....)
 *  enter one record at a time as being passed from "IdentifyInputToken(...)"
 *
 */
void insertNamerecord_table(int RecordIndex, namerecord_t *record_table, int tknKind, int ComboChars, char c1, char c2, char *lexeme, int tknType){
    int i = RecordIndex;
    // tknKind are >= 1
    // typedef enum {lexConstant = 1, lexVar, lexProc} eLexemeKind;
    if (tknKind) {
        
        record_table[i].kind = tknKind;           // constant = 1; var = 2, proc = 3
        if (ComboChars ) {
            record_table[i].name[0] = c1;
            record_table[i].name[1] = c2;
            record_table[i].name[2] = '\0';
        } else {
            if ( strcpy(record_table[i].name, lexeme) == NULL) {
                printError(err34, lexeme);
                //printf("Error: fail creating space to store token string: %s \n", lexeme);
                exit(EXIT_FAILURE);
            };
        }                                   // name up to 11 characters long, 11 + 1 for \0
        record_table[i].val = tknType;      // number (ASCII value)
        record_table[i].level = 0;          // L level
        record_table[i].adr = 0;            // M address
    }
    return;
    
}

/*
 * "printNamerecord_table(namerecord_t *record_table)"
 *  print each record from the table to lexemetable and lexemelist
 */
void printNamerecord_table(namerecord_t *record_table){
    
    
    // copy lexemetable file pointer
    FILE *lexTable = m_FPS[lexemetable_txt];
    // copy lexemelist file pointer
    FILE *lexList = m_FPS[lexemelist_txt];
    
    int i = 0;
    
    if (record_table != NULL) {
        
        // print headers to screen
        // printf("\n\n%-12s%s\n", LBLS[0], LBLS[1]); // deprecated for #3
        
        if (OTC) { printf("\nScanners LexemeList\n");}
        
        // print headers to lexemetable.txt file
        fprintf( lexTable, "%-12s%s\n", LBLS[0], LBLS[1] );
        
        // print each lexeme record from record_table
        for (i = 0; i < m_nCleanCount; i++) {
            if (record_table[i].kind) {
                // print lexeme to screen
                // printf("%-12s%d\n",record_table[i].name, record_table[i].val ); // deprecated for #3
                // print lexeme to lexemetable.txt file
                fprintf( lexTable, "%-12s%d\n", record_table[i].name, record_table[i].val );
                
                // print lexeme list
                if (OTC ) { printf("%d ", record_table[i].val ); }
                fprintf( lexList, "%d ", record_table[i].val );
                // if lexeme is either a variable or a constant, print the variable or the constant right after the token type
                if ( (record_table[i].val == 2) || (record_table[i].val == 3) ){
                    if (OTC) { printf( "%s ", record_table[i].name ); }
                    fprintf( lexList, "%s ", record_table[i].name );
                }
                
            }
        }
    }
    if (OTC) { printf("\n\n");}
    // close the -lexemetable.txt- file pointer
    fclose(lexTable);
    // close the -lexemelist.txt- file pointer
    fclose(lexList);
    
    return;
}

/*
 *  printError(int ErrorNumber)
 *  Print the string that is represented by the error number passed
 */
void printError(int ErrorNumber, char *strToken){
    int i = 0;
    // always print what caused the error, then if error number is identified
    // print error information, else general message outside "IF" statement
    if(strToken) {
        printf("Lexeme or token  %s  caused an error\n", strToken);
    }
    
    // print the error message given an error number from g_caErrorMsgs[] char* array
    if (ErrorNumber <= MAX_ERROR) {
        // to find error string, substract offset of 1
        printf("Error %d, %s\n", ErrorNumber, g_caErrorMsgs[ErrorNumber - 1]);
        return;
    }
    // if error number is not in array, still print there is an error, but number
    // not recognized
    printf("Error, ErrorNumber %d not recognized\n", ErrorNumber);
    // empty the files to avoid trash print by sybsequent components of the virtual machine
    FILE *fpClean = NULL;
    for (i = 0; i < 3; i++) {
        fpClean = fopen(FILECLEANUP[i],"w");
        fclose(fpClean);
    }
    fpClean = NULL;
    return;
    
}

/*
 *  gInitGlobalintIsCharArrays()
 *  Initialize all the ischar arrays to 0 zero first
 *  then initialize to 1 those chars that belong to each group
 */
void gInitGlobalintIsCharArrays(){
    
    int i = 0, p = 0, n = 0, s = 0, temp = 0;
    
    // initialize all indexes to 0
    for (i = 0; i < MAX_ASCII; i++) {
        g_naIsAlphaChar[i] = g_naIsPunctChar[i] = g_naIsNumerical[i] = g_naIsSpecialChar[i] = 0;
    }
    // set each array index to 1 or 0 is char belongs to group
    // for special characters, set the global index to the special chars index containing the
    // lexememe index value with
    // an offset of 1, i.e. index 0 == 1, to allow searches in spcial char lexeme array with offset of -1
    for (i = 0; i < AlphaTop; i++, n++, s++, p++ ) {
        
        ( n < NumberTop ) ?  g_naIsNumerical[ m_naNumericalChars[n] ] = 1 : 0;
        ( s < SpecialCharTop ) ? g_naIsSpecialChar[ m_naSpecSymPunt[s] ] = (s + 1) : 0;
        ( p < PunctTop ) ?  g_naIsPunctChar[ m_naPunctChars[p] ] = 1 : 0;
        g_naIsAlphaChar[ m_naAlphaChars[i] ] = 1;
        
    }
    
}

// are strings equal, return 1 for true, 0 for false
int strsAreEqual(char * stt1, char *str2){
    
    return strcmp(stt1, str2) == 0;
    
}