├── test
    ├── .gitkeep
    ├── mocha.opts
    ├── cpp_unit
    │   ├── cases
    │   │   ├── case_1.c
    │   │   ├── case_1.c.pp
    │   │   ├── case_2.c.pp
    │   │   ├── case_2.c
    │   │   ├── case_4.c.pp
    │   │   ├── case_4.c
    │   │   ├── case_3.c.pp
    │   │   └── case_3.c
    │   └── cpp_unit.js
    └── lex_unit
    │   ├── cases
    │       ├── case_1.c.pp
    │       ├── case_2.c.pp
    │       ├── case_3.c.pp
    │       └── case_4.c.pp
    │   └── lex_unit.js
├── .gitignore
├── index.js
├── lib
    ├── node-c-lexer.js
    ├── cpp-unit.js
    ├── token-rules.js
    └── lex-unit.js
├── package.json
└── README.md


/test/.gitkeep:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
1 | node_modules
2 | 


--------------------------------------------------------------------------------
/test/mocha.opts:
--------------------------------------------------------------------------------
1 | --recursive
2 | 


--------------------------------------------------------------------------------
/index.js:
--------------------------------------------------------------------------------
1 | module.exports =  require('./lib/node-c-lexer');
2 | 


--------------------------------------------------------------------------------
/test/cpp_unit/cases/case_1.c:
--------------------------------------------------------------------------------
1 | int main(){
2 |     return 0;
3 | }
4 | 


--------------------------------------------------------------------------------
/test/cpp_unit/cases/case_1.c.pp:
--------------------------------------------------------------------------------
1 | int main(){
2 |     return 0;
3 | }
4 | 


--------------------------------------------------------------------------------
/test/lex_unit/cases/case_1.c.pp:
--------------------------------------------------------------------------------
1 | int main(){
2 |     return 0;
3 | }
4 | 


--------------------------------------------------------------------------------
/test/cpp_unit/cases/case_2.c.pp:
--------------------------------------------------------------------------------
1 | 
2 | 
3 | int main(){
4 |     int a[100];
5 |     return 0;
6 | }
7 | 


--------------------------------------------------------------------------------
/test/lex_unit/cases/case_2.c.pp:
--------------------------------------------------------------------------------
1 | 
2 | 
3 | int main(){
4 |     int a[100];
5 |     return 0;
6 | }
7 | 


--------------------------------------------------------------------------------
/test/cpp_unit/cases/case_2.c:
--------------------------------------------------------------------------------
1 | #define MAX 100
2 | 
3 | int main(){
4 |     int a[MAX];
5 |     return 0;
6 | }
7 | 


--------------------------------------------------------------------------------
/lib/node-c-lexer.js:
--------------------------------------------------------------------------------
1 | var lexUnit = require("./lex-unit");
2 | module.exports.lexUnit = lexUnit;
3 | 
4 | var cppUnit = require("./cpp-unit");
5 | module.exports.cppUnit = cppUnit;
6 | 


--------------------------------------------------------------------------------
/test/cpp_unit/cases/case_4.c.pp:
--------------------------------------------------------------------------------
 1 | 
 2 | 
 3 | 
 4 | int main()
 5 | {
 6 |     int i;
 7 |     clock_t time1, time2;
 8 |     time1= clock();
 9 |     for (i=1; i<=100000; i++);
10 |     time2=clock();
11 |     printf("%f seconds\n",(float)(time2-time1)/((clock_t) 1000000));
12 | 
13 | }
14 | 


--------------------------------------------------------------------------------
/test/cpp_unit/cases/case_4.c:
--------------------------------------------------------------------------------
 1 | #include <stdio.h>
 2 | #include <time.h>
 3 | 
 4 | int main()
 5 | {
 6 |     int i;
 7 |     clock_t time1, time2;
 8 |     time1= clock();
 9 |     for (i=1; i<=100000; i++);
10 |     time2=clock();
11 |     printf("%f seconds\n",(float)(time2-time1)/CLOCKS_PER_SEC);
12 | 
13 | }
14 | 


--------------------------------------------------------------------------------
/test/cpp_unit/cases/case_3.c.pp:
--------------------------------------------------------------------------------
 1 | 
 2 | 
 3 | int factorial(int n){
 4 |     if(n == 1) return 1;
 5 |     else return n*factorial(n-1);
 6 | }
 7 | 
 8 | int main(){
 9 |     int a;
10 |     printf("Input number:\n");
11 |     scanf("%d", &a);
12 |     printf("Factorial of given number is: %d\n", factorial(a));
13 |     return 0;
14 | }
15 | 


--------------------------------------------------------------------------------
/test/lex_unit/cases/case_3.c.pp:
--------------------------------------------------------------------------------
 1 | 
 2 | 
 3 | int factorial(int n){
 4 |     if(n == 1) return 1;
 5 |     else return n*factorial(n-1);
 6 | }
 7 | 
 8 | int main(){
 9 |     int a;
10 |     printf("Input number:\n");
11 |     scanf("%d", &a);
12 |     printf("Factorial of given number is: %d\n", factorial(a));
13 |     return 0;
14 | }
15 | 


--------------------------------------------------------------------------------
/test/cpp_unit/cases/case_3.c:
--------------------------------------------------------------------------------
 1 | #include <stdio.h>
 2 | 
 3 | int factorial(int n){
 4 |     if(n == 1) return 1;
 5 |     else return n*factorial(n-1);
 6 | }
 7 | 
 8 | int main(){
 9 |     int a;
10 |     printf("Input number:\n");
11 |     scanf("%d", &a);
12 |     printf("Factorial of given number is: %d\n", factorial(a));
13 |     return 0;
14 | }
15 | 


--------------------------------------------------------------------------------
/test/lex_unit/cases/case_4.c.pp:
--------------------------------------------------------------------------------
 1 | 
 2 | 
 3 | int factorial(int n){
 4 |     // Terminal condition of recursion.
 5 |     /*
 6 |     If n is equal to 1 then no need to go any deeper level of recursion.
 7 |     Rather return 1. Because factorial of 1 is 1.
 8 |     */
 9 |     if(n == 1) return 1;
10 |     else return n*factorial(n-1);
11 | }
12 | 
13 | int main(){
14 |     int a;
15 |     /*** Print a message
16 | 	 * A message to inform user what to provide
17 | 	 **/
18 |     printf("Input number:\n");
19 | 	/**
20 | 	 * Take input
21 | 	 */
22 |     scanf("%d", &a);
23 |     printf("Factorial of given number is: %d\n", factorial(a));
24 |     return 0;
25 | }
26 | 


--------------------------------------------------------------------------------
/package.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "name": "node-c-lexer",
 3 |   "version": "1.0.5",
 4 |   "description": "NodeJS library to get token stream from C code.",
 5 |   "main": "index.js",
 6 |   "scripts": {
 7 |     "test": "node_modules/.bin/mocha"
 8 |   },
 9 |   "repository": {
10 |     "type": "git",
11 |     "url": "https://github.com/taufique71/node-c-lexer.git"
12 |   },
13 |   "keywords": [
14 |     "node",
15 |     "c",
16 |     "lexer"
17 |   ],
18 |   "author": "Md. Taufique Hussain",
19 |   "license": "ISC",
20 |   "bugs": {
21 |     "url": "https://github.com/taufique71/node-c-lexer/issues"
22 |   },
23 |   "homepage": "https://github.com/taufique71/node-c-lexer",
24 |   "dependencies": {
25 |     "async": "^1.5.1",
26 |     "jison": "^0.4.15",
27 |     "lex": "^1.7.9",
28 |     "uuid": "^2.0.1"
29 |   },
30 |   "devDependencies": {
31 |     "assert": "^1.4.1",
32 |     "async": "^1.5.2",
33 |     "chai": "^3.5.0",
34 |     "diff": "^3.0.1",
35 |     "mocha": "^2.3.4"
36 |   }
37 | }
38 | 


--------------------------------------------------------------------------------
/test/lex_unit/lex_unit.js:
--------------------------------------------------------------------------------
 1 | var fs = require("fs");
 2 | var diff = require("diff");
 3 | var async = require("async");
 4 | var assert = require("chai").assert;
 5 | var expect = require("chai").expect;
 6 | var should = require("chai").should();
 7 | 
 8 | describe("Tests for lexing unit", function(){
 9 |     it("Should be able to require tokenize as function", function(){
10 |         var tokenize = require("../../lib/lex-unit.js").tokenize;
11 |         assert(tokenize);
12 |         assert(typeof(tokenize), "function");
13 |     });
14 |     it("case_1 should have 9 tokens", function(done){
15 |         var input_file = __dirname + "/cases/case_1.c.pp";
16 |         var tokenize = require("../../lib/lex-unit.js").tokenize;
17 |         fs.readFile(input_file, "utf-8", function(err, code_text){
18 |             if(err) done(err);
19 |             else{
20 |                 var tokens = tokenize(code_text);
21 |                 assert.equal(tokens.length, 9);
22 |                 done();
23 |             }
24 |         });
25 |     });
26 |     it("case_2 should have 15 tokens", function(done){
27 |         var input_file = __dirname + "/cases/case_2.c.pp";
28 |         var tokenize = require("../../lib/lex-unit.js").tokenize;
29 |         fs.readFile(input_file, "utf-8", function(err, code_text){
30 |             if(err) done(err);
31 |             else{
32 |                 var tokens = tokenize(code_text);
33 |                 assert.equal(tokens.length, 15);
34 |                 done();
35 |             }
36 |         });
37 |     });
38 |     it("case_3 should have 63 tokens", function(done){
39 |         var input_file = __dirname + "/cases/case_3.c.pp";
40 |         var tokenize = require("../../lib/lex-unit.js").tokenize;
41 |         fs.readFile(input_file, "utf-8", function(err, code_text){
42 |             if(err) done(err);
43 |             else{
44 |                 var tokens = tokenize(code_text);
45 |                 assert.equal(tokens.length, 63);
46 |                 done();
47 |             }
48 |         });
49 |     });
50 |     it("case_4 should have 63 tokens", function(done){
51 |         var input_file = __dirname + "/cases/case_4.c.pp";
52 |         var tokenize = require("../../lib/lex-unit.js").tokenize;
53 |         fs.readFile(input_file, "utf-8", function(err, code_text){
54 |             if(err) done(err);
55 |             else{
56 |                 var tokens = tokenize(code_text);
57 |                 assert.equal(tokens.length, 63);
58 |                 done();
59 |             }
60 |         });
61 |     });
62 | });
63 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | # node-c-lexer
 2 | Lexical analyzer library for C programming language in NodeJS
 3 | 
 4 | ### Usage
 5 | There are two units in the library - a preprocessing unit and a lexical analyzing
 6 | unit. These two units can be used independently. The preprocessing unit is
 7 | included so that the user can strip preprocessor output from the code and
 8 | then feed the result to the scanning unit to get a token stream.
 9 | 
10 | ##### Preprocessing Unit
11 | To use the preprocessing unit, the C code needs to reside in a file.
12 | ```js
13 | var lexer = require("node-c-lexer");
14 | lexer.cppUnit.clearPreprocessors("./a.c", function(err, codeText){
15 |     if(err){
16 |         /* Some error occurred */
17 |     }
18 |     else{
19 |         /* Do what you want to do with preprocessor free code text */
20 |     }
21 | });
22 | ```
23 | The clearPreprocessors method by default invokes `cpp` on the first argument,
24 | producing an intermediate preprocessed file. It then finalizes the output by stripping
25 | the output of the preprocessor from the intermediate file and passing it to your callback
26 | as codeText.
27 | 
28 | If you already have preprocessed files (.ii) at hand, you can skip the preprocessing step
29 | by passing the path to your preprocessed file as your last argument.
30 | 
31 | One reason you might want to do this is if you, for instance, have a
32 | separate environment in which your .ii files are generated (e.g. preprocessed files are produced
33 | within your Windows bash environment), or if your preprocessing pass diverges from
34 | the execution of a simple 'cpp' command in general.
35 | ```js
36 | var lexer = require("node-c-lexer");
37 | lexer.cppUnit.clearPreprocessors("./a.c", function(err, codeText){
38 |     if(err){
39 |         /* Some error occurred */
40 |     }
41 |     else{
42 |         /* Do what you want to do with preprocessor free code text */
43 |     }
44 | }, "./a.ii");
45 | ```
46 | 
47 | ##### Scanning Unit
48 | ```js
49 | var lexer = require("node-c-lexer");
50 | var tokenStream = lexer.lexUnit.tokenize(codeText);
51 | /* Now do what you want with token stream */
52 | ```
53 | The token stream is an array of tokens. Each token is a single JavaScript
54 | object. The format of a single token is as follows:
55 | ```js
56 | {
57 |     "lexeme": "func",
58 |     "row": 5,
59 |     "col": 3,
60 |     "tokenClass": "IDENTIFIER",
61 |     "keyword": false,
62 |     "parent": null,
63 |     "children": null
64 | }
65 | ```
66 | ```parent``` and ```children```
67 | are kept so that a parse tree can be built using the tokens as nodes.
68 | 


--------------------------------------------------------------------------------
/lib/cpp-unit.js:
--------------------------------------------------------------------------------
 1 | var exec = require("child_process").exec;
 2 | var uuid = require("uuid");
 3 | var fs = require("fs");
 4 | 
 5 | /**
 6 |  * Extracts preprocessor directives from a file
 7 |  * with the 'cpp' command that's in your PATH.
 8 |  * @param {string} fileName - Absolute path to the input file.
 9 |  * @param {outputCallback} cb - function called with the output (codeText)
10 |  * @param {string} outFile - An optional paramater that is assummed
11 |  *  To be the corresponding preprocessed file, when provided
12 |  *  Automatic preprocessing with 'cpp' is omitted.
13 |  */
14 | var clearPreprocessors = function(fileName, cb, outFile){
15 |     var cppFileName = uuid.v1();
16 |     var commandToExecute = "cpp" + " " + fileName + " " + cppFileName;
17 |     if (outFile != null){
18 |         clear_pp_portion(fileName, outFile, cb, false);
19 |     }
20 |     else{
21 |         exec(commandToExecute, function(err, stdout, stderr){
22 |             if(!err){
23 |                 clear_pp_portion(fileName, cppFileName, cb, true);
24 |             }
25 |             else{
26 |                 cb(err);
27 |             }
28 |         });
29 |     }
30 | 
31 |     /**
32 |      * Extracts preprocessor directives from an already
33 |      * preprocessed file
34 |      * @param {string} original - Absolute path to the unpreprocessed file.
35 |      * @param {string} preprocessed - Absolute path the the coresseponding preprocessed file.
36 |      * @param {outputCallback} cb - function called with the output (codeText)
37 |      * @param {bool} delPreprocessed - delete (preprocessed) if true
38 |      */
39 |     function clear_pp_portion(original, preprocessed, cb, delPreprocessed){
40 |         var line_reader = require('readline').createInterface({
41 |             input: require('fs').createReadStream(preprocessed)
42 |         });
43 | 
44 |         var on_off_flag = false;
45 |         var list_of_lines = [];
46 |         var code_text = "";
47 |         var prev_line = "";
48 |         var target_line_no = 0;
49 |         var file_name_to_match = '"' + original + '"';
50 | 
51 |         line_reader.on('line', function (line) {
52 |             var tokens = line.split(" ");
53 |             if(tokens[0] === "#"){
54 |                 var line_no = parseInt(tokens[1]);
55 |                 var file_name = tokens[2];
56 |                 if(file_name === file_name_to_match){
57 |                     on_off_flag = true;
58 |                     target_line_no = line_no;
59 |                 }
60 |                 else{
61 |                     if(on_off_flag === true){
62 |                         list_of_lines.push("");
63 |                     }
64 |                     on_off_flag = false;
65 |                 }
66 |             }
67 |             else{
68 |                 if(on_off_flag === true){
69 |                     if(target_line_no <= list_of_lines.length){
70 |                         line = line.trim();
71 |                         list_of_lines[target_line_no - 1] = list_of_lines[target_line_no - 1] + line;
72 |                         target_line_no++;
73 |                     }
74 |                     else{
75 |                         list_of_lines.push(line);
76 |                         target_line_no++;
77 |                     }
78 |                 }
79 |             }
80 | 
81 |         });
82 | 
83 |         line_reader.on('close', function() {
84 |             if (delPreprocessed){
85 |                 commandToExecute = "rm " + cppFileName;
86 |                 exec(commandToExecute, function(err, stdout, stderr){
87 |                     cb(null, list_of_lines.join("\n")+"\n");
88 |                 });
89 |             }
90 |             else{
91 |                 cb(null, list_of_lines.join("\n")+"\n");
92 |             }
93 |         });
94 |     }
95 | }
96 | module.exports.clearPreprocessors = clearPreprocessors;
97 | 


--------------------------------------------------------------------------------
/lib/token-rules.js:
--------------------------------------------------------------------------------
  1 | var tokenRules = {
  2 |     "singleLineComment":            /\/\/.*/,
  3 |     "multiLineComment":             /\/\*([^\*]|[\r\n]|(\*+([^\/\*]|[\n\r])))*\*+\//,
  4 |     "while":                        /while/,
  5 |     "volatile":                     /volatile/,
  6 |     "void":                         /void/,
  7 |     "unsigned":                     /unsigned/,
  8 |     "union":                        /union/,
  9 |     "typedef":                      /typedef/,
 10 |     "switch":                       /switch/,
 11 |     "struct":                       /struct/,
 12 |     "static":                       /static/,
 13 |     "sizeof":                       /sizeof/,
 14 |     "signed":                       /signed/,
 15 |     "short":                        /short/,
 16 |     "return":                       /return/,
 17 |     "register":                     /register/,
 18 |     "long":                         /long/,
 19 |     "int":                          /int/,
 20 |     "if":                           /if/,
 21 |     "goto":                         /goto/,
 22 |     "for":                          /for/,
 23 |     "float":                        /float/,
 24 |     "extern":                       /extern/,
 25 |     "enum":                         /enum/,
 26 |     "else":                         /else/,
 27 |     "double":                       /double/,
 28 |     "do":                           /do/,
 29 |     "default":                      /default/,
 30 |     "continue":                     /continue/,
 31 |     "const":                        /const/,
 32 |     "char":                         /char/,
 33 |     "case":                         /case/,
 34 |     "break":                        /break/,
 35 |     "auto":                         /auto/,
 36 |     "bool":                         /_Bool/,
 37 |     "complex":                      /_Complex/,
 38 |     "imaginary":                    /_Imaginary/,
 39 |     "inline":                       /inline/,
 40 |     "restrict":                     /restrict/,
 41 |     "identifier":                   /[A-Za-z_]\w*/,
 42 |     "hexadecimal":                  /0[xX][a-fA-F0-9]+((u|U)|((u|U)?(l|L|ll|LL))|((l|L|ll|LL)(u|U)))?/,
 43 |     "octal":                        /0[0-7]+((u|U)|((u|U)?(l|L|ll|LL))|((l|L|ll|LL)(u|U)))?/,
 44 |     "decimal":                      /[0-9]+((u|U)|((u|U)?(l|L|ll|LL))|((l|L|ll|LL)(u|U)))?/,
 45 |     "char_literal":                 /[a-zA-Z_]?\'(\\.|[^\\'\n])+\'/,
 46 |     "floatWithoutPoint":            /[0-9]+([Ee][+-]?[0-9]+)(f|F|l|L)?/,
 47 |     "floatWithNothingBeforePoint":  /[0-9]*\.[0-9]+([Ee][+-]?[0-9]+)?(f|F|l|L)?/,
 48 |     "floatWithNothingAfterPoint":   /[0-9]+\.[0-9]*([Ee][+-]?[0-9]+)?(f|F|l|L)?/,
 49 |     "string_literal":               /[a-zA-Z_]?\"(\\.|[^\\"\n])*\"/,
 50 |     "ellipsis":                     /\.\.\./,
 51 |     "right_assign":                 />>=/,
 52 |     "left_assign":                  /<<=/,
 53 |     "add_assign":                   /\+=/,
 54 |     "sub_assign":                   /\-=/,
 55 |     "mul_assign":                   /\*=/,
 56 |     "div_assign":                   /\/=/,
 57 |     "mod_assign":                   /%=/,
 58 |     "and_assign":                   /&=/,
 59 |     "xor_assign":                   /\^=/,
 60 |     "or_assign":                    /\|=/,
 61 |     "right_op":                     />>/,
 62 |     "left_op":                      /<</,
 63 |     "inc_op":                       /\+\+/,
 64 |     "dec_op":                       /\-\-/,
 65 |     "ptr_op":                       /\->/,
 66 |     "and_op":                       /&&/,
 67 |     "or_op":                        /\|\|/,
 68 |     "le_op":                        /<=/,
 69 |     "ge_op":                        />=/,
 70 |     "eq_op":                        /==/,
 71 |     "ne_op":                        /!=/,
 72 |     ";":                            /;/,
 73 |     "{":                            /{|<%/,
 74 |     "}":                            /}|%>/,
 75 |     ",":                            /,/,
 76 |     ":":                            /:/,
 77 |     "=":                            /=/,
 78 |     "(":                            /\(/,
 79 |     ")":                            /\)/,
 80 |     "[":                            /\[|<:/,
 81 |     "]":                            /\]|:>/,
 82 |     ".":                            /\./,
 83 |     "&":                            /&/,
 84 |     "!":                            /!/,
 85 |     "~":                            /~/,
 86 |     "-":                            /\-/,
 87 |     "+":                            /\+/,
 88 |     "*":                            /\*/,
 89 |     "/":                            /\//,
 90 |     "%":                            /%/,
 91 |     "<":                            /</,
 92 |     ">":                            />/,
 93 |     "^":                            /\^/,
 94 |     "|":                            /\|/,
 95 |     "?":                            /\?/,
 96 |     "whitespace":                   /[ \t\v\r\n\f]/,
 97 |     "unmatched":                    /./
 98 | };
 99 | module.exports.tokenRules = tokenRules;
100 | 


--------------------------------------------------------------------------------
/test/cpp_unit/cpp_unit.js:
--------------------------------------------------------------------------------
  1 | var fs = require("fs");
  2 | var diff = require("diff");
  3 | var async = require("async");
  4 | var assert = require("chai").assert;
  5 | var expect = require("chai").expect;
  6 | var should = require("chai").should();
  7 | 
  8 | describe("Tests for preprocessor removal unit", function(){
  9 |     it("Should be able to require clearPreprocessors as function", function(){
 10 |         var clearPreprocessors = require("../../lib/cpp-unit.js").clearPreprocessors;
 11 |         assert(clearPreprocessors);
 12 |         assert(typeof(clearPreprocessors), "function");
 13 |     });
 14 |     it("Should successfully remove preprocessor from case_1.c file", function(done){
 15 |         var input_file = __dirname + "/cases/case_1.c";
 16 |         var output_file = __dirname + "/cases/case_1.c.pp";
 17 |         var clearPreprocessors = require("../../lib/cpp-unit.js").clearPreprocessors;
 18 |         async.parallel([
 19 |             function(read_output_file){
 20 |                 fs.readFile(output_file, "utf-8", function(err, data){
 21 |                     if(err) read_output_file(err);
 22 |                     else read_output_file(null, data);
 23 |                 });
 24 |             },
 25 |             function(perform_operation){
 26 |                 clearPreprocessors(input_file, function(err, data){
 27 |                     if(err) perform_operation(err);
 28 |                     else perform_operation(null, data);
 29 |                 });
 30 |             }
 31 |         ], function(err, results){
 32 |             if(err) done(err);
 33 |             else{
 34 |                 var d = diff.diffChars(results[0], results[1]);
 35 |                 assert.equal(d.length, 1);
 36 |                 done(null);
 37 |             }
 38 |         });
 39 |     });
 40 |     it("Should successfully remove preprocessor from case_2.c file", function(done){
 41 |         var input_file = __dirname + "/cases/case_2.c";
 42 |         var output_file = __dirname + "/cases/case_2.c.pp";
 43 |         var clearPreprocessors = require("../../lib/cpp-unit.js").clearPreprocessors;
 44 |         async.parallel([
 45 |             function(read_output_file){
 46 |                 fs.readFile(output_file, "utf-8", function(err, data){
 47 |                     if(err) read_output_file(err);
 48 |                     else read_output_file(null, data);
 49 |                 });
 50 |             },
 51 |             function(perform_operation){
 52 |                 clearPreprocessors(input_file, function(err, data){
 53 |                     if(err) perform_operation(err);
 54 |                     else perform_operation(null, data);
 55 |                 });
 56 |             }
 57 |         ], function(err, results){
 58 |             if(err) done(err);
 59 |             else{
 60 |                 var d = diff.diffChars(results[0], results[1]);
 61 |                 assert.equal(d.length, 1);
 62 |                 done(null);
 63 |             }
 64 |         });
 65 |     });
 66 |     it("Should successfully remove preprocessor from case_3.c file", function(done){
 67 |         var input_file = __dirname + "/cases/case_3.c";
 68 |         var output_file = __dirname + "/cases/case_3.c.pp";
 69 |         var clearPreprocessors = require("../../lib/cpp-unit.js").clearPreprocessors;
 70 |         async.parallel([
 71 |             function(read_output_file){
 72 |                 fs.readFile(output_file, "utf-8", function(err, data){
 73 |                     if(err) read_output_file(err);
 74 |                     else read_output_file(null, data);
 75 |                 });
 76 |             },
 77 |             function(perform_operation){
 78 |                 clearPreprocessors(input_file, function(err, data){
 79 |                     if(err) perform_operation(err);
 80 |                     else perform_operation(null, data);
 81 |                 });
 82 |             }
 83 |         ], function(err, results){
 84 |             if(err) done(err);
 85 |             else{
 86 |                 var d = diff.diffChars(results[0], results[1]);
 87 |                 assert.equal(d.length, 1);
 88 |                 done(null);
 89 |             }
 90 |         });
 91 |     });
 92 |     it("Should successfully remove preprocessor from case_4.c file", function(done){
 93 |         var input_file = __dirname + "/cases/case_4.c";
 94 |         var output_file = __dirname + "/cases/case_4.c.pp";
 95 |         var clearPreprocessors = require("../../lib/cpp-unit.js").clearPreprocessors;
 96 |         async.parallel([
 97 |             function(read_output_file){
 98 |                 fs.readFile(output_file, "utf-8", function(err, data){
 99 |                     if(err) read_output_file(err);
100 |                     else read_output_file(null, data);
101 |                 });
102 |             },
103 |             function(perform_operation){
104 |                 clearPreprocessors(input_file, function(err, data){
105 |                     if(err) perform_operation(err);
106 |                     else perform_operation(null, data);
107 |                 });
108 |             }
109 |         ], function(err, results){
110 |             if(err) done(err);
111 |             else{
112 |                 var d = diff.diffChars(results[0], results[1]);
113 |                 assert.equal(d.length, 1);
114 |                 done(null);
115 |             }
116 |         });
117 |     });
118 | });
119 | 


--------------------------------------------------------------------------------
/lib/lex-unit.js:
--------------------------------------------------------------------------------
   1 | var tokenRules = require("./token-rules")["tokenRules"];
   2 | var Lexer = require("lex");
   3 | var lexer = new Lexer;
   4 | 
   5 | var row = 1, col = 1;
   6 | 
   7 | var count = function(lexeme){
   8 |     for(var i = 0; i<lexeme.length; i++){
   9 |         if(lexeme[i] == '\n'){
  10 |             row = row + 1;
  11 |             col = 1;
  12 |         }
  13 |         else if(lexeme[i] == '\t'){
  14 |             col = col + (4 - (col % 4));
  15 |         }
  16 |         else{
  17 |             col = col + 1;
  18 |         }
  19 |     }
  20 | }
  21 | 
  22 | var tokenize = function(streamOfText){
  23 |     row = 1; col = 1;
  24 |     var streamOfTokens = [];
  25 |     lexer.addRule(tokenRules["singleLineComment"], function(lexeme){
  26 |         var token = {};
  27 |         token["lexeme"] = lexeme;
  28 |         token["row"] = row;
  29 |         token["col"] = col;
  30 |         token["tokenClass"] = "COMMENT";
  31 |         token["keyword"] = false;
  32 |         token["parent"] = null;
  33 |         token["children"] = null;
  34 |         count(lexeme);
  35 |         return token;
  36 |     });
  37 |     lexer.addRule(tokenRules["multiLineComment"], function(lexeme){
  38 |         var token = {};
  39 |         token["lexeme"] = lexeme;
  40 |         token["row"] = row;
  41 |         token["col"] = col;
  42 |         token["tokenClass"] = "COMMENT";
  43 |         token["keyword"] = false;
  44 |         token["parent"] = null;
  45 |         token["children"] = null;
  46 |         count(lexeme);
  47 |         return token;
  48 |     });
  49 |     lexer.addRule(tokenRules["while"], function(lexeme){
  50 |         var token = {};
  51 |         token["lexeme"] = lexeme;
  52 |         token["row"] = row;
  53 |         token["col"] = col;
  54 |         token["tokenClass"] = "WHILE";
  55 |         token["keyword"] = true;
  56 |         token["parent"] = null;
  57 |         token["children"] = null;
  58 |         count(lexeme);
  59 |         return token;
  60 |     });
  61 | 
  62 |     lexer.addRule(tokenRules["while"], function(lexeme){
  63 |         var token = {};
  64 |         token["lexeme"] = lexeme;
  65 |         token["row"] = row;
  66 |         token["col"] = col;
  67 |         token["tokenClass"] = "WHILE";
  68 |         token["keyword"] = true;
  69 |         token["parent"] = null;
  70 |         token["children"] = null;
  71 |         count(lexeme);
  72 |         return token;
  73 |     });
  74 |     lexer.addRule(tokenRules["volatile"], function(lexeme){
  75 |         var token = {};
  76 |         token["lexeme"] = lexeme;
  77 |         token["row"] = row;
  78 |         token["col"] = col;
  79 |         token["tokenClass"] = "VOLATILE";
  80 |         token["keyword"] = true;
  81 |         token["parent"] = null;
  82 |         token["children"] = null;
  83 |         count(lexeme);
  84 |         return token;
  85 |     });
  86 |     lexer.addRule(tokenRules["void"], function(lexeme){
  87 |         var token = {};
  88 |         token["lexeme"] = lexeme;
  89 |         token["row"] = row;
  90 |         token["col"] = col;
  91 |         token["tokenClass"] = "VOID";
  92 |         token["keyword"] = true;
  93 |         token["parent"] = null;
  94 |         token["children"] = null;
  95 |         count(lexeme);
  96 |         return token;
  97 |     });
  98 |     lexer.addRule(tokenRules["unsigned"], function(lexeme){
  99 |         var token = {};
 100 |         token["lexeme"] = lexeme;
 101 |         token["row"] = row;
 102 |         token["col"] = col;
 103 |         token["tokenClass"] = "UNSIGNED";
 104 |         token["keyword"] = true;
 105 |         token["parent"] = null;
 106 |         token["children"] = null;
 107 |         count(lexeme);
 108 |         return token;
 109 |     });
 110 |     lexer.addRule(tokenRules["union"], function(lexeme){
 111 |         var token = {};
 112 |         token["lexeme"] = lexeme;
 113 |         token["row"] = row;
 114 |         token["col"] = col;
 115 |         token["tokenClass"] = "UNION";
 116 |         token["keyword"] = true;
 117 |         token["parent"] = null;
 118 |         token["children"] = null;
 119 |         count(lexeme);
 120 |         return token;
 121 |     });
 122 |     lexer.addRule(tokenRules["typedef"], function(lexeme){
 123 |         var token = {};
 124 |         token["lexeme"] = lexeme;
 125 |         token["row"] = row;
 126 |         token["col"] = col;
 127 |         token["tokenClass"] = "TYPEDEF";
 128 |         token["keyword"] = true;
 129 |         token["parent"] = null;
 130 |         token["children"] = null;
 131 |         count(lexeme);
 132 |         return token;
 133 |     });
 134 |     lexer.addRule(tokenRules["switch"], function(lexeme){
 135 |         var token = {};
 136 |         token["lexeme"] = lexeme;
 137 |         token["row"] = row;
 138 |         token["col"] = col;
 139 |         token["tokenClass"] = "SWITCH";
 140 |         token["keyword"] = true;
 141 |         token["parent"] = null;
 142 |         token["children"] = null;
 143 |         count(lexeme);
 144 |         return token;
 145 |     });
 146 |     lexer.addRule(tokenRules["struct"], function(lexeme){
 147 |         var token = {};
 148 |         token["lexeme"] = lexeme;
 149 |         token["row"] = row;
 150 |         token["col"] = col;
 151 |         token["tokenClass"] = "STRUCT";
 152 |         token["keyword"] = true;
 153 |         token["parent"] = null;
 154 |         token["children"] = null;
 155 |         count(lexeme);
 156 |         return token;
 157 |     });
 158 |     lexer.addRule(tokenRules["static"], function(lexeme){
 159 |         var token = {};
 160 |         token["lexeme"] = lexeme;
 161 |         token["row"] = row;
 162 |         token["col"] = col;
 163 |         token["tokenClass"] = "STATIC";
 164 |         token["keyword"] = true;
 165 |         token["parent"] = null;
 166 |         token["children"] = null;
 167 |         count(lexeme);
 168 |         return token;
 169 |     });
 170 |     lexer.addRule(tokenRules["sizeof"], function(lexeme){
 171 |         var token = {};
 172 |         token["lexeme"] = lexeme;
 173 |         token["row"] = row;
 174 |         token["col"] = col;
 175 |         token["tokenClass"] = "SIZEOF";
 176 |         token["keyword"] = true;
 177 |         token["parent"] = null;
 178 |         token["children"] = null;
 179 |         count(lexeme);
 180 |         return token;
 181 |     });
 182 |     lexer.addRule(tokenRules["signed"], function(lexeme){
 183 |         var token = {};
 184 |         token["lexeme"] = lexeme;
 185 |         token["row"] = row;
 186 |         token["col"] = col;
 187 |         token["tokenClass"] = "SIGNED";
 188 |         token["parent"] = null;
 189 |         token["keyword"] = true;
 190 |         token["children"] = null;
 191 |         count(lexeme);
 192 |         return token;
 193 |     });
 194 |     lexer.addRule(tokenRules["short"], function(lexeme){
 195 |         var token = {};
 196 |         token["lexeme"] = lexeme;
 197 |         token["row"] = row;
 198 |         token["col"] = col;
 199 |         token["tokenClass"] = "SHORT";
 200 |         token["keyword"] = true;
 201 |         token["parent"] = null;
 202 |         token["children"] = null;
 203 |         count(lexeme);
 204 |         return token;
 205 |     });
 206 |     lexer.addRule(tokenRules["return"], function(lexeme){
 207 |         var token = {};
 208 |         token["lexeme"] = lexeme;
 209 |         token["row"] = row;
 210 |         token["col"] = col;
 211 |         token["tokenClass"] = "RETURN";
 212 |         token["keyword"] = true;
 213 |         token["parent"] = null;
 214 |         token["children"] = null;
 215 |         count(lexeme);
 216 |         return token;
 217 |     });
 218 |     lexer.addRule(tokenRules["register"], function(lexeme){
 219 |         var token = {};
 220 |         token["lexeme"] = lexeme;
 221 |         token["row"] = row;
 222 |         token["col"] = col;
 223 |         token["tokenClass"] = "REGISTER";
 224 |         token["keyword"] = true;
 225 |         token["parent"] = null;
 226 |         token["children"] = null;
 227 |         count(lexeme);
 228 |         return token;
 229 |     });
 230 |     lexer.addRule(tokenRules["long"], function(lexeme){
 231 |         var token = {};
 232 |         token["lexeme"] = lexeme;
 233 |         token["row"] = row;
 234 |         token["col"] = col;
 235 |         token["tokenClass"] = "LONG";
 236 |         token["keyword"] = true;
 237 |         token["parent"] = null;
 238 |         token["children"] = null;
 239 |         count(lexeme);
 240 |         return token;
 241 |     });
 242 |     lexer.addRule(tokenRules["int"], function(lexeme){
 243 |         var token = {};
 244 |         token["lexeme"] = lexeme;
 245 |         token["row"] = row;
 246 |         token["col"] = col;
 247 |         token["tokenClass"] = "INT";
 248 |         token["keyword"] = true;
 249 |         token["parent"] = null;
 250 |         token["children"] = null;
 251 |         count(lexeme);
 252 |         return token;
 253 |     });
 254 |     lexer.addRule(tokenRules["if"], function(lexeme){
 255 |         var token = {};
 256 |         token["lexeme"] = lexeme;
 257 |         token["row"] = row;
 258 |         token["col"] = col;
 259 |         token["tokenClass"] = "IF";
 260 |         token["keyword"] = true;
 261 |         token["parent"] = null;
 262 |         token["children"] = null;
 263 |         count(lexeme);
 264 |         return token;
 265 |     });
 266 |     lexer.addRule(tokenRules["goto"], function(lexeme){
 267 |         var token = {};
 268 |         token["lexeme"] = lexeme;
 269 |         token["row"] = row;
 270 |         token["col"] = col;
 271 |         token["tokenClass"] = "GOTO";
 272 |         token["keyword"] = true;
 273 |         token["parent"] = null;
 274 |         token["children"] = null;
 275 |         count(lexeme);
 276 |         return token;
 277 |     });
 278 |     lexer.addRule(tokenRules["for"], function(lexeme){
 279 |         var token = {};
 280 |         token["lexeme"] = lexeme;
 281 |         token["row"] = row;
 282 |         token["col"] = col;
 283 |         token["tokenClass"] = "FOR";
 284 |         token["keyword"] = true;
 285 |         token["parent"] = null;
 286 |         token["children"] = null;
 287 |         count(lexeme);
 288 |         return token;
 289 |     });
 290 |     lexer.addRule(tokenRules["float"], function(lexeme){
 291 |         var token = {};
 292 |         token["lexeme"] = lexeme;
 293 |         token["row"] = row;
 294 |         token["col"] = col;
 295 |         token["tokenClass"] = "FLOAT";
 296 |         token["keyword"] = true;
 297 |         token["parent"] = null;
 298 |         token["children"] = null;
 299 |         count(lexeme);
 300 |         return token;
 301 |     });
 302 |     lexer.addRule(tokenRules["extern"], function(lexeme){
 303 |         var token = {};
 304 |         token["lexeme"] = lexeme;
 305 |         token["row"] = row;
 306 |         token["col"] = col;
 307 |         token["tokenClass"] = "EXTERN";
 308 |         token["keyword"] = true;
 309 |         token["parent"] = null;
 310 |         token["children"] = null;
 311 |         count(lexeme);
 312 |         return token;
 313 |     });
 314 |     lexer.addRule(tokenRules["enum"], function(lexeme){
 315 |         var token = {};
 316 |         token["lexeme"] = lexeme;
 317 |         token["row"] = row;
 318 |         token["col"] = col;
 319 |         token["tokenClass"] = "ENUM";
 320 |         token["keyword"] = true;
 321 |         token["parent"] = null;
 322 |         token["children"] = null;
 323 |         count(lexeme);
 324 |         return token;
 325 |     });
 326 |     lexer.addRule(tokenRules["else"], function(lexeme){
 327 |         var token = {};
 328 |         token["lexeme"] = lexeme;
 329 |         token["row"] = row;
 330 |         token["col"] = col;
 331 |         token["tokenClass"] = "ELSE";
 332 |         token["keyword"] = true;
 333 |         token["parent"] = null;
 334 |         token["children"] = null;
 335 |         count(lexeme);
 336 |         return token;
 337 |     });
 338 |     lexer.addRule(tokenRules["double"], function(lexeme){
 339 |         var token = {};
 340 |         token["lexeme"] = lexeme;
 341 |         token["row"] = row;
 342 |         token["col"] = col;
 343 |         token["tokenClass"] = "DOUBLE";
 344 |         token["keyword"] = true;
 345 |         token["parent"] = null;
 346 |         token["children"] = null;
 347 |         count(lexeme);
 348 |         return token;
 349 |     });
 350 |     lexer.addRule(tokenRules["do"], function(lexeme){
 351 |         var token = {};
 352 |         token["lexeme"] = lexeme;
 353 |         token["row"] = row;
 354 |         token["col"] = col;
 355 |         token["tokenClass"] = "DO";
 356 |         token["keyword"] = true;
 357 |         token["parent"] = null;
 358 |         token["children"] = null;
 359 |         count(lexeme);
 360 |         return token;
 361 |     });
 362 |     lexer.addRule(tokenRules["default"], function(lexeme){
 363 |         var token = {};
 364 |         token["lexeme"] = lexeme;
 365 |         token["row"] = row;
 366 |         token["col"] = col;
 367 |         token["tokenClass"] = "DEFAULT";
 368 |         token["keyword"] = true;
 369 |         token["parent"] = null;
 370 |         token["children"] = null;
 371 |         count(lexeme);
 372 |         return token;
 373 |     });
 374 |     lexer.addRule(tokenRules["continue"], function(lexeme){
 375 |         var token = {};
 376 |         token["lexeme"] = lexeme;
 377 |         token["row"] = row;
 378 |         token["col"] = col;
 379 |         token["tokenClass"] = "CONTINUE";
 380 |         token["keyword"] = true;
 381 |         token["parent"] = null;
 382 |         token["children"] = null;
 383 |         count(lexeme);
 384 |         return token;
 385 |     });
 386 |     lexer.addRule(tokenRules["const"], function(lexeme){
 387 |         var token = {};
 388 |         token["lexeme"] = lexeme;
 389 |         token["row"] = row;
 390 |         token["col"] = col;
 391 |         token["tokenClass"] = "CONST";
 392 |         token["keyword"] = true;
 393 |         token["parent"] = null;
 394 |         token["children"] = null;
 395 |         count(lexeme);
 396 |         return token;
 397 |     });
 398 |     lexer.addRule(tokenRules["char"], function(lexeme){
 399 |         var token = {};
 400 |         token["lexeme"] = lexeme;
 401 |         token["row"] = row;
 402 |         token["col"] = col;
 403 |         token["tokenClass"] = "CHAR";
 404 |         token["keyword"] = true;
 405 |         token["parent"] = null;
 406 |         token["children"] = null;
 407 |         count(lexeme);
 408 |         return token;
 409 |     });
 410 |     lexer.addRule(tokenRules["case"], function(lexeme){
 411 |         var token = {};
 412 |         token["lexeme"] = lexeme;
 413 |         token["row"] = row;
 414 |         token["col"] = col;
 415 |         token["tokenClass"] = "CASE";
 416 |         token["keyword"] = true;
 417 |         token["parent"] = null;
 418 |         token["children"] = null;
 419 |         count(lexeme);
 420 |         return token;
 421 |     });
 422 |     lexer.addRule(tokenRules["break"], function(lexeme){
 423 |         var token = {};
 424 |         token["lexeme"] = lexeme;
 425 |         token["row"] = row;
 426 |         token["col"] = col;
 427 |         token["tokenClass"] = "BREAK";
 428 |         token["keyword"] = true;
 429 |         token["parent"] = null;
 430 |         token["children"] = null;
 431 |         count(lexeme);
 432 |         return token;
 433 |     });
 434 |     lexer.addRule(tokenRules["auto"], function(lexeme){
 435 |         var token = {};
 436 |         token["lexeme"] = lexeme;
 437 |         token["row"] = row;
 438 |         token["col"] = col;
 439 |         token["tokenClass"] = "AUTO";
 440 |         token["keyword"] = true;
 441 |         token["parent"] = null;
 442 |         token["children"] = null;
 443 |         count(lexeme);
 444 |         return token;
 445 |     });
 446 |     lexer.addRule(tokenRules["bool"], function(lexeme){
 447 |         var token = {};
 448 |         token["lexeme"] = lexeme;
 449 |         token["row"] = row;
 450 |         token["col"] = col;
 451 |         token["tokenClass"] = "BOOL";
 452 |         token["keyword"] = true;
 453 |         token["parent"] = null;
 454 |         token["children"] = null;
 455 |         count(lexeme);
 456 |         return token;
 457 |     });
 458 |     lexer.addRule(tokenRules["complex"], function(lexeme){
 459 |         var token = {};
 460 |         token["lexeme"] = lexeme;
 461 |         token["row"] = row;
 462 |         token["col"] = col;
 463 |         token["tokenClass"] = "COMPLEX";
 464 |         token["keyword"] = true;
 465 |         token["parent"] = null;
 466 |         token["children"] = null;
 467 |         count(lexeme);
 468 |         return token;
 469 |     });
 470 |     lexer.addRule(tokenRules["imaginary"], function(lexeme){
 471 |         var token = {};
 472 |         token["lexeme"] = lexeme;
 473 |         token["row"] = row;
 474 |         token["col"] = col;
 475 |         token["tokenClass"] = "IMAGINARY";
 476 |         token["keyword"] = true;
 477 |         token["parent"] = null;
 478 |         token["children"] = null;
 479 |         count(lexeme);
 480 |         return token;
 481 |     });
 482 |     lexer.addRule(tokenRules["inline"], function(lexeme){
 483 |         var token = {};
 484 |         token["lexeme"] = lexeme;
 485 |         token["row"] = row;
 486 |         token["col"] = col;
 487 |         token["tokenClass"] = "INLINE";
 488 |         token["keyword"] = true;
 489 |         token["parent"] = null;
 490 |         token["children"] = null;
 491 |         count(lexeme);
 492 |         return token;
 493 |     });
 494 |     lexer.addRule(tokenRules["restrict"], function(lexeme){
 495 |         var token = {};
 496 |         token["lexeme"] = lexeme;
 497 |         token["row"] = row;
 498 |         token["col"] = col;
 499 |         token["tokenClass"] = "RESTRICT";
 500 |         token["keyword"] = true;
 501 |         token["parent"] = null;
 502 |         token["children"] = null;
 503 |         count(lexeme);
 504 |         return token;
 505 |     });
 506 |     lexer.addRule(tokenRules["identifier"], function(lexeme){
 507 |         var token = {};
 508 |         token["lexeme"] = lexeme;
 509 |         token["row"] = row;
 510 |         token["col"] = col;
 511 |         token["tokenClass"] = "IDENTIFIER";
 512 |         token["parent"] = null;
 513 |         token["children"] = null;
 514 |         count(lexeme);
 515 |         return token;
 516 |     });
 517 |     lexer.addRule(tokenRules["hexadecimal"], function(lexeme){
 518 |         var token = {};
 519 |         token["lexeme"] = lexeme;
 520 |         token["row"] = row;
 521 |         token["col"] = col;
 522 |         token["tokenClass"] = "CONSTANT";
 523 |         token["parent"] = null;
 524 |         token["children"] = null;
 525 |         count(lexeme);
 526 |         return token;
 527 |     });
 528 |     lexer.addRule(tokenRules["octal"], function(lexeme){
 529 |         var token = {};
 530 |         token["lexeme"] = lexeme;
 531 |         token["row"] = row;
 532 |         token["col"] = col;
 533 |         token["tokenClass"] = "CONSTANT";
 534 |         token["parent"] = null;
 535 |         token["children"] = null;
 536 |         count(lexeme);
 537 |         return token;
 538 |     });
 539 |     lexer.addRule(tokenRules["decimal"], function(lexeme){
 540 |         var token = {};
 541 |         token["lexeme"] = lexeme;
 542 |         token["row"] = row;
 543 |         token["col"] = col;
 544 |         token["tokenClass"] = "CONSTANT";
 545 |         token["parent"] = null;
 546 |         token["children"] = null;
 547 |         count(lexeme);
 548 |         return token;
 549 |     });
 550 |     lexer.addRule(tokenRules["char_literal"], function(lexeme){
 551 |         var token = {};
 552 |         token["lexeme"] = lexeme;
 553 |         token["row"] = row;
 554 |         token["col"] = col;
 555 |         token["tokenClass"] = "CONSTANT";
 556 |         token["parent"] = null;
 557 |         token["children"] = null;
 558 |         count(lexeme);
 559 |         return token;
 560 |     });
 561 |     lexer.addRule(tokenRules["floatWithoutPoint"], function(lexeme){
 562 |         var token = {};
 563 |         token["lexeme"] = lexeme;
 564 |         token["row"] = row;
 565 |         token["col"] = col;
 566 |         token["tokenClass"] = "CONSTANT";
 567 |         token["parent"] = null;
 568 |         token["children"] = null;
 569 |         count(lexeme);
 570 |         return token;
 571 |     });
 572 |     lexer.addRule(tokenRules["floatWithNothingBeforePoint"], function(lexeme){
 573 |         var token = {};
 574 |         token["lexeme"] = lexeme;
 575 |         token["row"] = row;
 576 |         token["col"] = col;
 577 |         token["tokenClass"] = "CONSTANT";
 578 |         token["parent"] = null;
 579 |         token["children"] = null;
 580 |         count(lexeme);
 581 |         return token;
 582 |     });
 583 |     lexer.addRule(tokenRules["floatWithNothingAfterPoint"], function(lexeme){
 584 |         var token = {};
 585 |         token["lexeme"] = lexeme;
 586 |         token["row"] = row;
 587 |         token["col"] = col;
 588 |         token["tokenClass"] = "CONSTANT";
 589 |         token["parent"] = null;
 590 |         token["children"] = null;
 591 |         count(lexeme);
 592 |         return token;
 593 |     });
 594 |     lexer.addRule(tokenRules["string_literal"], function(lexeme){
 595 |         var token = {};
 596 |         token["lexeme"] = lexeme;
 597 |         token["row"] = row;
 598 |         token["col"] = col;
 599 |         token["tokenClass"] = "STRING_LITERAL";
 600 |         token["parent"] = null;
 601 |         token["children"] = null;
 602 |         count(lexeme);
 603 |         return token;
 604 |     });
 605 |     lexer.addRule(tokenRules["ellipsis"], function(lexeme){
 606 |         var token = {};
 607 |         token["lexeme"] = lexeme;
 608 |         token["row"] = row;
 609 |         token["col"] = col;
 610 |         token["tokenClass"] = "ELLIPSIS";
 611 |         token["parent"] = null;
 612 |         token["children"] = null;
 613 |         count(lexeme);
 614 |         return token;
 615 |     });
 616 |     lexer.addRule(tokenRules["right_assign"], function(lexeme){
 617 |         var token = {};
 618 |         token["lexeme"] = lexeme;
 619 |         token["row"] = row;
 620 |         token["col"] = col;
 621 |         token["tokenClass"] = "RIGHT_ASSIGN";
 622 |         token["parent"] = null;
 623 |         token["children"] = null;
 624 |         count(lexeme);
 625 |         return token;
 626 |     });
 627 |     lexer.addRule(tokenRules["left_assign"], function(lexeme){
 628 |         var token = {};
 629 |         token["lexeme"] = lexeme;
 630 |         token["row"] = row;
 631 |         token["col"] = col;
 632 |         token["tokenClass"] = "LEFT_ASSIGN";
 633 |         token["parent"] = null;
 634 |         token["children"] = null;
 635 |         count(lexeme);
 636 |         return token;
 637 |     });
 638 |     lexer.addRule(tokenRules["add_assign"], function(lexeme){
 639 |         var token = {};
 640 |         token["lexeme"] = lexeme;
 641 |         token["row"] = row;
 642 |         token["col"] = col;
 643 |         token["tokenClass"] = "ADD_ASSIGN";
 644 |         token["parent"] = null;
 645 |         token["children"] = null;
 646 |         count(lexeme);
 647 |         return token;
 648 |     });
 649 |     lexer.addRule(tokenRules["sub_assign"], function(lexeme){
 650 |         var token = {};
 651 |         token["lexeme"] = lexeme;
 652 |         token["row"] = row;
 653 |         token["col"] = col;
 654 |         token["tokenClass"] = "SUB_ASSIGN";
 655 |         token["parent"] = null;
 656 |         token["children"] = null;
 657 |         count(lexeme);
 658 |         return token;
 659 |     });
 660 |     lexer.addRule(tokenRules["mul_assign"], function(lexeme){
 661 |         var token = {};
 662 |         token["lexeme"] = lexeme;
 663 |         token["row"] = row;
 664 |         token["col"] = col;
 665 |         token["tokenClass"] = "MUL_ASSIGN";
 666 |         token["parent"] = null;
 667 |         token["children"] = null;
 668 |         count(lexeme);
 669 |         return token;
 670 |     });
 671 |     lexer.addRule(tokenRules["div_assign"], function(lexeme){
 672 |         var token = {};
 673 |         token["lexeme"] = lexeme;
 674 |         token["row"] = row;
 675 |         token["col"] = col;
 676 |         token["tokenClass"] = "DIV_ASSIGN";
 677 |         token["parent"] = null;
 678 |         token["children"] = null;
 679 |         count(lexeme);
 680 |         return token;
 681 |     });
 682 |     lexer.addRule(tokenRules["mod_assign"], function(lexeme){
 683 |         var token = {};
 684 |         token["lexeme"] = lexeme;
 685 |         token["row"] = row;
 686 |         token["col"] = col;
 687 |         token["tokenClass"] = "MOD_ASSIGN";
 688 |         token["parent"] = null;
 689 |         token["children"] = null;
 690 |         count(lexeme);
 691 |         return token;
 692 |     });
 693 |     lexer.addRule(tokenRules["and_assign"], function(lexeme){
 694 |         var token = {};
 695 |         token["lexeme"] = lexeme;
 696 |         token["row"] = row;
 697 |         token["col"] = col;
 698 |         token["tokenClass"] = "AND_ASSIGN";
 699 |         token["parent"] = null;
 700 |         token["children"] = null;
 701 |         count(lexeme);
 702 |         return token;
 703 |     });
 704 |     lexer.addRule(tokenRules["xor_assign"], function(lexeme){
 705 |         var token = {};
 706 |         token["lexeme"] = lexeme;
 707 |         token["row"] = row;
 708 |         token["col"] = col;
 709 |         token["tokenClass"] = "XOR_ASSIGN";
 710 |         token["parent"] = null;
 711 |         token["children"] = null;
 712 |         count(lexeme);
 713 |         return token;
 714 |     });
 715 |     lexer.addRule(tokenRules["or_assign"], function(lexeme){
 716 |         var token = {};
 717 |         token["lexeme"] = lexeme;
 718 |         token["row"] = row;
 719 |         token["col"] = col;
 720 |         token["tokenClass"] = "OR_ASSIGN";
 721 |         token["parent"] = null;
 722 |         token["children"] = null;
 723 |         count(lexeme);
 724 |         return token;
 725 |     });
 726 |     lexer.addRule(tokenRules["right_op"], function(lexeme){
 727 |         var token = {};
 728 |         token["lexeme"] = lexeme;
 729 |         token["row"] = row;
 730 |         token["col"] = col;
 731 |         token["tokenClass"] = "RIGHT_OP";
 732 |         token["parent"] = null;
 733 |         token["children"] = null;
 734 |         count(lexeme);
 735 |         return token;
 736 |     });
 737 |     lexer.addRule(tokenRules["left_op"], function(lexeme){
 738 |         var token = {};
 739 |         token["lexeme"] = lexeme;
 740 |         token["row"] = row;
 741 |         token["col"] = col;
 742 |         token["tokenClass"] = "LEFT_OP";
 743 |         token["parent"] = null;
 744 |         token["children"] = null;
 745 |         count(lexeme);
 746 |         return token;
 747 |     });
 748 |     lexer.addRule(tokenRules["inc_op"], function(lexeme){
 749 |         var token = {};
 750 |         token["lexeme"] = lexeme;
 751 |         token["row"] = row;
 752 |         token["col"] = col;
 753 |         token["tokenClass"] = "INC_OP";
 754 |         token["parent"] = null;
 755 |         token["children"] = null;
 756 |         count(lexeme);
 757 |         return token;
 758 |     });
 759 |     lexer.addRule(tokenRules["dec_op"], function(lexeme){
 760 |         var token = {};
 761 |         token["lexeme"] = lexeme;
 762 |         token["row"] = row;
 763 |         token["col"] = col;
 764 |         token["tokenClass"] = "DEC_OP";
 765 |         token["parent"] = null;
 766 |         token["children"] = null;
 767 |         count(lexeme);
 768 |         return token;
 769 |     });
 770 |     lexer.addRule(tokenRules["ptr_op"], function(lexeme){
 771 |         var token = {};
 772 |         token["lexeme"] = lexeme;
 773 |         token["row"] = row;
 774 |         token["col"] = col;
 775 |         token["tokenClass"] = "PTR_OP";
 776 |         token["parent"] = null;
 777 |         token["children"] = null;
 778 |         count(lexeme);
 779 |         return token;
 780 |     });
 781 |     lexer.addRule(tokenRules["and_op"], function(lexeme){
 782 |         var token = {};
 783 |         token["lexeme"] = lexeme;
 784 |         token["row"] = row;
 785 |         token["col"] = col;
 786 |         token["tokenClass"] = "AND_OP";
 787 |         token["parent"] = null;
 788 |         token["children"] = null;
 789 |         count(lexeme);
 790 |         return token;
 791 |     });
 792 |     lexer.addRule(tokenRules["or_op"], function(lexeme){
 793 |         var token = {};
 794 |         token["lexeme"] = lexeme;
 795 |         token["row"] = row;
 796 |         token["col"] = col;
 797 |         token["tokenClass"] = "OR_OP";
 798 |         token["parent"] = null;
 799 |         token["children"] = null;
 800 |         count(lexeme);
 801 |         return token;
 802 |     });
 803 |     lexer.addRule(tokenRules["le_op"], function(lexeme){
 804 |         var token = {};
 805 |         token["lexeme"] = lexeme;
 806 |         token["row"] = row;
 807 |         token["col"] = col;
 808 |         token["tokenClass"] = "LE_OP";
 809 |         token["parent"] = null;
 810 |         token["children"] = null;
 811 |         count(lexeme);
 812 |         return token;
 813 |     });
 814 |     lexer.addRule(tokenRules["ge_op"], function(lexeme){
 815 |         var token = {};
 816 |         token["lexeme"] = lexeme;
 817 |         token["row"] = row;
 818 |         token["col"] = col;
 819 |         token["tokenClass"] = "GE_OP";
 820 |         token["parent"] = null;
 821 |         token["children"] = null;
 822 |         count(lexeme);
 823 |         return token;
 824 |     });
 825 |     lexer.addRule(tokenRules["eq_op"], function(lexeme){
 826 |         var token = {};
 827 |         token["lexeme"] = lexeme;
 828 |         token["row"] = row;
 829 |         token["col"] = col;
 830 |         token["tokenClass"] = "EQ_OP";
 831 |         token["parent"] = null;
 832 |         token["children"] = null;
 833 |         count(lexeme);
 834 |         return token;
 835 |     });
 836 |     lexer.addRule(tokenRules["ne_op"], function(lexeme){
 837 |         var token = {};
 838 |         token["lexeme"] = lexeme;
 839 |         token["row"] = row;
 840 |         token["col"] = col;
 841 |         token["tokenClass"] = "NE_OP";
 842 |         token["parent"] = null;
 843 |         token["children"] = null;
 844 |         count(lexeme);
 845 |         return token;
 846 |     });
 847 |     lexer.addRule(tokenRules[";"], function(lexeme){
 848 |         var token = {};
 849 |         token["lexeme"] = lexeme;
 850 |         token["row"] = row;
 851 |         token["col"] = col;
 852 |         token["tokenClass"] = ";";
 853 |         token["parent"] = null;
 854 |         token["children"] = null;
 855 |         count(lexeme);
 856 |         return token;
 857 |     });
 858 |     lexer.addRule(tokenRules["{"], function(lexeme){
 859 |         var token = {};
 860 |         token["lexeme"] = lexeme;
 861 |         token["row"] = row;
 862 |         token["col"] = col;
 863 |         token["tokenClass"] = "{";
 864 |         token["parent"] = null;
 865 |         token["children"] = null;
 866 |         count(lexeme);
 867 |         return token;
 868 |     });
 869 |     lexer.addRule(tokenRules["}"], function(lexeme){
 870 |         var token = {};
 871 |         token["lexeme"] = lexeme;
 872 |         token["row"] = row;
 873 |         token["col"] = col;
 874 |         token["tokenClass"] = "}";
 875 |         token["parent"] = null;
 876 |         token["children"] = null;
 877 |         count(lexeme);
 878 |         return token;
 879 |     });
 880 |     lexer.addRule(tokenRules[","], function(lexeme){
 881 |         var token = {};
 882 |         token["lexeme"] = lexeme;
 883 |         token["row"] = row;
 884 |         token["col"] = col;
 885 |         token["tokenClass"] = ",";
 886 |         token["parent"] = null;
 887 |         token["children"] = null;
 888 |         count(lexeme);
 889 |         return token;
 890 |     });
 891 |     lexer.addRule(tokenRules[":"], function(lexeme){
 892 |         var token = {};
 893 |         token["lexeme"] = lexeme;
 894 |         token["row"] = row;
 895 |         token["col"] = col;
 896 |         token["tokenClass"] = ":";
 897 |         token["parent"] = null;
 898 |         token["children"] = null;
 899 |         count(lexeme);
 900 |         return token;
 901 |     });
 902 |     lexer.addRule(tokenRules["="], function(lexeme){
 903 |         var token = {};
 904 |         token["lexeme"] = lexeme;
 905 |         token["row"] = row;
 906 |         token["col"] = col;
 907 |         token["tokenClass"] = "=";
 908 |         token["parent"] = null;
 909 |         token["children"] = null;
 910 |         count(lexeme);
 911 |         return token;
 912 |     });
 913 |     lexer.addRule(tokenRules["("], function(lexeme){
 914 |         var token = {};
 915 |         token["lexeme"] = lexeme;
 916 |         token["row"] = row;
 917 |         token["col"] = col;
 918 |         token["tokenClass"] = "(";
 919 |         token["parent"] = null;
 920 |         token["children"] = null;
 921 |         count(lexeme);
 922 |         return token;
 923 |     });
 924 |     lexer.addRule(tokenRules[")"], function(lexeme){
 925 |         var token = {};
 926 |         token["lexeme"] = lexeme;
 927 |         token["row"] = row;
 928 |         token["col"] = col;
 929 |         token["tokenClass"] = ")";
 930 |         token["parent"] = null;
 931 |         token["children"] = null;
 932 |         count(lexeme);
 933 |         return token;
 934 |     });
 935 |     lexer.addRule(tokenRules["["], function(lexeme){
 936 |         var token = {};
 937 |         token["lexeme"] = lexeme;
 938 |         token["row"] = row;
 939 |         token["col"] = col;
 940 |         token["tokenClass"] = "[";
 941 |         token["parent"] = null;
 942 |         token["children"] = null;
 943 |         count(lexeme);
 944 |         return token;
 945 |     });
 946 |     lexer.addRule(tokenRules["]"], function(lexeme){
 947 |         var token = {};
 948 |         token["lexeme"] = lexeme;
 949 |         token["row"] = row;
 950 |         token["col"] = col;
 951 |         token["tokenClass"] = "]";
 952 |         token["parent"] = null;
 953 |         token["children"] = null;
 954 |         count(lexeme);
 955 |         return token;
 956 |     });
 957 |     lexer.addRule(tokenRules["."], function(lexeme){
 958 |         var token = {};
 959 |         token["lexeme"] = lexeme;
 960 |         token["row"] = row;
 961 |         token["col"] = col;
 962 |         token["tokenClass"] = ".";
 963 |         token["parent"] = null;
 964 |         token["children"] = null;
 965 |         count(lexeme);
 966 |         return token;
 967 |     });
 968 |     lexer.addRule(tokenRules["&"], function(lexeme){
 969 |         var token = {};
 970 |         token["lexeme"] = lexeme;
 971 |         token["row"] = row;
 972 |         token["col"] = col;
 973 |         token["tokenClass"] = "&";
 974 |         token["parent"] = null;
 975 |         token["children"] = null;
 976 |         count(lexeme);
 977 |         return token;
 978 |     });
 979 |     lexer.addRule(tokenRules["!"], function(lexeme){
 980 |         var token = {};
 981 |         token["lexeme"] = lexeme;
 982 |         token["row"] = row;
 983 |         token["col"] = col;
 984 |         token["tokenClass"] = "!";
 985 |         token["parent"] = null;
 986 |         token["children"] = null;
 987 |         count(lexeme);
 988 |         return token;
 989 |     });
 990 |     lexer.addRule(tokenRules["~"], function(lexeme){
 991 |         var token = {};
 992 |         token["lexeme"] = lexeme;
 993 |         token["row"] = row;
 994 |         token["col"] = col;
 995 |         token["tokenClass"] = "~";
 996 |         token["parent"] = null;
 997 |         token["children"] = null;
 998 |         count(lexeme);
 999 |         return token;
1000 |     });
1001 |     lexer.addRule(tokenRules["-"], function(lexeme){
1002 |         var token = {};
1003 |         token["lexeme"] = lexeme;
1004 |         token["row"] = row;
1005 |         token["col"] = col;
1006 |         token["tokenClass"] = "-";
1007 |         token["parent"] = null;
1008 |         token["children"] = null;
1009 |         count(lexeme);
1010 |         return token;
1011 |     });
1012 |     lexer.addRule(tokenRules["+"], function(lexeme){
1013 |         var token = {};
1014 |         token["lexeme"] = lexeme;
1015 |         token["row"] = row;
1016 |         token["col"] = col;
1017 |         token["tokenClass"] = "+";
1018 |         token["parent"] = null;
1019 |         token["children"] = null;
1020 |         count(lexeme);
1021 |         return token;
1022 |     });
1023 |     lexer.addRule(tokenRules["*"], function(lexeme){
1024 |         var token = {};
1025 |         token["lexeme"] = lexeme;
1026 |         token["row"] = row;
1027 |         token["col"] = col;
1028 |         token["tokenClass"] = "*";
1029 |         token["parent"] = null;
1030 |         token["children"] = null;
1031 |         count(lexeme);
1032 |         return token;
1033 |     });
1034 |     lexer.addRule(tokenRules["/"], function(lexeme){
1035 |         var token = {};
1036 |         token["lexeme"] = lexeme;
1037 |         token["row"] = row;
1038 |         token["col"] = col;
1039 |         token["tokenClass"] = "/";
1040 |         token["parent"] = null;
1041 |         token["children"] = null;
1042 |         count(lexeme);
1043 |         return token;
1044 |     });
1045 |     lexer.addRule(tokenRules["%"], function(lexeme){
1046 |         var token = {};
1047 |         token["lexeme"] = lexeme;
1048 |         token["row"] = row;
1049 |         token["col"] = col;
1050 |         token["tokenClass"] = "%";
1051 |         token["parent"] = null;
1052 |         token["children"] = null;
1053 |         count(lexeme);
1054 |         return token;
1055 |     });
1056 |     lexer.addRule(tokenRules["<"], function(lexeme){
1057 |         var token = {};
1058 |         token["lexeme"] = lexeme;
1059 |         token["row"] = row;
1060 |         token["col"] = col;
1061 |         token["tokenClass"] = "<";
1062 |         token["parent"] = null;
1063 |         token["children"] = null;
1064 |         count(lexeme);
1065 |         return token;
1066 |     });
1067 |     lexer.addRule(tokenRules[">"], function(lexeme){
1068 |         var token = {};
1069 |         token["lexeme"] = lexeme;
1070 |         token["row"] = row;
1071 |         token["col"] = col;
1072 |         token["tokenClass"] = ">";
1073 |         token["parent"] = null;
1074 |         token["children"] = null;
1075 |         count(lexeme);
1076 |         return token;
1077 |     });
1078 |     lexer.addRule(tokenRules["^"], function(lexeme){
1079 |         var token = {};
1080 |         token["lexeme"] = lexeme;
1081 |         token["row"] = row;
1082 |         token["col"] = col;
1083 |         token["tokenClass"] = "^";
1084 |         token["parent"] = null;
1085 |         token["children"] = null;
1086 |         count(lexeme);
1087 |         return token;
1088 |     });
1089 |     lexer.addRule(tokenRules["|"], function(lexeme){
1090 |         var token = {};
1091 |         token["lexeme"] = lexeme;
1092 |         token["row"] = row;
1093 |         token["col"] = col;
1094 |         token["tokenClass"] = "|";
1095 |         token["parent"] = null;
1096 |         token["children"] = null;
1097 |         count(lexeme);
1098 |         return token;
1099 |     });
1100 |     lexer.addRule(tokenRules["?"], function(lexeme){
1101 |         var token = {};
1102 |         token["lexeme"] = lexeme;
1103 |         token["row"] = row;
1104 |         token["col"] = col;
1105 |         token["tokenClass"] = "?";
1106 |         token["parent"] = null;
1107 |         token["children"] = null;
1108 |         count(lexeme);
1109 |         return token;
1110 |     });
1111 |     lexer.addRule(tokenRules["whitespace"], function(lexeme){
1112 |         var token = {};
1113 |         token["lexeme"] = lexeme;
1114 |         token["row"] = row;
1115 |         token["col"] = col;
1116 |         token["tokenClass"] = "WHITESPACE";
1117 |         token["parent"] = null;
1118 |         token["children"] = null;
1119 |         count(lexeme);
1120 |         return token;
1121 |     });
1122 |     lexer.addRule(tokenRules["unmatched"], function(lexeme){
1123 |         var token = {};
1124 |         token["lexeme"] = lexeme;
1125 |         token["row"] = row;
1126 |         token["col"] = col;
1127 |         token["tokenClass"] = "UNMATCHED";
1128 |         token["parent"] = null;
1129 |         token["children"] = null;
1130 |         count(lexeme);
1131 |         return token;
1132 |     });
1133 | 
1134 |     lexer.setInput(streamOfText);
1135 |     var x = lexer.lex();
1136 |     while(x != undefined){
1137 |         if((x.tokenClass != "UNMATCHED") && (x.tokenClass != "WHITESPACE") && (x.tokenClass != "COMMENT")){
1138 |             streamOfTokens.push(x);
1139 |         }
1140 |         x = lexer.lex();
1141 |     };
1142 |     return streamOfTokens;
1143 | }
1144 | module.exports.tokenize = tokenize;
1145 | 


--------------------------------------------------------------------------------