├── requirements.txt ├── tests ├── fixtures │ ├── empty_file.hcl │ ├── float.hcl │ ├── empty.hcl │ ├── escape.hcl │ ├── flat.hcl │ ├── float.json │ ├── multi_line_comment.json │ ├── multiline.json │ ├── single_line_comment.json │ ├── multiline_bad.hcl │ ├── tab_heredoc.json │ ├── tab_heredoc.hcl │ ├── basic.hcl │ ├── array_comment.hcl │ ├── basic_squish.hcl │ ├── multi_line_comment.hcl │ ├── structure_list.hcl │ ├── array_comment.json │ ├── basic.json │ ├── only_comments.hcl │ ├── structure_flatmap.hcl │ ├── structure_multi.hcl │ ├── heredoc_terminator_same_line.json │ ├── scientific.hcl │ ├── terraform_heroku.hcl │ ├── structure_flatmap.json │ ├── heredoc_terminator_same_line.hcl │ ├── structure.hcl │ ├── structure_list.json │ ├── multi_line_comment_M.json │ ├── structure.json │ ├── structure_flat.json │ ├── single_line_comment.hcl │ ├── terraform_heroku.json │ ├── structure_comment.hcl │ ├── structure_comment_L.json │ ├── scientific.json │ ├── structure_comment_M.json │ ├── structure_multi.json │ ├── structure2.json │ ├── structure2.hcl │ ├── nested_lists.hcl │ ├── single_line_comment_L.json │ ├── decode_tf_variable.hcl │ ├── structure_comment_A.json │ ├── decode_policy.hcl │ ├── structure_list_deep.hcl │ ├── function.hcl │ ├── issue12.hcl │ ├── decode_tf_variable.json │ ├── nested_lists.json │ ├── structure_three_tiers.hcl │ ├── decode_policy.json │ ├── function.json │ ├── issue12.json │ ├── structure_list_deep.json │ └── structure_three_tiers.json ├── lex-fixtures │ ├── list.hcl │ ├── list_comma.hcl │ ├── empty_heredoc.hcl │ ├── multiple.hcl │ ├── structure_empty.hcl │ ├── unterminated_block_comment.hcl │ ├── nested_comment.hcl │ ├── old.hcl │ ├── array_comment.hcl │ ├── assign_deep.hcl │ ├── heredoc_terminator_same_line.hcl │ ├── structure_basic.hcl │ ├── assign_colon.hcl │ ├── structure_comma.hcl │ ├── structure.hcl │ ├── list_of_maps.hcl │ ├── types.hcl │ ├── comment.hcl │ ├── windows_heredoc.hcl │ ├── complex.hcl │ ├── terraform0.12syntax.hcl │ └── conditional_operator.hcl ├── run_tests.sh ├── test_load_dump.py ├── test_parser.py ├── test_decoder.py └── test_lexer.py ├── testing-requirements.txt ├── setup.cfg ├── src └── hcl │ ├── ply │ ├── __init__.py │ └── lex.py │ ├── __init__.py │ ├── api.py │ ├── lexer.py │ └── parser.py ├── .gitignore ├── MANIFEST.in ├── pyproject.toml ├── scripts └── hcltool ├── CHANGELOG.md ├── .github └── workflows │ └── dist.yml ├── README.rst ├── setup.py └── LICENSE /requirements.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/fixtures/empty_file.hcl: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/fixtures/float.hcl: -------------------------------------------------------------------------------- 1 | a = 1.02 2 | -------------------------------------------------------------------------------- /testing-requirements.txt: -------------------------------------------------------------------------------- 1 | pytest 2 | coverage 3 | -------------------------------------------------------------------------------- /tests/fixtures/empty.hcl: -------------------------------------------------------------------------------- 1 | resource "foo" {} 2 | -------------------------------------------------------------------------------- /tests/fixtures/escape.hcl: 
-------------------------------------------------------------------------------- 1 | foo = "bar\"baz\\n" 2 | -------------------------------------------------------------------------------- /tests/fixtures/flat.hcl: -------------------------------------------------------------------------------- 1 | foo = "bar" 2 | Key = 7 3 | -------------------------------------------------------------------------------- /tests/fixtures/float.json: -------------------------------------------------------------------------------- 1 | { 2 | "a": 1.02 3 | } 4 | -------------------------------------------------------------------------------- /tests/lex-fixtures/list.hcl: -------------------------------------------------------------------------------- 1 | foo = [1, 2, "foo"] 2 | -------------------------------------------------------------------------------- /tests/lex-fixtures/list_comma.hcl: -------------------------------------------------------------------------------- 1 | foo = [1, 2, "foo",] 2 | -------------------------------------------------------------------------------- /tests/lex-fixtures/empty_heredoc.hcl: -------------------------------------------------------------------------------- 1 | empty = <`__ in Python. This 6 | implementation aims to be compatible with the original golang version of 7 | the parser. 8 | 9 | pyhcl does not support HCL2 (which is what modern terraform uses). You might try 10 | https://pypi.org/project/python-hcl2/ instead (though I've never personally tried it). 11 | 12 | The grammar and many of the tests/fixtures were copied/ported from the 13 | golang parser into pyhcl. All releases are tested with a variety of 14 | python versions from Python 2.7 onward. 15 | 16 | This version has been modified to work with terraform 0.12 syntax. 17 | It should be backward compatible with earlier versions. 18 | It doesn't cover every situation. See discussion in pull request: 19 | https://github.com/virtuald/pyhcl/pull/57 20 | 21 | Installation 22 | ============ 23 | 24 | :: 25 | 26 | pip install pyhcl 27 | 28 | Usage 29 | ===== 30 | 31 | This module is intended to be used in mostly the same way that one would 32 | use the json module in python, and load/loads/dumps are implemented. 33 | 34 | :: 35 | 36 | import hcl 37 | 38 | with open('file.hcl', 'r') as fp: 39 | obj = hcl.load(fp) 40 | 41 | Currently the dumps function outputs JSON, and not HCL. 42 | 43 | Convert HCL to JSON 44 | ------------------- 45 | 46 | pyhcl comes with a script that you can use to easily convert HCL to JSON, 47 | similar to the json.tool that comes with python:: 48 | 49 | hcltool INFILE [OUTFILE] 50 | 51 | Structure Validation 52 | -------------------- 53 | 54 | Similar to JSON, the output of parsing HCL is a python dictionary with 55 | no defined structure. The golang library for HCL implements support for 56 | parsing HCL according to defined objects, but this implementation does 57 | not currently support such constructs. 58 | 59 | Instead, I recommend that you use tools designed to validate JSON, such 60 | as the `schematics `_ library. 61 | 62 | Syntax 63 | ====== 64 | 65 | - Single line comments start with ``#`` or ``//`` 66 | 67 | - Multi-line comments are wrapped in ``/*`` and ``*/`` 68 | 69 | - Values are assigned with the syntax ``key = value`` (whitespace 70 | doesn't matter). The value can be any primitive: a string, number, 71 | boolean, object, or list. 72 | 73 | - Strings are double-quoted and can contain any UTF-8 characters. 
74 | Example: ``"Hello, World"`` 75 | 76 | - Numbers are assumed to be base 10. If you prefix a number with 0x, it 77 | is treated as a hexadecimal. If it is prefixed with 0, it is treated 78 | as an octal. Numbers can be in scientific notation: "1e10". 79 | 80 | - Boolean values: ``true``, ``false`` 81 | 82 | - Arrays can be made by wrapping it in ``[]``. Example: 83 | ``["foo", "bar", 42]``. Arrays can contain primitives and other 84 | arrays, but cannot contain objects. Objects must use the block syntax 85 | shown below. 86 | 87 | Objects and nested objects are created using the structure shown below:: 88 | 89 | variable "ami" { 90 | description = "the AMI to use" 91 | } 92 | 93 | Testing 94 | ======= 95 | 96 | To run the tests:: 97 | 98 | pip install -r testing-requirements.txt 99 | tests/run_tests.sh 100 | 101 | Debug Mode 102 | ---------- 103 | 104 | To enable debug mode:: 105 | 106 | import hcl 107 | hcl.parser.DEBUG = True 108 | 109 | Authors 110 | ======= 111 | 112 | Dustin Spicuzza (dustin@virtualroadside.com) 113 | 114 | Note: This project is not associated with Hashicorp 115 | -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env python 2 | 3 | from __future__ import print_function 4 | 5 | from os.path import abspath, dirname, join, exists 6 | 7 | try: 8 | from setuptools.command.build_py import build_py as _build_py 9 | except ImportError: 10 | from distutils.command.build_py import build_py as _build_py 11 | 12 | from distutils.core import setup 13 | 14 | import os 15 | import sys 16 | import subprocess 17 | 18 | setup_dir = abspath(dirname(__file__)) 19 | version_file = join(setup_dir, 'src', 'hcl', 'version.py') 20 | 21 | 22 | def _pre_install(): 23 | '''Initialize the parse table at install time''' 24 | 25 | # Generate the parsetab.dat file at setup time 26 | dat = join(setup_dir, 'src', 'hcl', 'parsetab.dat') 27 | if exists(dat): 28 | os.unlink(dat) 29 | 30 | sys.path.insert(0, join(setup_dir, 'src')) 31 | 32 | import hcl 33 | from hcl.parser import HclParser 34 | 35 | parser = HclParser() 36 | 37 | 38 | class build_py(_build_py): 39 | def run(self): 40 | self.execute(_pre_install, (), msg="generating parse table...") 41 | _build_py.run(self) 42 | 43 | 44 | # Automatically generate a version.py based on the git version 45 | if exists(join(setup_dir, '.git')): 46 | p = subprocess.Popen( 47 | ["git", "describe", "--tags", "--long", "--dirty=-dirty"], 48 | stdout=subprocess.PIPE, 49 | stderr=subprocess.PIPE, 50 | ) 51 | out, err = p.communicate() 52 | # Make sure the git version has at least one tag 53 | if err: 54 | print("Error: You need to create a tag for this repo to use the builder") 55 | sys.exit(1) 56 | 57 | # Convert git version to PEP440 compliant version 58 | # - Older versions of pip choke on local identifiers, so we can't include the git commit 59 | v, commits, local = out.decode('utf-8').rstrip().split('-', 2) 60 | if commits != '0' or '-dirty' in local: 61 | v = '%s.post0.dev%s' % (v, commits) 62 | 63 | # Create the version.py file 64 | with open(version_file, 'w') as fp: 65 | fp.write("# Autogenerated by setup.py\n__version__ = '{0}'".format(v)) 66 | 67 | with open(join(setup_dir, 'README.rst'), 'r') as readme_file: 68 | long_description = readme_file.read() 69 | 70 | with open(version_file) as fp: 71 | exec(compile(fp.read(), 'version.py', 'exec'), {}, locals()) 72 | 73 | install_requires = open(join(setup_dir, 
'requirements.txt')).readlines() 74 | 75 | setup( 76 | name='pyhcl', 77 | version=__version__, 78 | description='HCL configuration parser for python', 79 | long_description=long_description, 80 | author='Dustin Spicuzza', 81 | author_email='dustin@virtualroadside.com', 82 | url='https://github.com/virtuald/pyhcl', 83 | package_dir={'': 'src'}, 84 | package_data={'hcl': ['src/hcl/parsetab.dat']}, 85 | packages=['hcl','hcl.ply'], 86 | scripts=["scripts/hcltool"], 87 | include_package_data=True, 88 | setup_requires=install_requires, 89 | install_requires=install_requires, 90 | cmdclass={'build_py': build_py}, 91 | classifiers=[ 92 | "Development Status :: 5 - Production/Stable", 93 | "Intended Audience :: Developers", 94 | "License :: OSI Approved :: Mozilla Public License 2.0 (MPL 2.0)", 95 | "Operating System :: OS Independent", 96 | "Programming Language :: Python", 97 | "Programming Language :: Python :: 2", 98 | "Programming Language :: Python :: 2.7", 99 | "Programming Language :: Python :: 3", 100 | "Programming Language :: Python :: 3.3", 101 | "Programming Language :: Python :: 3.4", 102 | "Topic :: Text Processing", 103 | ], 104 | ) 105 | -------------------------------------------------------------------------------- /tests/test_decoder.py: -------------------------------------------------------------------------------- 1 | # 2 | # These tests are taken from decoder_test.go 3 | # 4 | 5 | from __future__ import print_function 6 | 7 | from os.path import join, dirname 8 | import hcl 9 | import json 10 | 11 | import pytest 12 | 13 | # hcl, json, dict 14 | FIXTURE_DIR = join(dirname(__file__), 'fixtures') 15 | FIXTURES = [ 16 | ('array_comment.hcl', 'array_comment.json', None), 17 | ('basic.hcl', 'basic.json', None), 18 | ('basic_squish.hcl', None, {'foo': 'bar', 'bar': '${file("bing/bong.txt")}', 'foo-bar':"baz"}), 19 | ('decode_policy.hcl', 'decode_policy.json', None), 20 | ('decode_tf_variable.hcl', 'decode_tf_variable.json', None), 21 | ('empty.hcl', None, {'resource': {'foo': {}}}), 22 | ('empty_file.hcl', None, {}), 23 | ('escape.hcl', None, {'foo': 'bar"baz\\n'}), 24 | ('flat.hcl', None, {'foo': 'bar', 'Key': 7}), 25 | ('float.hcl', None, {'a': 1.02}), 26 | ('float.hcl', 'float.json', None), 27 | ('function.hcl', 'function.json', None), 28 | ('issue12.hcl', 'issue12.json', None), 29 | ('multiline_bad.hcl', 'multiline.json', None), 30 | ('nested_lists.hcl', 'nested_lists.json', None), 31 | ('only_comments.hcl', None, {}), 32 | ('scientific.hcl', 'scientific.json', None), 33 | ('structure.hcl', 'structure_flat.json', None), 34 | #('structure2.hcl', 'structure2.json', None), # not in the golang tests 35 | ('structure_flatmap.hcl', 'structure_flatmap.json', None), 36 | ('structure_list.hcl', 'structure_list.json', None), # these don't match in golang either 37 | ('structure_list.hcl', None, {'foo': [{'key': 7}, {'key': 12}]}), # nor this 38 | ('issue12.hcl', 'issue12.json', None), 39 | #'structure_list_deep.json' 40 | ('structure_multi.hcl', 'structure_multi.json', None), 41 | ('structure_three_tiers.hcl', 'structure_three_tiers.json', None), 42 | ('tab_heredoc.hcl', 'tab_heredoc.json', None), 43 | ('terraform_heroku.hcl', 'terraform_heroku.json', None), 44 | ('structure_list_deep.hcl','structure_list_deep.json', None), 45 | ('heredoc_terminator_same_line.hcl','heredoc_terminator_same_line.json', None), 46 | ] 47 | 48 | 49 | 50 | 51 | @pytest.mark.parametrize("hcl_fname,json_fname,struct", FIXTURES) 52 | def test_decoder(hcl_fname, json_fname, struct): 53 | 54 | with 
open(join(FIXTURE_DIR, hcl_fname), 'r') as fp: 55 | hcl_json = hcl.load(fp) 56 | 57 | assert json_fname is not None or struct is not None 58 | 59 | if json_fname is not None: 60 | with open(join(FIXTURE_DIR, json_fname), 'r') as fp: 61 | good_json = json.load(fp) 62 | 63 | assert hcl_json == good_json 64 | 65 | if struct is not None: 66 | assert hcl_json == struct 67 | 68 | 69 | COMMENTED_FIXTURES = [ 70 | ('single_line_comment.hcl', 'single_line_comment_L.json', "single_line_comment.json", 'single_line_comment_L.json'), 71 | ('multi_line_comment.hcl', 'multi_line_comment.json', 'multi_line_comment_M.json', 'multi_line_comment_M.json'), 72 | ('structure_comment.hcl', 'structure_comment_L.json', 'structure_comment_M.json', 'structure_comment_A.json'), 73 | ('array_comment.hcl', 'array_comment.json', 'array_comment.json', 'array_comment.json') 74 | ] 75 | 76 | @pytest.mark.parametrize("export_comments", ['LINE', 'MULTILINE', 'ALL']) 77 | @pytest.mark.parametrize("hcl_fname,sline_fname,mline_fname,aline_fname", COMMENTED_FIXTURES) 78 | def test_decoder_export_comments(hcl_fname, sline_fname, mline_fname, aline_fname, export_comments): 79 | with open(join(FIXTURE_DIR, hcl_fname), 'r') as fp: 80 | hcl_json = hcl.load(fp, export_comments) 81 | 82 | json_fname = { 83 | "LINE": sline_fname, 84 | "MULTILINE": mline_fname, 85 | "ALL": aline_fname 86 | } 87 | 88 | with open(join(FIXTURE_DIR, json_fname[export_comments]), 'r') as fp: 89 | good_json = json.load(fp) 90 | 91 | assert hcl_json == good_json -------------------------------------------------------------------------------- /src/hcl/lexer.py: -------------------------------------------------------------------------------- 1 | import re 2 | import sys 3 | 4 | from .ply import lex 5 | 6 | if sys.version_info < (3,): 7 | text_type = unicode 8 | else: 9 | text_type = str 10 | 11 | 12 | def _raise_error(t, message=None): 13 | lexpos = t.lexer.lexpos 14 | lexdata = t.lexer.lexdata 15 | lineno = t.lexer.lineno 16 | column = _find_column(lexdata, t) 17 | if message is None: 18 | message = "Illegal character '%s'" % lexdata[lexpos] 19 | raise ValueError( 20 | "Line %d, column %d, index %d: %s" % (lineno, column, lexpos, message) 21 | ) 22 | 23 | 24 | def _find_column(input, token): 25 | last_cr = input.rfind('\n', 0, token.lexpos) 26 | column = (token.lexpos - last_cr) - 1 27 | return column 28 | 29 | 30 | class Lexer(object): 31 | 32 | tokens = ( 33 | 'BOOL', 34 | 'FLOAT', 35 | 'NUMBER', 36 | 'COMMA', 37 | 'COMMENT', 38 | 'MULTICOMMENT', 39 | 'IDENTIFIER', 40 | 'EQUAL', 41 | 'STRING', 42 | 'ADD', 43 | 'MINUS', 44 | 'MULTIPLY', 45 | 'DIVIDE', 46 | 'LEFTBRACE', 47 | 'RIGHTBRACE', 48 | 'LEFTBRACKET', 49 | 'RIGHTBRACKET', 50 | 'PERIOD', 51 | 'EPLUS', 52 | 'EMINUS', 53 | 'LEFTPAREN', 54 | 'RIGHTPAREN', 55 | 'QMARK', 56 | 'COLON', 57 | 'ASTERISK_PERIOD', 58 | 'GT', 59 | 'LT', 60 | 'EQ', 61 | 'NE', 62 | 'LE', 63 | 'GE', 64 | ) 65 | 66 | states = ( 67 | ('stringdollar', 'exclusive'), 68 | ('string', 'exclusive'), 69 | ('heredoc', 'exclusive'), 70 | ('tabbedheredoc', 'exclusive'), 71 | ) 72 | 73 | can_export_comments = [] 74 | 75 | def t_BOOL(self, t): 76 | r'(true)|(false)' 77 | t.value = t.value == 'true' 78 | return t 79 | 80 | def t_EMINUS(self, t): 81 | r'(?<=\d|\.)[eE]-' 82 | return t 83 | 84 | def t_EPLUS(self, t): 85 | r'(?<=\d)[eE]\+?|(?<=\d\.)[eE]\+?' 
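        # EPLUS (and EMINUS above) tokenize the exponent marker of scientific-notation
        # numbers such as 1e10 or 1.5e+3; the lookbehinds only match when a digit (or a
        # digit followed by '.') immediately precedes the 'e'/'E'.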
86 | return t 87 | 88 | def t_FLOAT(self, t): 89 | r'-?((\d+\.\d*)|(\d*\.\d+))' 90 | t.value = float(t.value) 91 | return t 92 | 93 | def t_hexnumber(self, t): 94 | r'-?0[xX][0-9a-fA-F]+' 95 | t.value = int(t.value, base=16) 96 | t.type = 'NUMBER' 97 | return t 98 | 99 | def t_intnumber(self, t): 100 | r'-?\d+' 101 | t.value = int(t.value) 102 | t.type = 'NUMBER' 103 | return t 104 | 105 | def t_PERIOD(self, t): 106 | r'\.' 107 | return t 108 | 109 | def t_COMMA(self, t): 110 | r',' 111 | return t 112 | 113 | def t_QMARK(self, t): 114 | r'\?' 115 | return t 116 | 117 | def t_COLON(self, t): 118 | r':' 119 | return t 120 | 121 | def t_ASTERISK_PERIOD(self, t): 122 | r'\*\.' 123 | return t 124 | 125 | def t_GT(self, t): 126 | r'(?)>(?!>|=)' 127 | return t 128 | 129 | def t_LT(self, t): 130 | r'(?=' 147 | return t 148 | 149 | def t_IDENTIFIER(self, t): 150 | r'[^\W\d][\w.-]*' 151 | t.value = text_type(t.value) 152 | return t 153 | 154 | # Strings 155 | def t_string(self, t): 156 | # Start of a string 157 | r'\"' 158 | # abs_start is the absolute start of the string. We use this at the end 159 | # to know how many new lines we've consumed 160 | t.lexer.abs_start = t.lexer.lexpos 161 | # rel_pos is the begining of the unconsumed part of the string. It will 162 | # get modified when consuming escaped characters 163 | t.lexer.rel_pos = t.lexer.lexpos 164 | # The value of the consumed part of the string 165 | t.lexer.string_value = u'' 166 | t.lexer.begin('string') 167 | 168 | def t_string_escapedchar(self, t): 169 | # If a quote or backslash is escaped, build up the string by ignoring 170 | # the escape character. Should this be done for other characters? 171 | r'(?<=\\)(\"|\\)' 172 | t.lexer.string_value += ( 173 | t.lexer.lexdata[t.lexer.rel_pos : t.lexer.lexpos - 2] + t.value 174 | ) 175 | t.lexer.rel_pos = t.lexer.lexpos 176 | pass 177 | 178 | def t_string_stringdollar(self, t): 179 | # Left brace preceeded by a dollar 180 | r'(?<=\$)\{' 181 | t.lexer.braces = 1 182 | t.lexer.begin('stringdollar') 183 | 184 | def t_string_ignoring(self, t): 185 | # Ignore everything except for a quote 186 | r'[^\"]' 187 | pass 188 | 189 | def t_string_STRING(self, t): 190 | # End of the string 191 | r'\"' 192 | t.value = ( 193 | t.lexer.string_value + t.lexer.lexdata[t.lexer.rel_pos : t.lexer.lexpos - 1] 194 | ) 195 | t.lexer.lineno += t.lexer.lexdata[t.lexer.abs_start : t.lexer.lexpos - 1].count( 196 | '\n' 197 | ) 198 | t.lexer.begin('INITIAL') 199 | return t 200 | 201 | def t_string_eof(self, t): 202 | t.lexer.lineno += t.lexer.lexdata[t.lexer.abs_start : t.lexer.lexpos].count( 203 | '\n' 204 | ) 205 | _raise_error(t, 'EOF before closing string quote') 206 | 207 | def t_stringdollar_dontcare(self, t): 208 | # Ignore everything except for braces 209 | r'[^\{\}]' 210 | pass 211 | 212 | def t_stringdollar_lbrace(self, t): 213 | r'\{' 214 | t.lexer.braces += 1 215 | 216 | def t_stringdollar_rbrace(self, t): 217 | r'\}' 218 | t.lexer.braces -= 1 219 | 220 | if t.lexer.braces == 0: 221 | # End of the dollar brace, back to the rest of the string 222 | t.lexer.begin('string') 223 | 224 | def t_stringdollar_eof(self, t): 225 | t.lexer.lineno += t.lexer.lexdata[t.lexer.abs_start : t.lexer.lexpos].count( 226 | '\n' 227 | ) 228 | _raise_error(t, "EOF before closing '${}' expression") 229 | 230 | def _init_heredoc(self, t): 231 | t.lexer.here_start = t.lexer.lexpos 232 | 233 | if t.value.endswith('\r\n'): 234 | t.lexer.newline_chars = 2 235 | else: 236 | t.lexer.newline_chars = 1 237 | 238 | if t.lexer.is_tabbed: 239 | 
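            # A '<<-' ("tabbed") heredoc has a three-character introducer; the leading
            # tabs on its body lines are stripped later, in _end_heredoc.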
# Chop '<<-' 240 | chop = 3 241 | else: 242 | # Chop '<<' 243 | chop = 2 244 | 245 | t.lexer.here_identifier = t.value[chop : -t.lexer.newline_chars] 246 | # We consumed a newline in the regex so bump the counter 247 | t.lexer.lineno += 1 248 | 249 | def t_tabbedheredoc(self, t): 250 | r'<<-\S+\r?\n' 251 | t.lexer.is_tabbed = True 252 | self._init_heredoc(t) 253 | t.lexer.begin('tabbedheredoc') 254 | 255 | def t_heredoc(self, t): 256 | r'<<\S+\r?\n' 257 | t.lexer.is_tabbed = False 258 | self._init_heredoc(t) 259 | t.lexer.begin('heredoc') 260 | 261 | def _end_heredoc(self, t): 262 | if t.lexer.is_tabbed: 263 | # Strip leading tabs 264 | value = t.value.strip() 265 | else: 266 | value = t.value 267 | 268 | if value == t.lexer.here_identifier: 269 | # Handle case where identifier is on a line of its own. Need to 270 | # subtract the current line and the newline characters from 271 | # the previous line to get the endpos 272 | endpos = t.lexer.lexpos - (t.lexer.newline_chars + len(t.value)) 273 | elif value.endswith(t.lexer.here_identifier): 274 | # Handle case where identifier is at the end of the line. Need to 275 | # subtract the identifier from to get the endpos 276 | endpos = t.lexer.lexpos - len(t.lexer.here_identifier) 277 | else: 278 | return 279 | 280 | entire_string = t.lexer.lexdata[t.lexer.here_start : endpos] 281 | 282 | if t.lexer.is_tabbed: 283 | # Get rid of any initial tabs, and remove any tabs preceded by 284 | # a new line 285 | chopped_starting_tabs = re.sub('^\t*', '', entire_string) 286 | t.value = re.sub('\n\t*', '\n', chopped_starting_tabs) 287 | else: 288 | t.value = entire_string 289 | 290 | t.lexer.lineno += t.lexer.lexdata[t.lexer.here_start : t.lexer.lexpos].count( 291 | '\n' 292 | ) 293 | t.lexer.begin('INITIAL') 294 | return t 295 | 296 | def t_tabbedheredoc_STRING(self, t): 297 | r'^\t*.+?(?=\r?$)' 298 | return self._end_heredoc(t) 299 | 300 | def t_heredoc_STRING(self, t): 301 | r'^.+?(?=\r?$)' 302 | return self._end_heredoc(t) 303 | 304 | def t_heredoc_ignoring(self, t): 305 | r'.+|\n' 306 | pass 307 | 308 | def t_heredoc_eof(self, t): 309 | t.lexer.lineno += t.lexer.lexdata[t.lexer.here_start : t.lexer.lexpos].count( 310 | '\n' 311 | ) 312 | _raise_error(t, 'EOF before closing heredoc') 313 | 314 | t_tabbedheredoc_ignoring = t_heredoc_ignoring 315 | t_tabbedheredoc_eof = t_heredoc_eof 316 | 317 | t_LEFTBRACE = r'\{' 318 | t_RIGHTBRACE = r'\}' 319 | t_LEFTBRACKET = r'\[' 320 | t_RIGHTBRACKET = r'\]' 321 | t_LEFTPAREN = r'\(' 322 | t_RIGHTPAREN = r'\)' 323 | 324 | def t_COMMENT(self, t): 325 | r'(\#|(//)).*' 326 | if 'COMMENT' in self.can_export_comments: 327 | t.value = t.value.lstrip('#').lstrip('//').lstrip() 328 | return t 329 | 330 | def t_MULTICOMMENT(self, t): 331 | r'/\*(.|\n)*?(\*/)' 332 | t.lexer.lineno += t.value.count('\n') 333 | if 'MULTICOMMENT' in self.can_export_comments: 334 | return t 335 | 336 | # Define a rule so we can track line numbers 337 | def t_newline(self, t): 338 | r'\n+' 339 | t.lexer.lineno += len(t.value) 340 | 341 | t_ignore = ' \t\r\f\v' 342 | 343 | t_EQUAL = r'(?"), 252 | ("LT", "<"), 253 | ("EQ", "=="), 254 | ("NE", "!="), 255 | ("LE", "<="), 256 | ("GE", ">="), 257 | ("ASTERISK_PERIOD", "*."), 258 | 259 | # Bools 260 | ("BOOL", "true"), 261 | ("BOOL", "false"), 262 | 263 | # Identifier 264 | ("IDENTIFIER", "a"), 265 | ("IDENTIFIER", "a0"), 266 | ("IDENTIFIER", "foobar"), 267 | ("IDENTIFIER", "foo-bar"), 268 | ("IDENTIFIER", "abc123"), 269 | ("IDENTIFIER", "LGTM"), 270 | ("IDENTIFIER", "_"), 271 | ("IDENTIFIER", "_abc123"), 
272 | ("IDENTIFIER", "abc123_"), 273 | ("IDENTIFIER", "_abc_123_"), 274 | ("IDENTIFIER", "_äöü"), 275 | ("IDENTIFIER", "_本"), 276 | ("IDENTIFIER", "äöü"), 277 | ("IDENTIFIER", "本"), 278 | ("IDENTIFIER", "a۰۱۸"), 279 | ("IDENTIFIER", "foo६४"), 280 | ("IDENTIFIER", "bar9876"), 281 | 282 | # Heredoc 283 | ("STRING", "< 0: 514 | lexindexfunc[i] = (None, None) 515 | else: 516 | lexindexfunc[i] = (None, toknames[f]) 517 | 518 | return [(lexre, lexindexfunc)], [regex], [lexindexnames] 519 | except Exception: 520 | m = int(len(relist)/2) 521 | if m == 0: 522 | m = 1 523 | llist, lre, lnames = _form_master_re(relist[:m], reflags, ldict, toknames) 524 | rlist, rre, rnames = _form_master_re(relist[m:], reflags, ldict, toknames) 525 | return (llist+rlist), (lre+rre), (lnames+rnames) 526 | 527 | # ----------------------------------------------------------------------------- 528 | # def _statetoken(s,names) 529 | # 530 | # Given a declaration name s of the form "t_" and a dictionary whose keys are 531 | # state names, this function returns a tuple (states,tokenname) where states 532 | # is a tuple of state names and tokenname is the name of the token. For example, 533 | # calling this with s = "t_foo_bar_SPAM" might return (('foo','bar'),'SPAM') 534 | # ----------------------------------------------------------------------------- 535 | def _statetoken(s, names): 536 | parts = s.split('_') 537 | for i, part in enumerate(parts[1:], 1): 538 | if part not in names and part != 'ANY': 539 | break 540 | 541 | if i > 1: 542 | states = tuple(parts[1:i]) 543 | else: 544 | states = ('INITIAL',) 545 | 546 | if 'ANY' in states: 547 | states = tuple(names) 548 | 549 | tokenname = '_'.join(parts[i:]) 550 | return (states, tokenname) 551 | 552 | 553 | # ----------------------------------------------------------------------------- 554 | # LexerReflect() 555 | # 556 | # This class represents information needed to build a lexer as extracted from a 557 | # user's input file. 
558 | # ----------------------------------------------------------------------------- 559 | class LexerReflect(object): 560 | def __init__(self, ldict, log=None, reflags=0): 561 | self.ldict = ldict 562 | self.error_func = None 563 | self.tokens = [] 564 | self.reflags = reflags 565 | self.stateinfo = {'INITIAL': 'inclusive'} 566 | self.modules = set() 567 | self.error = False 568 | self.log = PlyLogger(sys.stderr) if log is None else log 569 | 570 | # Get all of the basic information 571 | def get_all(self): 572 | self.get_tokens() 573 | self.get_literals() 574 | self.get_states() 575 | self.get_rules() 576 | 577 | # Validate all of the information 578 | def validate_all(self): 579 | self.validate_tokens() 580 | self.validate_literals() 581 | self.validate_rules() 582 | return self.error 583 | 584 | # Get the tokens map 585 | def get_tokens(self): 586 | tokens = self.ldict.get('tokens', None) 587 | if not tokens: 588 | self.log.error('No token list is defined') 589 | self.error = True 590 | return 591 | 592 | if not isinstance(tokens, (list, tuple)): 593 | self.log.error('tokens must be a list or tuple') 594 | self.error = True 595 | return 596 | 597 | if not tokens: 598 | self.log.error('tokens is empty') 599 | self.error = True 600 | return 601 | 602 | self.tokens = tokens 603 | 604 | # Validate the tokens 605 | def validate_tokens(self): 606 | terminals = {} 607 | for n in self.tokens: 608 | if not _is_identifier.match(n): 609 | self.log.error("Bad token name '%s'", n) 610 | self.error = True 611 | if n in terminals: 612 | self.log.warning("Token '%s' multiply defined", n) 613 | terminals[n] = 1 614 | 615 | # Get the literals specifier 616 | def get_literals(self): 617 | self.literals = self.ldict.get('literals', '') 618 | if not self.literals: 619 | self.literals = '' 620 | 621 | # Validate literals 622 | def validate_literals(self): 623 | try: 624 | for c in self.literals: 625 | if not isinstance(c, StringTypes) or len(c) > 1: 626 | self.log.error('Invalid literal %s. Must be a single character', repr(c)) 627 | self.error = True 628 | 629 | except TypeError: 630 | self.log.error('Invalid literals specification. literals must be a sequence of characters') 631 | self.error = True 632 | 633 | def get_states(self): 634 | self.states = self.ldict.get('states', None) 635 | # Build statemap 636 | if self.states: 637 | if not isinstance(self.states, (tuple, list)): 638 | self.log.error('states must be defined as a tuple or list') 639 | self.error = True 640 | else: 641 | for s in self.states: 642 | if not isinstance(s, tuple) or len(s) != 2: 643 | self.log.error("Invalid state specifier %s. 
Must be a tuple (statename,'exclusive|inclusive')", repr(s)) 644 | self.error = True 645 | continue 646 | name, statetype = s 647 | if not isinstance(name, StringTypes): 648 | self.log.error('State name %s must be a string', repr(name)) 649 | self.error = True 650 | continue 651 | if not (statetype == 'inclusive' or statetype == 'exclusive'): 652 | self.log.error("State type for state %s must be 'inclusive' or 'exclusive'", name) 653 | self.error = True 654 | continue 655 | if name in self.stateinfo: 656 | self.log.error("State '%s' already defined", name) 657 | self.error = True 658 | continue 659 | self.stateinfo[name] = statetype 660 | 661 | # Get all of the symbols with a t_ prefix and sort them into various 662 | # categories (functions, strings, error functions, and ignore characters) 663 | 664 | def get_rules(self): 665 | tsymbols = [f for f in self.ldict if f[:2] == 't_'] 666 | 667 | # Now build up a list of functions and a list of strings 668 | self.toknames = {} # Mapping of symbols to token names 669 | self.funcsym = {} # Symbols defined as functions 670 | self.strsym = {} # Symbols defined as strings 671 | self.ignore = {} # Ignore strings by state 672 | self.errorf = {} # Error functions by state 673 | self.eoff = {} # EOF functions by state 674 | 675 | for s in self.stateinfo: 676 | self.funcsym[s] = [] 677 | self.strsym[s] = [] 678 | 679 | if len(tsymbols) == 0: 680 | self.log.error('No rules of the form t_rulename are defined') 681 | self.error = True 682 | return 683 | 684 | for f in tsymbols: 685 | t = self.ldict[f] 686 | states, tokname = _statetoken(f, self.stateinfo) 687 | self.toknames[f] = tokname 688 | 689 | if hasattr(t, '__call__'): 690 | if tokname == 'error': 691 | for s in states: 692 | self.errorf[s] = t 693 | elif tokname == 'eof': 694 | for s in states: 695 | self.eoff[s] = t 696 | elif tokname == 'ignore': 697 | line = t.__code__.co_firstlineno 698 | file = t.__code__.co_filename 699 | self.log.error("%s:%d: Rule '%s' must be defined as a string", file, line, t.__name__) 700 | self.error = True 701 | else: 702 | for s in states: 703 | self.funcsym[s].append((f, t)) 704 | elif isinstance(t, StringTypes): 705 | if tokname == 'ignore': 706 | for s in states: 707 | self.ignore[s] = t 708 | if '\\' in t: 709 | self.log.warning("%s contains a literal backslash '\\'", f) 710 | 711 | elif tokname == 'error': 712 | self.log.error("Rule '%s' must be defined as a function", f) 713 | self.error = True 714 | else: 715 | for s in states: 716 | self.strsym[s].append((f, t)) 717 | else: 718 | self.log.error('%s not defined as a function or string', f) 719 | self.error = True 720 | 721 | # Sort the functions by line number 722 | for f in self.funcsym.values(): 723 | f.sort(key=lambda x: x[1].__code__.co_firstlineno) 724 | 725 | # Sort the strings by regular expression length 726 | for s in self.strsym.values(): 727 | s.sort(key=lambda x: len(x[1]), reverse=True) 728 | 729 | # Validate all of the t_rules collected 730 | def validate_rules(self): 731 | for state in self.stateinfo: 732 | # Validate all rules defined by functions 733 | 734 | for fname, f in self.funcsym[state]: 735 | line = f.__code__.co_firstlineno 736 | file = f.__code__.co_filename 737 | module = inspect.getmodule(f) 738 | self.modules.add(module) 739 | 740 | tokname = self.toknames[fname] 741 | if isinstance(f, types.MethodType): 742 | reqargs = 2 743 | else: 744 | reqargs = 1 745 | nargs = f.__code__.co_argcount 746 | if nargs > reqargs: 747 | self.log.error("%s:%d: Rule '%s' has too many arguments", file, 
line, f.__name__) 748 | self.error = True 749 | continue 750 | 751 | if nargs < reqargs: 752 | self.log.error("%s:%d: Rule '%s' requires an argument", file, line, f.__name__) 753 | self.error = True 754 | continue 755 | 756 | if not _get_regex(f): 757 | self.log.error("%s:%d: No regular expression defined for rule '%s'", file, line, f.__name__) 758 | self.error = True 759 | continue 760 | 761 | try: 762 | c = re.compile('(?P<%s>%s)' % (fname, _get_regex(f)), self.reflags) 763 | if c.match(''): 764 | self.log.error("%s:%d: Regular expression for rule '%s' matches empty string", file, line, f.__name__) 765 | self.error = True 766 | except re.error as e: 767 | self.log.error("%s:%d: Invalid regular expression for rule '%s'. %s", file, line, f.__name__, e) 768 | if '#' in _get_regex(f): 769 | self.log.error("%s:%d. Make sure '#' in rule '%s' is escaped with '\\#'", file, line, f.__name__) 770 | self.error = True 771 | 772 | # Validate all rules defined by strings 773 | for name, r in self.strsym[state]: 774 | tokname = self.toknames[name] 775 | if tokname == 'error': 776 | self.log.error("Rule '%s' must be defined as a function", name) 777 | self.error = True 778 | continue 779 | 780 | if tokname not in self.tokens and tokname.find('ignore_') < 0: 781 | self.log.error("Rule '%s' defined for an unspecified token %s", name, tokname) 782 | self.error = True 783 | continue 784 | 785 | try: 786 | c = re.compile('(?P<%s>%s)' % (name, r), self.reflags) 787 | if (c.match('')): 788 | self.log.error("Regular expression for rule '%s' matches empty string", name) 789 | self.error = True 790 | except re.error as e: 791 | self.log.error("Invalid regular expression for rule '%s'. %s", name, e) 792 | if '#' in r: 793 | self.log.error("Make sure '#' in rule '%s' is escaped with '\\#'", name) 794 | self.error = True 795 | 796 | if not self.funcsym[state] and not self.strsym[state]: 797 | self.log.error("No rules defined for state '%s'", state) 798 | self.error = True 799 | 800 | # Validate the error function 801 | efunc = self.errorf.get(state, None) 802 | if efunc: 803 | f = efunc 804 | line = f.__code__.co_firstlineno 805 | file = f.__code__.co_filename 806 | module = inspect.getmodule(f) 807 | self.modules.add(module) 808 | 809 | if isinstance(f, types.MethodType): 810 | reqargs = 2 811 | else: 812 | reqargs = 1 813 | nargs = f.__code__.co_argcount 814 | if nargs > reqargs: 815 | self.log.error("%s:%d: Rule '%s' has too many arguments", file, line, f.__name__) 816 | self.error = True 817 | 818 | if nargs < reqargs: 819 | self.log.error("%s:%d: Rule '%s' requires an argument", file, line, f.__name__) 820 | self.error = True 821 | 822 | for module in self.modules: 823 | self.validate_module(module) 824 | 825 | # ----------------------------------------------------------------------------- 826 | # validate_module() 827 | # 828 | # This checks to see if there are duplicated t_rulename() functions or strings 829 | # in the parser input file. This is done using a simple regular expression 830 | # match on each line in the source code of the given module. 
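# Without this check a duplicated rule could go unnoticed, because the later
# definition silently rebinds the t_ name when the module is executed.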
831 | # ----------------------------------------------------------------------------- 832 | 833 | def validate_module(self, module): 834 | try: 835 | lines, linen = inspect.getsourcelines(module) 836 | except IOError: 837 | return 838 | 839 | fre = re.compile(r'\s*def\s+(t_[a-zA-Z_0-9]*)\(') 840 | sre = re.compile(r'\s*(t_[a-zA-Z_0-9]*)\s*=') 841 | 842 | counthash = {} 843 | linen += 1 844 | for line in lines: 845 | m = fre.match(line) 846 | if not m: 847 | m = sre.match(line) 848 | if m: 849 | name = m.group(1) 850 | prev = counthash.get(name) 851 | if not prev: 852 | counthash[name] = linen 853 | else: 854 | filename = inspect.getsourcefile(module) 855 | self.log.error('%s:%d: Rule %s redefined. Previously defined on line %d', filename, linen, name, prev) 856 | self.error = True 857 | linen += 1 858 | 859 | # ----------------------------------------------------------------------------- 860 | # lex(module) 861 | # 862 | # Build all of the regular expression rules from definitions in the supplied module 863 | # ----------------------------------------------------------------------------- 864 | def lex(module=None, object=None, debug=False, optimize=False, lextab='lextab', 865 | reflags=int(re.VERBOSE), nowarn=False, outputdir=None, debuglog=None, errorlog=None): 866 | 867 | if lextab is None: 868 | lextab = 'lextab' 869 | 870 | global lexer 871 | 872 | ldict = None 873 | stateinfo = {'INITIAL': 'inclusive'} 874 | lexobj = Lexer() 875 | lexobj.lexoptimize = optimize 876 | global token, input 877 | 878 | if errorlog is None: 879 | errorlog = PlyLogger(sys.stderr) 880 | 881 | if debug: 882 | if debuglog is None: 883 | debuglog = PlyLogger(sys.stderr) 884 | 885 | # Get the module dictionary used for the lexer 886 | if object: 887 | module = object 888 | 889 | # Get the module dictionary used for the parser 890 | if module: 891 | _items = [(k, getattr(module, k)) for k in dir(module)] 892 | ldict = dict(_items) 893 | # If no __file__ attribute is available, try to obtain it from the __module__ instead 894 | if '__file__' not in ldict: 895 | ldict['__file__'] = sys.modules[ldict['__module__']].__file__ 896 | else: 897 | ldict = get_caller_module_dict(2) 898 | 899 | # Determine if the module is package of a package or not. 900 | # If so, fix the tabmodule setting so that tables load correctly 901 | pkg = ldict.get('__package__') 902 | if pkg and isinstance(lextab, str): 903 | if '.' not in lextab: 904 | lextab = pkg + '.' 
+ lextab 905 | 906 | # Collect parser information from the dictionary 907 | linfo = LexerReflect(ldict, log=errorlog, reflags=reflags) 908 | linfo.get_all() 909 | if not optimize: 910 | if linfo.validate_all(): 911 | raise SyntaxError("Can't build lexer") 912 | 913 | if optimize and lextab: 914 | try: 915 | lexobj.readtab(lextab, ldict) 916 | token = lexobj.token 917 | input = lexobj.input 918 | lexer = lexobj 919 | return lexobj 920 | 921 | except ImportError: 922 | pass 923 | 924 | # Dump some basic debugging information 925 | if debug: 926 | debuglog.info('lex: tokens = %r', linfo.tokens) 927 | debuglog.info('lex: literals = %r', linfo.literals) 928 | debuglog.info('lex: states = %r', linfo.stateinfo) 929 | 930 | # Build a dictionary of valid token names 931 | lexobj.lextokens = set() 932 | for n in linfo.tokens: 933 | lexobj.lextokens.add(n) 934 | 935 | # Get literals specification 936 | if isinstance(linfo.literals, (list, tuple)): 937 | lexobj.lexliterals = type(linfo.literals[0])().join(linfo.literals) 938 | else: 939 | lexobj.lexliterals = linfo.literals 940 | 941 | lexobj.lextokens_all = lexobj.lextokens | set(lexobj.lexliterals) 942 | 943 | # Get the stateinfo dictionary 944 | stateinfo = linfo.stateinfo 945 | 946 | regexs = {} 947 | # Build the master regular expressions 948 | for state in stateinfo: 949 | regex_list = [] 950 | 951 | # Add rules defined by functions first 952 | for fname, f in linfo.funcsym[state]: 953 | regex_list.append('(?P<%s>%s)' % (fname, _get_regex(f))) 954 | if debug: 955 | debuglog.info("lex: Adding rule %s -> '%s' (state '%s')", fname, _get_regex(f), state) 956 | 957 | # Now add all of the simple rules 958 | for name, r in linfo.strsym[state]: 959 | regex_list.append('(?P<%s>%s)' % (name, r)) 960 | if debug: 961 | debuglog.info("lex: Adding rule %s -> '%s' (state '%s')", name, r, state) 962 | 963 | regexs[state] = regex_list 964 | 965 | # Build the master regular expressions 966 | 967 | if debug: 968 | debuglog.info('lex: ==== MASTER REGEXS FOLLOW ====') 969 | 970 | for state in regexs: 971 | lexre, re_text, re_names = _form_master_re(regexs[state], reflags, ldict, linfo.toknames) 972 | lexobj.lexstatere[state] = lexre 973 | lexobj.lexstateretext[state] = re_text 974 | lexobj.lexstaterenames[state] = re_names 975 | if debug: 976 | for i, text in enumerate(re_text): 977 | debuglog.info("lex: state '%s' : regex[%d] = '%s'", state, i, text) 978 | 979 | # For inclusive states, we need to add the regular expressions from the INITIAL state 980 | for state, stype in stateinfo.items(): 981 | if state != 'INITIAL' and stype == 'inclusive': 982 | lexobj.lexstatere[state].extend(lexobj.lexstatere['INITIAL']) 983 | lexobj.lexstateretext[state].extend(lexobj.lexstateretext['INITIAL']) 984 | lexobj.lexstaterenames[state].extend(lexobj.lexstaterenames['INITIAL']) 985 | 986 | lexobj.lexstateinfo = stateinfo 987 | lexobj.lexre = lexobj.lexstatere['INITIAL'] 988 | lexobj.lexretext = lexobj.lexstateretext['INITIAL'] 989 | lexobj.lexreflags = reflags 990 | 991 | # Set up ignore variables 992 | lexobj.lexstateignore = linfo.ignore 993 | lexobj.lexignore = lexobj.lexstateignore.get('INITIAL', '') 994 | 995 | # Set up error functions 996 | lexobj.lexstateerrorf = linfo.errorf 997 | lexobj.lexerrorf = linfo.errorf.get('INITIAL', None) 998 | if not lexobj.lexerrorf: 999 | errorlog.warning('No t_error rule is defined') 1000 | 1001 | # Set up eof functions 1002 | lexobj.lexstateeoff = linfo.eoff 1003 | lexobj.lexeoff = linfo.eoff.get('INITIAL', None) 1004 | 1005 | # Check state 
information for ignore and error rules 1006 | for s, stype in stateinfo.items(): 1007 | if stype == 'exclusive': 1008 | if s not in linfo.errorf: 1009 | errorlog.warning("No error rule is defined for exclusive state '%s'", s) 1010 | if s not in linfo.ignore and lexobj.lexignore: 1011 | errorlog.warning("No ignore rule is defined for exclusive state '%s'", s) 1012 | elif stype == 'inclusive': 1013 | if s not in linfo.errorf: 1014 | linfo.errorf[s] = linfo.errorf.get('INITIAL', None) 1015 | if s not in linfo.ignore: 1016 | linfo.ignore[s] = linfo.ignore.get('INITIAL', '') 1017 | 1018 | # Create global versions of the token() and input() functions 1019 | token = lexobj.token 1020 | input = lexobj.input 1021 | lexer = lexobj 1022 | 1023 | # If in optimize mode, we write the lextab 1024 | if lextab and optimize: 1025 | if outputdir is None: 1026 | # If no output directory is set, the location of the output files 1027 | # is determined according to the following rules: 1028 | # - If lextab specifies a package, files go into that package directory 1029 | # - Otherwise, files go in the same directory as the specifying module 1030 | if isinstance(lextab, types.ModuleType): 1031 | srcfile = lextab.__file__ 1032 | else: 1033 | if '.' not in lextab: 1034 | srcfile = ldict['__file__'] 1035 | else: 1036 | parts = lextab.split('.') 1037 | pkgname = '.'.join(parts[:-1]) 1038 | exec('import %s' % pkgname) 1039 | srcfile = getattr(sys.modules[pkgname], '__file__', '') 1040 | outputdir = os.path.dirname(srcfile) 1041 | try: 1042 | lexobj.writetab(lextab, outputdir) 1043 | if lextab in sys.modules: 1044 | del sys.modules[lextab] 1045 | except IOError as e: 1046 | errorlog.warning("Couldn't write lextab module %r. %s" % (lextab, e)) 1047 | 1048 | return lexobj 1049 | 1050 | # ----------------------------------------------------------------------------- 1051 | # runmain() 1052 | # 1053 | # This runs the lexer as a main program 1054 | # ----------------------------------------------------------------------------- 1055 | 1056 | def runmain(lexer=None, data=None): 1057 | if not data: 1058 | try: 1059 | filename = sys.argv[1] 1060 | with open(filename) as f: 1061 | data = f.read() 1062 | except IndexError: 1063 | sys.stdout.write('Reading from standard input (type EOF to end):\n') 1064 | data = sys.stdin.read() 1065 | 1066 | if lexer: 1067 | _input = lexer.input 1068 | else: 1069 | _input = input 1070 | _input(data) 1071 | if lexer: 1072 | _token = lexer.token 1073 | else: 1074 | _token = token 1075 | 1076 | while True: 1077 | tok = _token() 1078 | if not tok: 1079 | break 1080 | sys.stdout.write('(%s,%r,%d,%d)\n' % (tok.type, tok.value, tok.lineno, tok.lexpos)) 1081 | 1082 | # ----------------------------------------------------------------------------- 1083 | # @TOKEN(regex) 1084 | # 1085 | # This decorator function can be used to set the regex expression on a function 1086 | # when its docstring might need to be set in an alternative way 1087 | # ----------------------------------------------------------------------------- 1088 | 1089 | def TOKEN(r): 1090 | def set_regex(f): 1091 | if hasattr(r, '__call__'): 1092 | f.regex = _get_regex(r) 1093 | else: 1094 | f.regex = r 1095 | return f 1096 | return set_regex 1097 | 1098 | # Alternative spelling of the TOKEN decorator 1099 | Token = TOKEN 1100 | --------------------------------------------------------------------------------
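A quick usage sketch tying the pieces above together (minimal and illustrative only:
``load``/``loads``/``dumps`` are the entry points named in the README and are assumed
here to mirror the json-module signatures; ``dumps`` emits JSON rather than HCL, and
the optional comment-export mode is the one exercised in tests/test_decoder.py)::

    import hcl

    # Parse an HCL string into a plain dict (same data as tests/fixtures/flat.hcl).
    obj = hcl.loads('foo = "bar"\nKey = 7')
    assert obj == {'foo': 'bar', 'Key': 7}

    # Serialize back out; the output is JSON, not HCL.
    print(hcl.dumps(obj))

    # Comments can optionally be exported when loading, as in tests/test_decoder.py
    # (modes 'LINE', 'MULTILINE', or 'ALL').
    with open('file.hcl', 'r') as fp:
        obj_with_comments = hcl.load(fp, 'ALL')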