const unicodeLetter = /\p{L}/ unicodePunctuation = /\p{Pc}/ unicodeDigit = /[0-9]/ module.exports = grammar({ name: 'hcl', conflicts: $ => [ [$.body], [$.object_elem, $.variable_expr], [$.attr_splat], [$.full_splat], ], extras: $ => [ $.comment, /\s/, ], rules: { config_file: $ => $.body, body: $ => repeat1(seq( choice( $.attribute, $.block, ), )), attribute: $ => seq( field('name', $.identifier), '=', $.expression, ), block: $ => seq( field('name', $.identifier), repeat(choice($.string_lit, $.identifier)), '{', optional($.body), '}', ), // TODO: not to spec but good enough for now identifier: $ => token(seq( unicodeLetter, repeat(choice(unicodeLetter, unicodeDigit, unicodePunctuation)), )), expression: $ => choice( $.expr_term, //$.operation, //$.conditional, ), expr_term: $ => choice( $.literal_value, $.collection_value, $.variable_expr, $.function_call, $.for_expr, seq($.expr_term, $.index), seq($.expr_term, $.get_attr), seq($.expr_term, $.splat), seq('(', $.expression, ')'), ), literal_value: $ => choice( $.numeric_lit, $.string_lit, $.bool_lit, $.null_lit, ), numeric_lit: $ => /[0-9]+(\.[0-9]+([eE][-+]?[0-9]+)?)?/, string_lit: $ => (seq('"', token.immediate(repeat(choice(/[^\\"\n]/, /\\(.|\n)/))), '"')), bool_lit: $ => choice('true', 'false'), null_lit: $ => 'null', collection_value: $ => choice( $.tuple, $.object, ), tuple: $ => seq( '[', optional(seq( $.expression, repeat(seq(',', $.expression)), )), ']', ), object: $ => seq( '{', optional(seq( $.object_elem, repeat(seq(',', $.object_elem)), )), '}', ), object_elem: $ => seq( choice($.identifier, $.expression), choice('=', ':'), $.expression, ), index: $ => seq('[', $.expression, ']'), get_attr: $ => seq('.', $.identifier), splat: $ => choice($.attr_splat, $.full_splat), attr_splat: $ => seq('.', '*', repeat($.get_attr)), full_splat: $ => seq('[', '*', ']', repeat(choice($.get_attr, $.index))), for_expr: $ => choice($.for_tuple_expr, $.for_object_expr), for_tuple_expr: $ => seq( '[', $.for_intro, $.expression, optional($.for_cond), ']', ), for_object_expr: $ => seq( '{', $.for_intro, $.expression, '=>', $.expression, optional($.ellipsis), optional($.for_cond), '}', ), for_intro: $ => seq( 'for', $.identifier, optional(seq(',', $.identifier)), 'in', $.expression, ':', ), for_cond: $ => seq('if', $.expression), variable_expr: $ => $.identifier, function_call: $ => seq( field('name', $.identifier), '(', optional($.function_arguments), ')' ), function_arguments: $ => seq( $.expression, repeat(seq(',', $.expression)), optional(choice(',', $.ellipsis)) ), ellipsis: $ => token('...'), // http://stackoverflow.com/questions/13014947/regex-to-match-a-c-style-multiline-comment/36328890#36328890 comment: $ => token(choice( seq('#', /.*/), seq('//', /.*/), seq( '/*', /[^*]*\*+([^/*][^*]*\*+)*/, '/' ) )), } });