%{
package main

import (
	"bytes"
	"fmt"
	"io"
	"os"
)

// node is one element of the tree built by the grammar actions. It carries
// a name, an ordered list of child nodes and a set of string attributes.
type node struct {
	name       string
	children   []node
	attributes map[string]string
}

// String renders the node and all of its descendants as text, one node per
// line, starting with an indent of a single space.
func (n node) String() string {
	buf := new(bytes.Buffer)
	n.print(buf, " ")
	return buf.String()
}

// print writes a newline, the indent and the node name to out, followed by
// the attribute map when it is not empty, and then prints every child with
// the indent extended by one space.
func (n node) print(out io.Writer, indent string) {
	if len(n.attributes) > 0 {
		fmt.Fprintf(out, "\n%v%v %s", indent, n.name, n.attributes)
	} else {
		fmt.Fprintf(out, "\n%v%v", indent, n.name)
	}

	for _, nn := range n.children {
		nn.print(out, indent+" ")
	}
}

// Node returns a node with the given name, no children and an empty,
// writable attribute map.
func Node(name string) node {
	return node{name: name, attributes: make(map[string]string)}
}

// append adds nn to the children of n and returns the updated copy. The
// receiver is a value, so callers must use the returned node.
func (n node) append(nn ...node) node {
	n.children = append(n.children, nn...)
	return n
}

// attribute sets key to value on n and returns n. The attribute map is
// shared between copies of a node, so for nodes built with Node the change
// is visible through every copy. A node without a map (the zero value) gets
// one allocated here instead of panicking on a nil-map write; in that case
// only the returned copy carries the new map.
func (n node) attribute(key string, value string) node {
	if n.attributes == nil {
		n.attributes = make(map[string]string)
	}
	n.attributes[key] = value
	return n
}
%}

// Semantic value fields: node for tree-building nonterminals, token and
// value for plain strings.
%union{
	node  node
	token string
	value string
}

// Operator precedence and associativity declarations.
%left T_INCLUDE T_INCLUDE_ONCE T_EVAL T_REQUIRE T_REQUIRE_ONCE
%left ','
%left T_LOGICAL_OR
%left T_LOGICAL_XOR
%left T_LOGICAL_AND
%right T_PRINT
%right T_YIELD
%right T_DOUBLE_ARROW
%right T_YIELD_FROM
%left '=' T_PLUS_EQUAL T_MINUS_EQUAL T_MUL_EQUAL T_DIV_EQUAL T_CONCAT_EQUAL T_MOD_EQUAL T_AND_EQUAL T_OR_EQUAL T_XOR_EQUAL T_SL_EQUAL T_SR_EQUAL T_POW_EQUAL
%left '?' ':'
%right T_COALESCE
%left T_BOOLEAN_OR
%left T_BOOLEAN_AND
%left '|'
%left '^'
%left '&'
%nonassoc T_IS_EQUAL T_IS_NOT_EQUAL T_IS_IDENTICAL T_IS_NOT_IDENTICAL T_SPACESHIP
%nonassoc '<' T_IS_SMALLER_OR_EQUAL '>' T_IS_GREATER_OR_EQUAL
%left T_SL T_SR
%left '+' '-' '.'
%left '*' '/' '%'
%right '!'
%nonassoc T_INSTANCEOF
%right '~' T_INC T_DEC T_INT_CAST T_DOUBLE_CAST T_STRING_CAST T_ARRAY_CAST T_OBJECT_CAST T_BOOL_CAST T_UNSET_CAST '@'
%right T_POW
%right '['
%nonassoc T_NEW T_CLONE
%left T_NOELSE
%left T_ELSEIF
%left T_ELSE
%left T_ENDIF
%right T_STATIC T_ABSTRACT T_FINAL T_PRIVATE T_PROTECTED T_PUBLIC

// NOTE(review): goyacc requires a <tag> after %type, and the actions below
// use typed $$/$n values. The tags here are chosen from how each symbol is
// used in the actions: terminals are passed where a string is expected,
// the flag nonterminals are assigned string literals, and every other
// listed nonterminal is assigned a node. The tag on $unk is an assumption
// (either string field would do) - confirm.
%type <token> $unk

%token <token> T_INCLUDE
%token <token> T_INCLUDE_ONCE
%token <token> T_EXIT
%token <token> T_IF
%token <token> T_LNUMBER
%token <token> T_DNUMBER
%token <token> T_STRING
%token <token> T_STRING_VARNAME
%token <token> T_VARIABLE
%token <token> T_NUM_STRING
%token <token> T_INLINE_HTML
%token <token> T_CHARACTER
%token <token> T_BAD_CHARACTER
%token <token> T_ENCAPSED_AND_WHITESPACE
%token <token> T_CONSTANT_ENCAPSED_STRING
%token <token> T_ECHO
%token <token> T_DO
%token <token> T_WHILE
%token <token> T_ENDWHILE
%token <token> T_FOR
%token <token> T_ENDFOR
%token <token> T_FOREACH
%token <token> T_ENDFOREACH
%token <token> T_DECLARE
%token <token> T_ENDDECLARE
%token <token> T_AS
%token <token> T_SWITCH
%token <token> T_ENDSWITCH
%token <token> T_CASE
%token <token> T_DEFAULT
%token <token> T_BREAK
%token <token> T_CONTINUE
%token <token> T_GOTO
%token <token> T_FUNCTION
%token <token> T_CONST
%token <token> T_RETURN
%token <token> T_TRY
%token <token> T_CATCH
%token <token> T_FINALLY
%token <token> T_THROW
%token <token> T_USE
%token <token> T_INSTEADOF
%token <token> T_GLOBAL
%token <token> T_VAR
%token <token> T_UNSET
%token <token> T_ISSET
%token <token> T_EMPTY
%token <token> T_HALT_COMPILER
%token <token> T_CLASS
%token <token> T_TRAIT
%token <token> T_INTERFACE
%token <token> T_EXTENDS
%token <token> T_IMPLEMENTS
%token <token> T_OBJECT_OPERATOR
%token <token> T_DOUBLE_ARROW
%token <token> T_LIST
%token <token> T_ARRAY
%token <token> T_CALLABLE
%token <token> T_CLASS_C
%token <token> T_TRAIT_C
%token <token> T_METHOD_C
%token <token> T_FUNC_C
%token <token> T_LINE
%token <token> T_FILE
%token <token> T_COMMENT
%token <token> T_DOC_COMMENT
%token <token> T_OPEN_TAG
%token <token> T_OPEN_TAG_WITH_ECHO
%token <token> T_CLOSE_TAG
%token <token> T_WHITESPACE
%token <token> T_START_HEREDOC
%token <token> T_END_HEREDOC
%token <token> T_DOLLAR_OPEN_CURLY_BRACES
%token <token> T_CURLY_OPEN
%token <token> T_PAAMAYIM_NEKUDOTAYIM
%token <token> T_NAMESPACE
%token <token> T_NS_C
%token <token> T_DIR
%token <token> T_NS_SEPARATOR
%token <token> T_ELLIPSIS

// Nonterminals whose actions produce a string literal.
%type <value> class_modifier
%type <value> is_reference
%type <value> is_variadic
%type <value> returns_ref

// Nonterminals whose actions produce a node.
%type <node> identifier
%type <node> top_statement
%type <node> namespace_name
%type <node> namespace_name_parts
%type <node> name
%type <node> top_statement_list
%type <node> statement
%type <node> inner_statement
%type <node> inner_statement_list
%type <node> class_modifiers
%type <node> class_declaration_statement
%type <node> function_declaration_statement
%type <node> optional_type
%type <node> return_type
%type <node> type_expr
%type <node> type
%type <node> parameter_list
%type <node> non_empty_parameter_list
%type <node> parameter
%type <node> expr
%type <node> expr_without_variable
%type <node> callable_variable
%type <node> variable
%type <node> simple_variable
%type <node> if_stmt_without_else
%type <node> if_stmt
%type <node> alt_if_stmt_without_else
%type <node> alt_if_stmt
%type <node> while_statement
%type <node> for_exprs
%type <node> non_empty_for_exprs
%type <node> for_statement

%%

/////////////////////////////////////////////////////////////////////////

// Entry point: prints the tree built for the whole statement list.
start:
        top_statement_list                              { fmt.Println($1) }
;

reserved_non_modifiers:
      T_INCLUDE | T_INCLUDE_ONCE | T_EVAL | T_REQUIRE | T_REQUIRE_ONCE | T_LOGICAL_OR | T_LOGICAL_XOR | T_LOGICAL_AND
    | T_INSTANCEOF | T_NEW | T_CLONE | T_EXIT | T_IF | T_ELSEIF | T_ELSE | T_ENDIF | T_ECHO | T_DO | T_WHILE | T_ENDWHILE
    | T_FOR | T_ENDFOR | T_FOREACH | T_ENDFOREACH | T_DECLARE | T_ENDDECLARE | T_AS | T_TRY | T_CATCH | T_FINALLY
    | T_THROW | T_USE | T_INSTEADOF | T_GLOBAL | T_VAR | T_UNSET | T_ISSET | T_EMPTY | T_CONTINUE | T_GOTO
    | T_FUNCTION | T_CONST | T_RETURN | T_PRINT | T_YIELD | T_LIST | T_SWITCH | T_ENDSWITCH | T_CASE | T_DEFAULT | T_BREAK
    | T_ARRAY | T_CALLABLE | T_EXTENDS | T_IMPLEMENTS | T_NAMESPACE | T_TRAIT | T_INTERFACE | T_CLASS
    | T_CLASS_C | T_TRAIT_C | T_FUNC_C | T_METHOD_C | T_LINE | T_FILE | T_DIR | T_NS_C
;

semi_reserved:
        reserved_non_modifiers
    |   T_STATIC | T_ABSTRACT | T_FINAL | T_PRIVATE | T_PROTECTED | T_PUBLIC
;

identifier:
        T_STRING                                        { $$ = Node("identifier") }
    |   semi_reserved                                   { $$ = Node("reserved") }
;

namespace_name_parts:
        T_STRING                                        { $$ = Node("NamespaceParts").append(Node($1)) }
    |   namespace_name_parts T_NS_SEPARATOR T_STRING    { $$ = $1.append(Node($3)) }
;

namespace_name:
        namespace_name_parts                            { $$ = $1; }
;

name:
        namespace_name                                  { $$ = Node("Name").append($1); }
    |   T_NS_SEPARATOR namespace_name                   { $$ = Node("Name").append($2).attribute("FullyQualified", "true"); }
    |   T_NAMESPACE T_NS_SEPARATOR namespace_name       { $$ = Node("Name").append($3).attribute("Relative", "true"); }
;

top_statement_list:
        top_statement_list top_statement                { $$ = $1.append($2); }
    |   /* empty */                                     { $$ = Node("Statements") }
;

top_statement:
        statement                                       { $$ = $1 }
    |   function_declaration_statement                  { $$ = $1 }
    |   T_INCLUDE identifier ';'                        { $$ = $2; /*TODO: identifier stub, refactor it*/ }
    |   T_NAMESPACE namespace_name ';'                  { $$ = Node("Namespace").append($2); }
    |   class_declaration_statement                     { $$ = $1; }
;

inner_statement_list:
        inner_statement_list inner_statement            { $$ = $1.append($2); }
    |   /* empty */                                     { $$ = Node("statement_list") }
;

inner_statement:
        statement                                       { $$ = $1; }
    |   function_declaration_statement                  { $$ = $1; }
    |   class_declaration_statement                     { $$ = $1; }
;

statement:
        '{' inner_statement_list '}'                    { $$ = $2; }
    |   if_stmt                                         { $$ = $1; }
    |   alt_if_stmt                                     { $$ = $1; }
    |   T_WHILE '(' expr ')' while_statement
            { $$ = Node("While").append(Node("expr").append($3)).append(Node("stmt").append($5)) }
    |   T_DO statement T_WHILE '(' expr ')' ';'
            { $$ = Node("DoWhile").append(Node("expr").append($5)).append(Node("stmt").append($2))}
    |   T_FOR '(' for_exprs ';' for_exprs ';' for_exprs ')' for_statement
            {
                $$ = Node("For").
                    append(Node("expr1").append($3)).
                    append(Node("expr2").append($5)).
                    append(Node("expr3").append($7)).
                    append(Node("stmt").append($9))
            }
    |   expr ';'                                        { $$ = $1; }
;

if_stmt_without_else:
        T_IF '(' expr ')' statement
            {
                $$ = Node("If").append(Node("expr").append($3)).append(Node("stmt").append($5))
            }
    |   if_stmt_without_else T_ELSEIF '(' expr ')' statement
            {
                $$ = $1.append(Node("ElseIf").append(Node("expr").append($4)).append(Node("stmt").append($6)))
            }
;

// T_NOELSE only supplies a precedence for the rule without an else branch.
if_stmt:
        if_stmt_without_else %prec T_NOELSE             { $$ = $1; }
    |   if_stmt_without_else T_ELSE statement
            {
                $$ = $1.append(Node("Else").append(Node("stmt").append($3)))
            }
;

alt_if_stmt_without_else:
        T_IF '(' expr ')' ':' inner_statement_list
            {
                $$ = Node("AltIf").append(Node("expr").append($3)).append(Node("stmt").append($6))
            }
    |   alt_if_stmt_without_else T_ELSEIF '(' expr ')' ':' inner_statement_list
            {
                $$ = $1.append(Node("AltElseIf").append(Node("expr").append($4)).append(Node("stmt").append($7)))
            }
;

alt_if_stmt:
        alt_if_stmt_without_else T_ENDIF ';'            { $$ = $1; }
    |   alt_if_stmt_without_else T_ELSE ':' inner_statement_list T_ENDIF ';'
            {
                $$ = $1.append(Node("AltElse").append(Node("stmt").append($4)))
            }
;

while_statement:
        statement                                       { $$ = $1; }
    |   ':' inner_statement_list T_ENDWHILE ';'         { $$ = $2; }
;

for_exprs:
        /* empty */                                     { $$ = Node("null"); }
    |   non_empty_for_exprs                             { $$ = $1; }
;

non_empty_for_exprs:
        non_empty_for_exprs ',' expr                    { $$ = $1.append($3) }
    |   expr                                            { $$ = Node("ExpressionList").append($1) }
;

for_statement:
        statement                                       { $$ = $1; }
    |   ':' inner_statement_list T_ENDFOR ';'           { $$ = $2; }
;

class_declaration_statement:
        class_modifiers T_CLASS T_STRING '{' '}'        { $$ = $1.attribute("name", $3) }
    |   T_CLASS T_STRING '{' '}'                        { $$ = Node("Class").attribute("name", $2) }
;

class_modifiers:
        class_modifier                                  { $$ = Node("Class").attribute($1, "true") }
    |   class_modifiers class_modifier                  { $$ = $1.attribute($2, "true") }
;

class_modifier:
        T_ABSTRACT                                      { $$ = "abstract" }
    |   T_FINAL                                         { $$ = "final" }
;

function_declaration_statement:
        T_FUNCTION returns_ref T_STRING '(' parameter_list ')' return_type '{' inner_statement_list '}'
            {
                $$ = Node("Function").
                    attribute("name", $3).
                    attribute("returns_ref", $2).
                    append($5).
                    append($7).
                    append($9);
            }
;

parameter_list:
        non_empty_parameter_list                        { $$ = $1; }
    |   /* empty */                                     { $$ = Node("Parameter list"); }
;

non_empty_parameter_list:
        parameter                                       { $$ = Node("Parameter list").append($1) }
    |   non_empty_parameter_list ',' parameter          { $$ = $1.append($3); }
;

parameter:
        optional_type is_reference is_variadic T_VARIABLE
            {
                $$ = Node("Parameter").
                    append($1).
                    attribute("is_reference", $2).
                    attribute("is_variadic", $3).
                    attribute("var", $4);
            }
    |   optional_type is_reference is_variadic T_VARIABLE '=' expr
            {
                $$ = Node("Parameter").
                    append($1).
                    attribute("is_reference", $2).
                    attribute("is_variadic", $3).
                    attribute("var", $4).
                    append($6);
            }
;

optional_type:
        /* empty */                                     { $$ = Node("No type") }
    |   type_expr                                       { $$ = $1; }
;

returns_ref:
        /* empty */                                     { $$ = "false"; }
    |   '&'                                             { $$ = "true"; }
;

is_reference:
        /* empty */                                     { $$ = "false"; }
    |   '&'                                             { $$ = "true"; }
;

is_variadic:
        /* empty */                                     { $$ = "false"; }
    |   T_ELLIPSIS                                      { $$ = "true"; }
;

type_expr:
        type                                            { $$ = $1; }
    |   '?' type                                        { $$ = $2; $$.attribute("nullable", "true") }
;

type:
        name                                            { $$ = $1; }
    |   T_ARRAY                                         { $$ = Node("array type"); }
    |   T_CALLABLE                                      { $$ = Node("callable type"); }
;

return_type:
        /* empty */                                     { $$ = Node("void"); }
    |   ':' type_expr                                   { $$ = $2; }
;

// Each production is listed once: a repeated production adds a
// reduce/reduce conflict without changing which rule is reduced.
expr_without_variable:
        variable '=' expr                               { $$ = Node("Assign").append($1).append($3); }
    |   variable '=' '&' expr                           { $$ = Node("AssignRef").append($1).append($4); }
    |   T_CLONE expr                                    { $$ = Node("Clone").append($2); }
    |   variable T_PLUS_EQUAL expr                      { $$ = Node("AssignAdd").append($1).append($3); }
    |   variable T_MINUS_EQUAL expr                     { $$ = Node("AssignSub").append($1).append($3); }
    |   variable T_MUL_EQUAL expr                       { $$ = Node("AssignMul").append($1).append($3); }
    |   variable T_POW_EQUAL expr                       { $$ = Node("AssignPow").append($1).append($3); }
    |   variable T_DIV_EQUAL expr                       { $$ = Node("AssignDiv").append($1).append($3); }
    |   variable T_CONCAT_EQUAL expr                    { $$ = Node("AssignConcat").append($1).append($3); }
    |   variable T_MOD_EQUAL expr                       { $$ = Node("AssignMod").append($1).append($3); }
    |   variable T_AND_EQUAL expr                       { $$ = Node("AssignAnd").append($1).append($3); }
    |   variable T_OR_EQUAL expr                        { $$ = Node("AssignOr").append($1).append($3); }
    |   variable T_XOR_EQUAL expr                       { $$ = Node("AssignXor").append($1).append($3); }
    |   variable T_SL_EQUAL expr                        { $$ = Node("AssignShiftLeft").append($1).append($3); }
    |   variable T_SR_EQUAL expr                        { $$ = Node("AssignShiftRight").append($1).append($3); }
    |   variable T_INC                                  { $$ = Node("PostIncrement").append($1) }
    |   T_INC variable                                  { $$ = Node("PreIncrement").append($2) }
    |   variable T_DEC                                  { $$ = Node("PostDecrement").append($1) }
    |   T_DEC variable                                  { $$ = Node("PreDecrement").append($2) }
    |   expr T_BOOLEAN_OR expr                          { $$ = Node("Or").append($1).append($3) }
    |   expr T_BOOLEAN_AND expr                         { $$ = Node("And").append($1).append($3) }
    |   expr T_LOGICAL_OR expr                          { $$ = Node("Or").append($1).append($3) }
    |   expr T_LOGICAL_AND expr                         { $$ = Node("And").append($1).append($3) }
    |   expr T_LOGICAL_XOR expr                         { $$ = Node("Xor").append($1).append($3) }
    |   expr '|' expr                                   { $$ = Node("BitwiseOr").append($1).append($3) }
    |   expr '&' expr                                   { $$ = Node("BitwiseAnd").append($1).append($3) }
    |   expr '^' expr                                   { $$ = Node("BitwiseXor").append($1).append($3) }
    |   expr '.' expr                                   { $$ = Node("Concat").append($1).append($3) }
    |   expr '+' expr                                   { $$ = Node("Add").append($1).append($3) }
    |   expr '-' expr                                   { $$ = Node("Sub").append($1).append($3) }
    |   expr '*' expr                                   { $$ = Node("Mul").append($1).append($3) }
    |   expr T_POW expr                                 { $$ = Node("Pow").append($1).append($3) }
    |   expr '/' expr                                   { $$ = Node("Div").append($1).append($3) }
    |   expr '%' expr                                   { $$ = Node("Mod").append($1).append($3) }
    |   expr T_SL expr                                  { $$ = Node("ShiftLeft").append($1).append($3) }
    |   expr T_SR expr                                  { $$ = Node("ShiftRight").append($1).append($3) }
    |   '+' expr %prec T_INC                            { $$ = Node("UnaryPlus").append($2) }
    |   '-' expr %prec T_INC                            { $$ = Node("UnaryMinus").append($2) }
    |   '!' expr                                        { $$ = Node("BooleanNot").append($2) }
    |   '~' expr                                        { $$ = Node("BitwiseNot").append($2) }
    |   expr T_IS_IDENTICAL expr                        { $$ = Node("Identical").append($1).append($3) }
    |   expr T_IS_NOT_IDENTICAL expr                    { $$ = Node("NotIdentical").append($1).append($3) }
    |   expr T_IS_EQUAL expr                            { $$ = Node("Equal").append($1).append($3) }
    |   expr T_IS_NOT_EQUAL expr                        { $$ = Node("NotEqual").append($1).append($3) }
    |   expr T_SPACESHIP expr                           { $$ = Node("Spaceship").append($1).append($3) }
    |   expr '<' expr                                   { $$ = Node("Smaller").append($1).append($3) }
    |   expr T_IS_SMALLER_OR_EQUAL expr                 { $$ = Node("SmallerOrEqual").append($1).append($3) }
    |   expr '>' expr                                   { $$ = Node("Greater").append($1).append($3) }
    |   expr T_IS_GREATER_OR_EQUAL expr                 { $$ = Node("GreaterOrEqual").append($1).append($3) }
    |   '(' expr ')'                                    { $$ = $2; }
    |   expr '?' expr ':' expr                          { $$ = Node("Ternary").append($1).append($3).append($5); }
    |   expr '?' ':' expr                               { $$ = Node("Ternary").append($1).append($4); }
    |   expr T_COALESCE expr                            { $$ = Node("Coalesce").append($1).append($3); }
    |   T_EMPTY '(' expr ')'                            { $$ = Node("Empty").append($3); }
    |   T_INCLUDE expr                                  { $$ = Node("Include").append($2); }
    |   T_INCLUDE_ONCE expr                             { $$ = Node("IncludeOnce").append($2); }
    |   T_EVAL '(' expr ')'                             { $$ = Node("Eval").append($3); }
    |   T_REQUIRE expr                                  { $$ = Node("Require").append($2); }
    |   T_REQUIRE_ONCE expr                             { $$ = Node("RequireOnce").append($2); }
    |   T_INT_CAST expr                                 { $$ = Node("CastInt").append($2); }
    |   T_DOUBLE_CAST expr                              { $$ = Node("CastDouble").append($2); }
    |   T_STRING_CAST expr                              { $$ = Node("CastString").append($2); }
    |   T_ARRAY_CAST expr                               { $$ = Node("CastArray").append($2); }
    |   T_OBJECT_CAST expr                              { $$ = Node("CastObject").append($2); }
    |   T_BOOL_CAST expr                                { $$ = Node("CastBool").append($2); }
    |   T_UNSET_CAST expr                               { $$ = Node("CastUnset").append($2); }
    |   '@' expr                                        { $$ = Node("Silence").append($2); }
    |   T_PRINT expr                                    { $$ = Node("Print").append($2); }
    |   T_YIELD                                         { $$ = Node("Yield"); }
    |   T_YIELD expr                                    { $$ = Node("Yield").append($2); }
    |   T_YIELD expr T_DOUBLE_ARROW expr                { $$ = Node("Yield").append($2).append($4); }
    |   T_YIELD_FROM expr                               { $$ = Node("YieldFrom").append($2); }
;

expr:
        variable                                        { $$ = $1; }
    |   expr_without_variable                           { $$ = $1; }
;

callable_variable:
        simple_variable                                 { $$ = $1; }
;

variable:
        callable_variable                               { $$ = $1; }
;

simple_variable:
        T_VARIABLE                                      { $$ = Node("Variable").attribute("name", $1); }
    |   '$' '{' expr '}'                                { $$ = $3; }
    |   '$' simple_variable                             { $$ = Node("Variable").append($2); }
;

/////////////////////////////////////////////////////////////////////////

%%

const src = `