/*
 * MRustC - Rust Compiler
 * - By John Hodge (Mutabah/thePowersGang)
 *
 * parse/expr.cpp
 * - Expression (i.e. code) parsing
 *
 * Start points:
 * - Parse_ExprBlockNode : Parses a block
 * - Parse_Stmt          : Parse a single statement
 * - Parse_Expr0         : Parse a single expression
 */
// NOTE(review): this file was recovered from a copy in which text between angle
// brackets had been stripped. Template arguments below were reconstructed from how
// each variable is used; spots that could not be fully derived from this file are
// marked with NOTE(review) and should be confirmed against the project headers.
#include "parseerror.hpp"
#include "../ast/ast.hpp"
#include "common.hpp"
#include <cassert>      // assert() is used by Parse_Expr1 and TTLexer::get_output
#include <iostream>     // NOTE(review): presumed original system include (name was lost) - confirm
#include "tokentree.hpp"

using AST::ExprNode;
using AST::ExprNodeP;

/// Take ownership of a freshly allocated node and stamp it with the lexer's current position
static inline ExprNodeP mk_exprnodep(const TokenStream& lex, AST::ExprNode* en)
{
    en->set_pos(lex.getPosition());
    return ExprNodeP(en);
}
/// Allocate a node of `type` and tag it with the position of the in-scope `lex`
#define NEWNODE(type, ...)  mk_exprnodep(lex, new type(__VA_ARGS__))

ExprNodeP Parse_ExprBlockNode(TokenStream& lex);
ExprNodeP Parse_ExprBlockLine(TokenStream& lex, bool *expect_end);
ExprNodeP Parse_Stmt(TokenStream& lex);
ExprNodeP Parse_Expr0(TokenStream& lex);
ExprNodeP Parse_IfStmt(TokenStream& lex);
ExprNodeP Parse_WhileStmt(TokenStream& lex, ::std::string lifetime);
ExprNodeP Parse_ForStmt(TokenStream& lex, ::std::string lifetime);
ExprNodeP Parse_Expr_Match(TokenStream& lex);
ExprNodeP Parse_Expr1(TokenStream& lex);
ExprNodeP Parse_ExprMacro(TokenStream& lex, Token tok);

/// Parse a single expression and wrap it in an AST::Expr
AST::Expr Parse_Expr(TokenStream& lex)
{
    return ::AST::Expr( Parse_Expr0(lex) );
}

/// Parse a braced block and wrap it in an AST::Expr
AST::Expr Parse_ExprBlock(TokenStream& lex)
{
    return ::AST::Expr( Parse_ExprBlockNode(lex) );
}

/// Parse a `{ ... }` block into an ExprNode_Block
///
/// Items declared inside the block are parsed into an anonymous module that is
/// created (on first use) under the current module and handed to the block node.
ExprNodeP Parse_ExprBlockNode(TokenStream& lex)
{
    TRACE_FUNCTION;
    Token   tok;

    ::std::vector<ExprNodeP> nodes;
    // NOTE(review): element type reconstructed from `*local_mod` being passed to Parse_Mod_Item - confirm
    ::std::unique_ptr<AST::Module> local_mod;

    GET_CHECK_TOK(tok, lex, TOK_BRACE_OPEN);

    while( GET_TOK(tok, lex) != TOK_BRACE_CLOSE )
    {
        DEBUG("tok = " << tok);
        // Collect any `#[...]` attributes that precede the item/statement
        AST::MetaItems  item_attrs;
        while( tok.type() == TOK_ATTR_OPEN )
        {
            item_attrs.push_back( Parse_MetaItem(lex) );
            GET_CHECK_TOK(tok, lex, TOK_SQUARE_CLOSE);
            GET_TOK(tok, lex);
        }

        switch(tok.type())
        {
        case TOK_CATTR_OPEN:
            // TODO: Handle `#![` by having a pointer to the parent item (e.g. function)'s attribute list.
            // - For now the attribute is parsed and discarded
            /*node_attrs.push_back(*/ Parse_MetaItem(lex) /*)*/;
            GET_CHECK_TOK(tok, lex, TOK_SQUARE_CLOSE);
            break;
        // Items:
        case TOK_RWORD_PUB:
            // Skip the `pub`; the token that follows it is what gets put back below
            GET_TOK(tok, lex);
            // fall through
        case TOK_RWORD_TYPE:
        case TOK_RWORD_USE:
        case TOK_RWORD_EXTERN:
        case TOK_RWORD_CONST:
        case TOK_RWORD_STATIC:
        case TOK_RWORD_STRUCT:
        case TOK_RWORD_ENUM:
        case TOK_RWORD_TRAIT:
        case TOK_RWORD_IMPL:
        case TOK_RWORD_FN:
        case TOK_RWORD_MOD:
            PUTBACK(tok, lex);
            if( !local_mod ) {
                local_mod = lex.parse_state().get_current_mod().add_anon();
            }
            Parse_Mod_Item(lex, false,"!", *local_mod, false, mv$(item_attrs));
            break;
        // 'unsafe' - Check if the next token isn't a `{`, if so it's an item. Otherwise, fall through
        case TOK_RWORD_UNSAFE:
            if( LOOK_AHEAD(lex) != TOK_BRACE_OPEN )
            {
                PUTBACK(tok, lex);
                if( !local_mod ) {
                    local_mod = lex.parse_state().get_current_mod().add_anon();
                }
                Parse_Mod_Item(lex, false,"!", *local_mod, false, mv$(item_attrs));
                break;
            }
            // fall through (`unsafe { ... }` is handled as a statement)
        default: {
            PUTBACK(tok, lex);
            bool    expect_end = false;
            nodes.push_back(Parse_ExprBlockLine(lex, &expect_end));
            // A null node is produced for a lone `;`
            if( nodes.back() ) {
                nodes.back()->set_attrs( mv$(item_attrs) );
            }
            else {
                // TODO: Error if attribute on void expression?
            }
            // Set to TRUE if there was no semicolon after a statement
            // - In that case the statement must be the last thing in the block
            if( expect_end )
            {
                DEBUG("expect_end == true");
                if( GET_TOK(tok, lex) != TOK_BRACE_CLOSE )
                {
                    throw ParseError::Unexpected(lex, tok, Token(TOK_BRACE_CLOSE));
                }
                PUTBACK(tok, lex);
            }
            break;
            }
        }
    }

    return NEWNODE( AST::ExprNode_Block, ::std::move(nodes), mv$(local_mod) );
}

/// Parse a single line from a block
///
/// Handles:
/// - Block-level constructs (with lifetime annotations)
/// - use/extern/const/let
///
/// Returns a null pointer for an empty statement (a lone `;`).
/// `*expect_end` is set to true when the parsed statement was not followed by a
/// semicolon (it is never reset to false here). `expect_end` must not be null.
ExprNodeP Parse_ExprBlockLine(TokenStream& lex, bool *expect_end)
{
    Token tok;

    if( GET_TOK(tok, lex) == TOK_LIFETIME )
    {
        // Lifetimes can only precede loops... and blocks?
        ::std::string lifetime = tok.str();
        GET_CHECK_TOK(tok, lex, TOK_COLON);

        switch( GET_TOK(tok, lex) )
        {
        case TOK_RWORD_LOOP:
            return NEWNODE( AST::ExprNode_Loop, lifetime, Parse_ExprBlockNode(lex) );
        case TOK_RWORD_WHILE:
            return Parse_WhileStmt(lex, lifetime);
        case TOK_RWORD_FOR:
            return Parse_ForStmt(lex, lifetime);
        // NOTE: The label is not recorded for the following constructs
        case TOK_RWORD_IF:
            return Parse_IfStmt(lex);
        case TOK_RWORD_MATCH:
            return Parse_Expr_Match(lex);
        case TOK_BRACE_OPEN:
            PUTBACK(tok, lex);
            return Parse_ExprBlockNode(lex);

        default:
            throw ParseError::Unexpected(lex, tok);
        }
    }
    else
    {
        switch( tok.type() )
        {
        case TOK_SEMICOLON:
            // Empty statement
            return nullptr;
        case TOK_BRACE_OPEN:
            PUTBACK(tok, lex);
            return Parse_ExprBlockNode(lex);

        // let binding
        case TOK_RWORD_LET: {
            AST::Pattern pat = Parse_Pattern(lex, false);   // irrefutable
            TypeRef type;
            if( GET_TOK(tok, lex) == TOK_COLON ) {
                type = Parse_Type(lex);
                GET_TOK(tok, lex);
            }
            ExprNodeP val;
            if( tok.type() == TOK_EQUAL ) {
                val = Parse_Expr0(lex);
            }
            // NOTE: When there is no `= value`, the token read above is not put back
            return NEWNODE( AST::ExprNode_LetBinding, ::std::move(pat), ::std::move(type), ::std::move(val) );
            }

        // blocks that don't need semicolons
        case TOK_RWORD_LOOP:
            return NEWNODE( AST::ExprNode_Loop, "", Parse_ExprBlockNode(lex) );
        case TOK_RWORD_WHILE:
            return Parse_WhileStmt(lex, "");
        case TOK_RWORD_FOR:
            return Parse_ForStmt(lex, "");
        case TOK_RWORD_IF:
            return Parse_IfStmt(lex);
        case TOK_RWORD_MATCH:
            return Parse_Expr_Match(lex);
        case TOK_RWORD_UNSAFE: {
            auto rv = Parse_ExprBlockNode(lex);
            // Parse_ExprBlockNode always creates an ExprNode_Block
            dynamic_cast<AST::ExprNode_Block&>(*rv).set_unsafe();
            return rv;
            }

        case TOK_MACRO:
            // If a braced macro invocation is the first part of a statement, don't expect a semicolon
            if( LOOK_AHEAD(lex) == TOK_BRACE_OPEN || (lex.lookahead(0) == TOK_IDENT && lex.lookahead(1) == TOK_BRACE_OPEN) ) {
                return Parse_ExprMacro(lex, tok);
            }
            // Fall through to the statement code
        default: {
            PUTBACK(tok, lex);
            auto ret = Parse_Stmt(lex);
            if( GET_TOK(tok, lex) != TOK_SEMICOLON )
            {
                PUTBACK(tok, lex);
                *expect_end = true;
            }
            // Returned by name: locals are moved implicitly
            return ret;
            }
        }
    }
}

/// While loop (either as a statement, or as part of an expression)
// Note: TOK_RWORD_WHILE has already been eaten by the caller
ExprNodeP Parse_WhileStmt(TokenStream& lex, ::std::string lifetime)
{
    Token   tok;

    if( GET_TOK(tok, lex) == TOK_RWORD_LET ) {
        // `while let PAT = EXPR { ... }`
        auto pat = Parse_Pattern(lex, true);    // Refutable pattern
        GET_CHECK_TOK(tok, lex, TOK_EQUAL);
        ExprNodeP val;
        {
            // A `{` after the value starts the loop body, not a struct literal
            SET_PARSE_FLAG(lex, disallow_struct_literal);
            val = Parse_Expr0(lex);
        }
        return NEWNODE( AST::ExprNode_Loop, lifetime, AST::ExprNode_Loop::WHILELET,
            ::std::move(pat), ::std::move(val), Parse_ExprBlockNode(lex) );
    }
    else {
        PUTBACK(tok, lex);
        ExprNodeP cnd;
        {
            SET_PARSE_FLAG(lex, disallow_struct_literal);
            cnd = Parse_Expr1(lex);
        }
        return NEWNODE( AST::ExprNode_Loop, lifetime, ::std::move(cnd), Parse_ExprBlockNode(lex) );
    }
}

/// For loop (either as a statement, or as part of an expression)
// Note: TOK_RWORD_FOR has already been eaten by the caller
ExprNodeP Parse_ForStmt(TokenStream& lex, ::std::string lifetime)
{
    Token   tok;

    // Irrefutable pattern
    AST::Pattern    pat = Parse_Pattern(lex, false);
    GET_CHECK_TOK(tok, lex, TOK_RWORD_IN);
    ExprNodeP val;
    {
        SET_PARSE_FLAG(lex, disallow_struct_literal);
        val = Parse_Expr0(lex);
    }
    return NEWNODE( AST::ExprNode_Loop, lifetime, AST::ExprNode_Loop::FOR,
        ::std::move(pat), ::std::move(val), Parse_ExprBlockNode(lex) );
}

/// Parse an 'if' statement (`if COND {..}`, `if let PAT = VAL {..}`, with optional `else`)
// Note: TOK_RWORD_IF has already been eaten
ExprNodeP Parse_IfStmt(TokenStream& lex)
{
    TRACE_FUNCTION;

    Token   tok;
    ExprNodeP cond;
    AST::Pattern    pat;
    bool if_let = false;

    {
        SET_PARSE_FLAG(lex, disallow_struct_literal);
        if( GET_TOK(tok, lex) == TOK_RWORD_LET ) {
            if_let = true;
            // Refutable pattern
            pat = Parse_Pattern(lex, true);
            GET_CHECK_TOK(tok, lex, TOK_EQUAL);
            cond = Parse_Expr0(lex);
        }
        else {
            PUTBACK(tok, lex);
            cond = Parse_Expr0(lex);
        }
    }

    // Contents
    ExprNodeP code = Parse_ExprBlockNode(lex);

    // Handle else:
    ExprNodeP altcode;
    if( GET_TOK(tok, lex) == TOK_RWORD_ELSE )
    {
        // Recurse for 'else if'
        if( GET_TOK(tok, lex) == TOK_RWORD_IF ) {
            altcode = Parse_IfStmt(lex);
        }
        // - or get block
        else {
            PUTBACK(tok, lex);
            altcode = Parse_ExprBlockNode(lex);
        }
    }
    // - or nothing
    else {
        PUTBACK(tok, lex);
    }

    if( if_let )
        return NEWNODE( AST::ExprNode_IfLet, ::std::move(pat), ::std::move(cond), ::std::move(code), ::std::move(altcode) );
    else
        return NEWNODE( AST::ExprNode_If, ::std::move(cond), ::std::move(code), ::std::move(altcode) );
}

/// "match" block
// Note: TOK_RWORD_MATCH has already been eaten by the caller
ExprNodeP Parse_Expr_Match(TokenStream& lex)
{
    TRACE_FUNCTION;
    Token tok;

    // Struct literals are permitted inside the arms
    CLEAR_PARSE_FLAG(lex, disallow_struct_literal);
    // 1. Get expression
    ExprNodeP   switch_val;
    {
        // - but not in the matched value, where `{` opens the arm list
        SET_PARSE_FLAG(lex, disallow_struct_literal);
        switch_val = Parse_Expr1(lex);
    }
    //ASSERT(lex, !CHECK_PARSE_FLAG(lex, disallow_struct_literal) );
    GET_CHECK_TOK(tok, lex, TOK_BRACE_OPEN);

    // 2. Get arms
    ::std::vector< AST::ExprNode_Match_Arm >    arms;
    do {
        if( GET_TOK(tok, lex) == TOK_BRACE_CLOSE )
            break;
        PUTBACK(tok, lex);
        AST::ExprNode_Match_Arm arm;

        // Attributes on the arm
        ::AST::MetaItems arm_attrs;
        while( LOOK_AHEAD(lex) == TOK_ATTR_OPEN ) {
            GET_TOK(tok, lex);
            arm_attrs.push_back( Parse_MetaItem(lex) );
            GET_CHECK_TOK(tok, lex, TOK_SQUARE_CLOSE);
        }
        arm.m_attrs = mv$(arm_attrs);

        // One or more `|`-separated patterns
        do {
            // Refutable pattern
            arm.m_patterns.push_back( Parse_Pattern(lex, true) );
        } while( GET_TOK(tok, lex) == TOK_PIPE );

        // Optional guard
        if( tok.type() == TOK_RWORD_IF )
        {
            arm.m_cond = Parse_Expr1(lex);
            GET_TOK(tok, lex);
        }
        CHECK_TOK(tok, TOK_FATARROW);

        arm.m_code = Parse_Stmt(lex);

        arms.push_back( ::std::move(arm) );

        // The comma after an arm is optional; the loop only exits on `}`
        if( GET_TOK(tok, lex) == TOK_COMMA )
            continue;
        PUTBACK(tok, lex);

    } while( 1 );
    CHECK_TOK(tok, TOK_BRACE_CLOSE);

    return NEWNODE( AST::ExprNode_Match, ::std::move(switch_val), ::std::move(arms) );
}

/// Parses the 'stmt' fragment specifier
/// - Flow control
/// - Expressions
ExprNodeP Parse_Stmt(TokenStream& lex)
{
    TRACE_FUNCTION;
    Token   tok;

    switch(GET_TOK(tok, lex))
    {
    case TOK_RWORD_RETURN: {
        ExprNodeP   val;
        // A terminator directly after `return` means there is no value
        switch(LOOK_AHEAD(lex))
        {
        case TOK_SEMICOLON:
        case TOK_COMMA:
        case TOK_BRACE_CLOSE:
        case TOK_PAREN_CLOSE:
        case TOK_SQUARE_CLOSE:
            break;
        default:
            val = Parse_Expr1(lex);
            break;
        }
        return NEWNODE( AST::ExprNode_Flow, AST::ExprNode_Flow::RETURN, "", ::std::move(val) );
        }
    case TOK_RWORD_CONTINUE:
    case TOK_RWORD_BREAK:
        {
        AST::ExprNode_Flow::Type    type;
        switch(tok.type())
        {
        case TOK_RWORD_CONTINUE: type = AST::ExprNode_Flow::CONTINUE; break;
        case TOK_RWORD_BREAK:    type = AST::ExprNode_Flow::BREAK;    break;
        default:    throw ParseError::BugCheck(/*lex,*/ "continue/break");
        }
        // Optional target label
        ::std::string   lifetime;
        if( GET_TOK(tok, lex) == TOK_LIFETIME )
        {
            lifetime = tok.str();
            GET_TOK(tok, lex);
        }
        // Optional value (absent if a terminator or `{` follows)
        ExprNodeP   val;
        switch(tok.type())
        {
        case TOK_SEMICOLON:
        case TOK_COMMA:
        case TOK_BRACE_OPEN:
        case TOK_BRACE_CLOSE:
        case TOK_PAREN_CLOSE:
        case TOK_SQUARE_CLOSE:
            PUTBACK(tok, lex);
            break;
        default:
            PUTBACK(tok, lex);
            val = Parse_Expr1(lex);
            break;
        }
        return NEWNODE( AST::ExprNode_Flow, type, lifetime, ::std::move(val) );
        }
    case TOK_BRACE_OPEN:
        PUTBACK(tok, lex);
        return Parse_ExprBlockNode(lex);
    default:
        PUTBACK(tok, lex);
        return Parse_Expr0(lex);
    }
}

/// Parse a parenthesised, comma-separated list of values (call arguments)
///
/// A trailing comma before the closing parenthesis is accepted.
::std::vector<ExprNodeP> Parse_ParenList(TokenStream& lex)
{
    TRACE_FUNCTION;
    Token   tok;

    CLEAR_PARSE_FLAG(lex, disallow_struct_literal);

    ::std::vector<ExprNodeP> rv;
    GET_CHECK_TOK(tok, lex, TOK_PAREN_OPEN);
    if( GET_TOK(tok, lex) != TOK_PAREN_CLOSE )
    {
        PUTBACK(tok, lex);
        do {
            // Trailing comma
            if( LOOK_AHEAD(lex) == TOK_PAREN_CLOSE ) {
                GET_TOK(tok, lex);
                break;
            }
            rv.push_back( Parse_Stmt(lex) );
        } while( GET_TOK(tok, lex) == TOK_COMMA );
        CHECK_TOK(tok, TOK_PAREN_CLOSE);
    }
    return rv;
}

// 0: Assign
/// Parse an expression, including (compound) assignment and leading attributes
///
/// Assignment recurses on its right-hand side, so `a = b = c` groups as `a = (b = c)`.
ExprNodeP Parse_Expr0(TokenStream& lex)
{
    //TRACE_FUNCTION;
    Token tok;

    ::AST::MetaItems  expr_attrs;
    while( LOOK_AHEAD(lex) == TOK_ATTR_OPEN )
    {
        GET_TOK(tok, lex);
        expr_attrs.push_back( Parse_MetaItem(lex) );
        GET_CHECK_TOK(tok, lex, TOK_SQUARE_CLOSE);
    }

    ExprNodeP rv = Parse_Expr1(lex);

    // Select the assignment operation, or return the value as-is if there is none
    auto op = AST::ExprNode_Assign::NONE;
    switch( GET_TOK(tok, lex) )
    {
    case TOK_PLUS_EQUAL:        op = AST::ExprNode_Assign::ADD;  break;
    case TOK_DASH_EQUAL:        op = AST::ExprNode_Assign::SUB;  break;
    case TOK_STAR_EQUAL:        op = AST::ExprNode_Assign::MUL;  break;
    case TOK_SLASH_EQUAL:       op = AST::ExprNode_Assign::DIV;  break;
    case TOK_PERCENT_EQUAL:     op = AST::ExprNode_Assign::MOD;  break;
    case TOK_AMP_EQUAL:         op = AST::ExprNode_Assign::AND;  break;
    case TOK_PIPE_EQUAL:        op = AST::ExprNode_Assign::OR ;  break;
    case TOK_CARET_EQUAL:       op = AST::ExprNode_Assign::XOR;  break;
    case TOK_DOUBLE_GT_EQUAL:   op = AST::ExprNode_Assign::SHR;  break;
    case TOK_DOUBLE_LT_EQUAL:   op = AST::ExprNode_Assign::SHL;  break;
    case TOK_EQUAL:             op = AST::ExprNode_Assign::NONE; break;
    default:
        PUTBACK(tok, lex);
        rv->set_attrs(mv$(expr_attrs));
        return rv;
    }

    rv = NEWNODE( AST::ExprNode_Assign, op, ::std::move(rv), Parse_Expr0(lex) );
    rv->set_attrs(mv$(expr_attrs));
    return rv;
}

/// Define a parser `cur` for one level of left-associative binary operators
///
/// - `_next` is the parser for the next (tighter-binding) level; it is forward-declared here
/// - `cases` are the `case TOK_...:` arms, each of which folds `rv` into a new node and `break`s
#define LEFTASSOC(cur, _next, cases) \
ExprNodeP _next(TokenStream& lex); \
ExprNodeP cur(TokenStream& lex) \
{ \
    ExprNodeP (*next)(TokenStream&) = _next;\
    ExprNodeP rv = next(lex); \
    while(true) \
    { \
        Token   tok; \
        switch((tok = lex.getToken()).type()) \
        { \
        cases \
        default: \
            /*::std::cout << "<<" << #cur << ::std::endl; */\
            PUTBACK(tok, lex); \
            return rv; \
        } \
    } \
}

/// Check if a token type is one of those that Parse_Expr1 treats as starting the right-hand value of `..`
bool Parse_IsTokValue(eTokenType tok_type)
{
    switch( tok_type )
    {
    case TOK_DOUBLE_COLON:
    case TOK_IDENT:
    case TOK_INTEGER:
    case TOK_FLOAT:
    case TOK_STRING:
    case TOK_RWORD_TRUE:
    case TOK_RWORD_FALSE:
    case TOK_RWORD_SELF:
    case TOK_RWORD_SUPER:
    case TOK_RWORD_BOX:
    case TOK_RWORD_IN:
    case TOK_PAREN_OPEN:

    case TOK_MACRO:

    case TOK_PIPE:
    case TOK_EXCLAM:
    case TOK_DASH:
    case TOK_STAR:
    case TOK_AMP:
        return true;
    default:
        return false;
    }
}

ExprNodeP Parse_Expr1_1(TokenStream& lex);
// Very evil handling for '..'
/// Parse a range expression, or fall through to the next level if there is no range
///
/// Handles `...b`, `..`, `..b`, `a..` and `a..b`; missing ends are left as null.
ExprNodeP Parse_Expr1(TokenStream& lex)
{
    Token   tok;
    ExprNodeP (*next)(TokenStream&) = Parse_Expr1_1;
    ExprNodeP   left, right;

    // Inclusive range to a value
    if( GET_TOK(tok, lex) == TOK_TRIPLE_DOT ) {
        right = next(lex);
        return NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::RANGE_INC, nullptr, mv$(right) );
    }
    else {
        PUTBACK(tok, lex);
    }

    // Exclusive ranges
    // - If the expression doesn't start with `..`, parse a leading value
    if( GET_TOK(tok, lex) != TOK_DOUBLE_DOT )
    {
        PUTBACK(tok, lex);

        left = next(lex);

        // - If the value isn't followed by `..`, return the value
        if( GET_TOK(tok, lex) != TOK_DOUBLE_DOT )
        {
            PUTBACK(tok, lex);
            return left;
        }
    }
    assert( tok.type() == TOK_DOUBLE_DOT );
    // If the next token is part of a value, parse that value
    if( Parse_IsTokValue( LOOK_AHEAD(lex) ) )
    {
        right = next(lex);
    }
    else
    {
        // Otherwise, leave `right` as nullptr
    }

    return NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::RANGE, ::std::move(left), ::std::move(right) );
}
// TODO: Is this left associative?
LEFTASSOC(Parse_Expr1_1, Parse_Expr1_5,
    case TOK_TRIPLE_DOT:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::RANGE_INC, mv$(rv), next(lex) );
        break;
)
// 1: Bool OR
LEFTASSOC(Parse_Expr1_5, Parse_Expr2,
    case TOK_DOUBLE_PIPE:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::BOOLOR, ::std::move(rv), next(lex));
        break;
)
// 2: Bool AND
LEFTASSOC(Parse_Expr2, Parse_Expr3,
    case TOK_DOUBLE_AMP:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::BOOLAND, ::std::move(rv), next(lex));
        break;
)
// 3: (In)Equality
LEFTASSOC(Parse_Expr3, Parse_Expr4,
    case TOK_DOUBLE_EQUAL:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::CMPEQU, ::std::move(rv), next(lex));
        break;
    case TOK_EXCLAM_EQUAL:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::CMPNEQU, ::std::move(rv), next(lex));
        break;
)
// 4: Comparisons
LEFTASSOC(Parse_Expr4, Parse_Expr5,
    case TOK_LT:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::CMPLT, ::std::move(rv), next(lex));
        break;
    case TOK_GT:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::CMPGT, ::std::move(rv), next(lex));
        break;
    case TOK_LTE:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::CMPLTE, ::std::move(rv), next(lex));
        break;
    case TOK_GTE:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::CMPGTE, ::std::move(rv), next(lex));
        break;
)
// 5: Bit OR
LEFTASSOC(Parse_Expr5, Parse_Expr6,
    case TOK_PIPE:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::BITOR, ::std::move(rv), next(lex));
        break;
)
// 6: Bit XOR
LEFTASSOC(Parse_Expr6, Parse_Expr7,
    case TOK_CARET:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::BITXOR, ::std::move(rv), next(lex));
        break;
)
// 7: Bit AND
LEFTASSOC(Parse_Expr7, Parse_Expr8,
    case TOK_AMP:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::BITAND, ::std::move(rv), next(lex));
        break;
)
// 8: Bit Shifts
LEFTASSOC(Parse_Expr8, Parse_Expr9,
    case TOK_DOUBLE_LT:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::SHL, ::std::move(rv), next(lex));
        break;
    case TOK_DOUBLE_GT:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::SHR, ::std::move(rv), next(lex));
        break;
)
// 9: Add / Subtract
LEFTASSOC(Parse_Expr9, Parse_Expr10,
    case TOK_PLUS:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::ADD, ::std::move(rv), next(lex));
        break;
    case TOK_DASH:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::SUB, ::std::move(rv), next(lex));
        break;
)
// 10: Times / Divide / Modulo
LEFTASSOC(Parse_Expr10, Parse_Expr11,
    case TOK_STAR:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::MULTIPLY, ::std::move(rv), next(lex));
        break;
    case TOK_SLASH:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::DIVIDE, ::std::move(rv), next(lex));
        break;
    case TOK_PERCENT:
        rv = NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::MODULO, ::std::move(rv), next(lex));
        break;
)
// 11: Cast
LEFTASSOC(Parse_Expr11, Parse_Expr12,
    case TOK_RWORD_AS:
        rv = NEWNODE( AST::ExprNode_Cast, ::std::move(rv), Parse_Type(lex) );
        break;
)
// 12: Type Ascription
ExprNodeP Parse_Expr13(TokenStream& lex);
/// Parse a value with an optional `: Type` suffix, which is stored as the node's result type
ExprNodeP Parse_Expr12(TokenStream& lex)
{
    Token   tok;
    auto rv = Parse_Expr13(lex);
    if(GET_TOK(tok, lex) == TOK_COLON)
    {
        rv->get_res_type() = Parse_Type(lex);
    }
    else
    {
        PUTBACK(tok, lex);
    }
    return rv;
}
// 13: Unaries
ExprNodeP Parse_ExprFC(TokenStream& lex);
/// Parse prefix operators: `-`, `!`, `*`, `box`, `in PLACE { .. }`, `&` and `&mut`
ExprNodeP Parse_Expr13(TokenStream& lex)
{
    Token   tok;
    switch(GET_TOK(tok, lex))
    {
    case TOK_DASH:
        return NEWNODE( AST::ExprNode_UniOp, AST::ExprNode_UniOp::NEGATE, Parse_Expr12(lex) );
    case TOK_EXCLAM:
        return NEWNODE( AST::ExprNode_UniOp, AST::ExprNode_UniOp::INVERT, Parse_Expr12(lex) );
    case TOK_STAR:
        return NEWNODE( AST::ExprNode_Deref, Parse_Expr12(lex) );
    case TOK_RWORD_BOX:
        return NEWNODE( AST::ExprNode_UniOp, AST::ExprNode_UniOp::BOX, Parse_Expr12(lex) );
    case TOK_RWORD_IN: {
        ExprNodeP   dest;
        {
            // The `{` after the destination starts the value block
            SET_PARSE_FLAG(lex, disallow_struct_literal);
            dest = Parse_Expr1(lex);
        }
        auto val = Parse_ExprBlockNode(lex);
        return NEWNODE( AST::ExprNode_BinOp, AST::ExprNode_BinOp::PLACE_IN, mv$(dest), mv$(val));
        }
    case TOK_DOUBLE_AMP:
        // HACK: Split && into & &
        lex.putback( Token(TOK_AMP) );
        // fall through (the first `&` is handled here, the second was put back)
    case TOK_AMP:
        if( GET_TOK(tok, lex) == TOK_RWORD_MUT )
            return NEWNODE( AST::ExprNode_UniOp, AST::ExprNode_UniOp::REFMUT, Parse_Expr12(lex) );
        else {
            PUTBACK(tok, lex);
            return NEWNODE( AST::ExprNode_UniOp, AST::ExprNode_UniOp::REF, Parse_Expr12(lex) );
        }
    default:
        PUTBACK(tok, lex);
        return Parse_ExprFC(lex);
    }
}

ExprNodeP Parse_ExprVal(TokenStream& lex);

/// Parse a value followed by any number of postfix operations
/// (`?`, call, index, field access and method call)
ExprNodeP Parse_ExprFC(TokenStream& lex)
{
    ExprNodeP   val = Parse_ExprVal(lex);

    while(true)
    {
        Token   tok;
        switch(GET_TOK(tok, lex))
        {
        case TOK_QMARK:
            val = NEWNODE( AST::ExprNode_UniOp, AST::ExprNode_UniOp::QMARK, mv$(val) );
            break;

        case TOK_PAREN_OPEN:
            // Expression method call
            PUTBACK(tok, lex);
            val = NEWNODE( AST::ExprNode_CallObject, ::std::move(val), Parse_ParenList(lex) );
            break;
        case TOK_SQUARE_OPEN:
            val = NEWNODE( AST::ExprNode_Index, ::std::move(val), Parse_Expr0(lex) );
            GET_CHECK_TOK(tok, lex, TOK_SQUARE_CLOSE);
            break;
        case TOK_DOT:
            // Field access / method call
            switch(GET_TOK(tok, lex))
            {
            case TOK_IDENT: {
                AST::PathNode   path(tok.str(), {});
                switch( GET_TOK(tok, lex) )
                {
                case TOK_PAREN_OPEN:
                    PUTBACK(tok, lex);
                    val = NEWNODE( AST::ExprNode_CallMethod, ::std::move(val), ::std::move(path), Parse_ParenList(lex) );
                    break;
                case TOK_DOUBLE_COLON:
                    // Explicit generic arguments on the method (`.name::<...>(...)`)
                    GET_CHECK_TOK(tok, lex, TOK_LT);
                    path.args() = Parse_Path_GenericList(lex);
                    val = NEWNODE( AST::ExprNode_CallMethod, ::std::move(val), ::std::move(path), Parse_ParenList(lex) );
                    break;
                default:
                    val = NEWNODE( AST::ExprNode_Field, ::std::move(val), ::std::string(path.name()) );
                    PUTBACK(tok, lex);
                    break;
                }
                break; }
            case TOK_INTEGER:
                // Tuple index, stored as a field named after the formatted integer
                val = NEWNODE( AST::ExprNode_Field, ::std::move(val), FMT(tok.intval()) );
                break;
            default:
                throw ParseError::Unexpected(lex, mv$(tok));
            }
            break;
        default:
            PUTBACK(tok, lex);
            return val;
        }
    }
}

/// Parse the body of a braced structure literal
// Note: The opening brace has already been eaten by the caller
ExprNodeP Parse_ExprVal_StructLiteral(TokenStream& lex, AST::Path path)
{
    TRACE_FUNCTION;
    Token   tok;

    // Braced structure literal
    // - A series of 0 or more `name: value` pairs separated by commas
    // - Optionally followed by `..` and a base value
    // NOTE(review): pointer element type reconstructed from ExprNodeP values being stored - confirm
    ::std::vector< ::std::pair< ::std::string, ::std::unique_ptr<AST::ExprNode> > >  items;
    while( GET_TOK(tok, lex) == TOK_IDENT )
    {
        ::std::string   name = tok.str();
        GET_CHECK_TOK(tok, lex, TOK_COLON);
        ExprNodeP   val = Parse_Stmt(lex);
        items.push_back( ::std::make_pair(::std::move(name), ::std::move(val)) );
        if( GET_TOK(tok,lex) == TOK_BRACE_CLOSE )
            break;
        CHECK_TOK(tok, TOK_COMMA);
    }
    ExprNodeP   base_val;
    if( tok.type() == TOK_DOUBLE_DOT )
    {
        // default
        base_val = Parse_Expr0(lex);
        GET_TOK(tok, lex);
    }
    CHECK_TOK(tok, TOK_BRACE_CLOSE);

    return NEWNODE( AST::ExprNode_StructLiteral, path, ::std::move(base_val), ::std::move(items) );
}

/// Parse a closure's argument list, optional return type, and body
// Note: The opening `|` has already been eaten by the caller
// TODO: `is_move` is currently not recorded in the node
ExprNodeP Parse_ExprVal_Closure(TokenStream& lex, bool is_move)
{
    TRACE_FUNCTION;
    Token   tok;

    ::std::vector< ::std::pair<AST::Pattern, TypeRef> > args;

    while( GET_TOK(tok, lex) != TOK_PIPE )
    {
        PUTBACK(tok, lex);
        // Irrefutable pattern
        AST::Pattern    pat = Parse_Pattern(lex, false);

        // Optional type annotation
        TypeRef type;
        if( GET_TOK(tok, lex) == TOK_COLON )
            type = Parse_Type(lex);
        else
            PUTBACK(tok, lex);

        args.push_back( ::std::make_pair( ::std::move(pat), ::std::move(type) ) );

        if( GET_TOK(tok, lex) != TOK_COMMA )
            break;
    }
    CHECK_TOK(tok, TOK_PIPE);

    // Optional return type (`-> !` is stored as an invalid type)
    TypeRef rt;
    if( GET_TOK(tok, lex) == TOK_THINARROW ) {

        if( GET_TOK(tok, lex) == TOK_EXCLAM ) {
            rt = TypeRef(TypeRef::TagInvalid(), Span(tok.get_pos()));
        }
        else {
            PUTBACK(tok, lex);
            rt = Parse_Type(lex);
        }
    }
    else
        PUTBACK(tok, lex);

    auto code = Parse_Expr0(lex);

    return NEWNODE( AST::ExprNode_Closure, ::std::move(args), ::std::move(rt), ::std::move(code) );
}

/// Parse the arguments of `format_args!`
///
/// TODO: This is a stub. The arguments are parsed and thrown away, and an empty tuple is returned.
ExprNodeP Parse_FormatArgs(TokenStream& lex)
{
    TRACE_FUNCTION;

    Token   tok;

    GET_CHECK_TOK(tok, lex, TOK_STRING);
    ::std::string fmt = tok.str();

    ::std::vector<ExprNodeP> nodes;

    // NOTE: The token that ends this loop is consumed and not put back
    while( GET_TOK(tok, lex) == TOK_COMMA )
    {
        // TODO: Support named
        auto exp = NEWNODE( AST::ExprNode_UniOp, AST::ExprNode_UniOp::REF, Parse_Expr1(lex) );

        // ( &arg as *const _, &::fmt as fn(*const (), &mut Formatter) )
        //nodes.push_back( NEWNODE( AST::ExprNode_Cast, TypeRef
    }

    //return NEWNODE( AST::ExprNode_ArrayLiteral, ::std::move(nodes) );
    DEBUG("TODO: Proper support for format_args!");
    return NEWNODE( AST::ExprNode_Tuple, ::std::vector<ExprNodeP>() );
}

/// Parse a primary value: block, literal, path/call/struct literal, closure,
/// tuple, array, flow-control expression or macro invocation
ExprNodeP Parse_ExprVal(TokenStream& lex)
{
    TRACE_FUNCTION;

    Token   tok;
    AST::Path   path;
    switch( GET_TOK(tok, lex) )
    {
    case TOK_BRACE_OPEN:
        PUTBACK(tok, lex);
        return Parse_ExprBlockNode(lex);

    case TOK_INTERPOLATED_EXPR:
        return tok.take_frag_node();

    // TODO: Return/break/continue/... here?
    case TOK_RWORD_RETURN:
    case TOK_RWORD_CONTINUE:
    case TOK_RWORD_BREAK:
        PUTBACK(tok, lex);
        return Parse_Stmt(lex);

    case TOK_RWORD_LOOP:
        return NEWNODE( AST::ExprNode_Loop, "", Parse_ExprBlockNode(lex) );
    case TOK_RWORD_WHILE:
        return Parse_WhileStmt(lex, "");
    case TOK_RWORD_FOR:
        return Parse_ForStmt(lex, "");
    case TOK_RWORD_MATCH:
        return Parse_Expr_Match(lex);
    case TOK_RWORD_IF:
        return Parse_IfStmt(lex);
    case TOK_RWORD_UNSAFE: {
        auto rv = Parse_ExprBlockNode(lex);
        // Parse_ExprBlockNode always creates an ExprNode_Block
        dynamic_cast<AST::ExprNode_Block&>(*rv).set_unsafe();
        return rv;
        }

    // Paths:
    // Each of the following cases fills `path` and then skips (via `if(0)`) the
    // bodies of the cases after it, ending up at the shared `switch` on the next token.
    // UFCS
    case TOK_DOUBLE_LT:
        PUTBACK(tok, lex);
        // fall through
    case TOK_LT: {
        TypeRef ty = Parse_Type(lex);
        if( GET_TOK(tok, lex) == TOK_RWORD_AS ) {
            auto trait = Parse_Path(lex, PATH_GENERIC_TYPE);
            GET_CHECK_TOK(tok, lex, TOK_GT);
            GET_CHECK_TOK(tok, lex, TOK_DOUBLE_COLON);
            path = AST::Path(AST::Path::TagUfcs(), ty, trait, Parse_PathNodes(lex, PATH_GENERIC_EXPR));
        }
        else {
            PUTBACK(tok, lex);
            GET_CHECK_TOK(tok, lex, TOK_GT);
            // TODO: Terminating the "path" here is sometimes valid
            GET_CHECK_TOK(tok, lex, TOK_DOUBLE_COLON);
            path = AST::Path(AST::Path::TagUfcs(), ty, Parse_PathNodes(lex, PATH_GENERIC_EXPR));
        }
        }
        if(0)
    case TOK_RWORD_SELF:
        {
            // A bare `self` is a local value, `self::...` is a path
            if( LOOK_AHEAD(lex) != TOK_DOUBLE_COLON ) {
                return NEWNODE( AST::ExprNode_NamedValue, AST::Path(AST::Path::TagLocal(), "self") );
            }
            else
            {
                PUTBACK(tok, lex);
                path = Parse_Path(lex, PATH_GENERIC_EXPR);
            }
        }
        if(0)
    case TOK_RWORD_SUPER:
        {
            PUTBACK(tok, lex);
            path = Parse_Path(lex, PATH_GENERIC_EXPR);
        }
        if(0)
    case TOK_IDENT:
        // Get path
        {
            PUTBACK(tok, lex);
            path = Parse_Path(lex, false, PATH_GENERIC_EXPR);
        }
        if(0)
    case TOK_INTERPOLATED_PATH:
        {
            path = mv$(tok.frag_path());
        }
        if(0)
    case TOK_DOUBLE_COLON:
        path = Parse_Path(lex, true, PATH_GENERIC_EXPR);
        // Shared tail: decide what the path is being used for
        switch( GET_TOK(tok, lex) )
        {
        case TOK_PAREN_OPEN:
            // Function call
            PUTBACK(tok, lex);
            return NEWNODE( AST::ExprNode_CallPath, ::std::move(path), Parse_ParenList(lex) );
        case TOK_BRACE_OPEN:
            if( !CHECK_PARSE_FLAG(lex, disallow_struct_literal) )
                return Parse_ExprVal_StructLiteral(lex, ::std::move(path));
            else {
                DEBUG("Not parsing struct literal");
            }
            // fall through (the `{` belongs to an enclosing construct)
        default:
            // Value
            PUTBACK(tok, lex);
            return NEWNODE( AST::ExprNode_NamedValue, ::std::move(path) );
        }
    case TOK_RWORD_MOVE:
        // TODO: Annotate closure as move
        GET_TOK(tok, lex);
        if( tok.type() == TOK_DOUBLE_PIPE ) {
            // `||` is an empty argument list: re-insert the closing `|`
            lex.putback(Token(TOK_PIPE));
        }
        else {
            // Anything other than `|` is an error
            CHECK_TOK(tok, TOK_PIPE);
        }
        return Parse_ExprVal_Closure(lex, true);
    case TOK_DOUBLE_PIPE:
        // `||` is an empty argument list: re-insert the closing `|`
        lex.putback(Token(TOK_PIPE));
        // fall through
    case TOK_PIPE:
        return Parse_ExprVal_Closure(lex, false);
    case TOK_INTEGER:
        return NEWNODE( AST::ExprNode_Integer, tok.intval(), tok.datatype() );
    case TOK_FLOAT:
        return NEWNODE( AST::ExprNode_Float, tok.floatval(), tok.datatype() );
    case TOK_STRING:
        return NEWNODE( AST::ExprNode_String, tok.str() );
    case TOK_BYTESTRING:
        return NEWNODE( AST::ExprNode_ByteString, tok.str() );
    case TOK_RWORD_TRUE:
        return NEWNODE( AST::ExprNode_Bool, true );
    case TOK_RWORD_FALSE:
        return NEWNODE( AST::ExprNode_Bool, false );
    case TOK_PAREN_OPEN:
        if( GET_TOK(tok, lex) == TOK_PAREN_CLOSE )
        {
            DEBUG("Unit");
            return NEWNODE( AST::ExprNode_Tuple, ::std::vector<ExprNodeP>() );
        }
        else
        {
            CLEAR_PARSE_FLAG(lex, disallow_struct_literal);
            PUTBACK(tok, lex);

            ExprNodeP rv = Parse_Expr0(lex);
            // A comma after the first value makes this a tuple (trailing comma accepted)
            if( GET_TOK(tok, lex) == TOK_COMMA ) {
                ::std::vector<ExprNodeP> ents;
                ents.push_back( ::std::move(rv) );
                do {
                    if( GET_TOK(tok, lex) == TOK_PAREN_CLOSE )
                        break;
                    PUTBACK(tok, lex);
                    ents.push_back( Parse_Expr0(lex) );
                } while( GET_TOK(tok, lex) == TOK_COMMA );
                rv = NEWNODE( AST::ExprNode_Tuple, ::std::move(ents) );
            }
            CHECK_TOK(tok, TOK_PAREN_CLOSE);
            return rv;
        }
    case TOK_SQUARE_OPEN:
        if( GET_TOK(tok, lex) == TOK_SQUARE_CLOSE )
        {
            // Empty literal
            return NEWNODE( AST::ExprNode_Array, ::std::vector<ExprNodeP>() );
        }
        else
        {
            PUTBACK(tok, lex);
            auto first = Parse_Expr0(lex);
            if( GET_TOK(tok, lex) == TOK_SEMICOLON )
            {
                // Repetition: `[value; count]`
                auto count = Parse_Expr0(lex);
                GET_CHECK_TOK(tok, lex, TOK_SQUARE_CLOSE);
                return NEWNODE( AST::ExprNode_Array, ::std::move(first), ::std::move(count) );
            }
            else
            {
                // List of values (trailing comma accepted)
                ::std::vector<ExprNodeP> items;
                items.push_back( ::std::move(first) );
                while( tok.type() == TOK_COMMA )
                {
                    if( GET_TOK(tok, lex) == TOK_SQUARE_CLOSE )
                        break;
                    else
                        PUTBACK(tok, lex);
                    items.push_back( Parse_Expr0(lex) );
                    GET_TOK(tok, lex);
                }
                CHECK_TOK(tok, TOK_SQUARE_CLOSE);
                return NEWNODE( AST::ExprNode_Array, ::std::move(items) );
            }
        }
        // Not reachable: every path above returns or throws
        throw ParseError::BugCheck(lex, "Array literal fell");
    case TOK_MACRO:
        return Parse_ExprMacro(lex, mv$(tok));
    default:
        throw ParseError::Unexpected(lex, tok);
    }
}

/// Parse a macro invocation: optional identifier, then a delimited token tree
///
/// `tok` is the already-consumed TOK_MACRO token, which carries the macro's name.
ExprNodeP Parse_ExprMacro(TokenStream& lex, Token tok)
{
    ::std::string name = tok.str();
    ::std::string ident;
    if( GET_TOK(tok, lex) == TOK_IDENT ) {
        ident = mv$(tok.str());
    }
    else {
        PUTBACK(tok, lex);
    }
    TokenTree tt = Parse_TT(lex, true);
    // The arguments must be a delimited group, not a single token
    if( tt.is_token() ) {
        throw ParseError::Unexpected(lex, tt.tok());
    }
    return NEWNODE(AST::ExprNode_Macro, mv$(name), mv$(ident), mv$(tt));
}

// Token Tree Parsing
/// Parse a token tree: either a single token, or a delimited group of token trees
///
/// If `unwrapped` is true, the opening and closing delimiters are left out of the result.
/// NOTE: Reaching TOK_EOF inside a group ends the group without raising an error.
TokenTree Parse_TT(TokenStream& lex, bool unwrapped)
{
    TRACE_FUNCTION;

    Token tok = lex.getToken();
    eTokenType  closer = TOK_PAREN_CLOSE;
    switch(tok.type())
    {
    case TOK_PAREN_OPEN:
        closer = TOK_PAREN_CLOSE;
        break;
    case TOK_SQUARE_OPEN:
        closer = TOK_SQUARE_CLOSE;
        break;
    case TOK_BRACE_OPEN:
        closer = TOK_BRACE_CLOSE;
        break;

    case TOK_EOF:
    case TOK_NULL:
        throw ParseError::Unexpected(lex, tok);
    default:
        // Not a delimiter: the tree is just this token
        return TokenTree( mv$(tok) );
    }

    ::std::vector<TokenTree>    items;
    if( !unwrapped )
        items.push_back( mv$(tok) );
    while(GET_TOK(tok, lex) != closer && tok.type() != TOK_EOF)
    {
        if( tok.type() == TOK_NULL )
            throw ParseError::Unexpected(lex, tok);
        PUTBACK(tok, lex);
        items.push_back(Parse_TT(lex, false));
    }
    if( !unwrapped )
        items.push_back( mv$(tok) );
    return TokenTree(mv$(items));
}

/// A wrapping lexer that records every token it pulls from the wrapped stream,
/// so the tokens consumed by a sub-parser can be returned as a token tree
class TTLexer:
    public TokenStream
{
    TokenStream&    m_input;
    Token   m_last_token;
    ::std::vector<TokenTree>    m_output;
public:
    TTLexer(TokenStream& input):
        m_input(input)
    {
    }

    virtual Position getPosition() const override { return m_input.getPosition(); }
    /// Fetch a token from the wrapped stream and record it
    virtual Token realGetToken() override {
        Token tok = m_input.getToken();
        m_output.push_back( TokenTree(tok) );
        return tok;
    }

    /// Return the recorded tokens, minus those that were fetched but not consumed
    ///
    /// Tokens still sitting in this lexer's cache/lookahead are handed back to the
    /// wrapped stream's lookahead and removed from the output.
    TokenTree   get_output() {
        unsigned int eat = (TokenStream::m_cache_valid ? 1 : 0) + TokenStream::m_lookahead.size();
        DEBUG(eat << " tokens were not consumed");
        assert( m_output.size() >= eat );
        // The wrapped stream must not have buffered tokens of its own
        assert( m_input.m_lookahead.size() == 0 );
        assert( m_input.m_cache_valid == false );
        for( unsigned int i = 0; i < eat; i ++ )
        {
            Token tok = m_output[ m_output.size() - eat + i ].tok();
            DEBUG("Unconsume " << tok);
            m_input.m_lookahead.push_back( tok );
        }
        DEBUG("- output was [" << m_output << "]");
        m_output.erase( m_output.end() - eat, m_output.end() );
        DEBUG("Returning [" << m_output << "]");
        return ::std::move(m_output);
    }
};

/// Parse a type, returning the tokens it was made of
TokenTree Parse_TT_Type(TokenStream& lex)
{
    TRACE_FUNCTION;
    TTLexer wlex(lex);
    SET_PARSE_FLAG(wlex, no_expand_macros);

    // discard result
    Parse_Type(wlex);

    return wlex.get_output();
}

/// Parse a token tree path
TokenTree Parse_TT_Path(TokenStream& lex, bool mode_expr)
{
    TRACE_FUNCTION;
    TTLexer wlex(lex);
    SET_PARSE_FLAG(wlex, no_expand_macros);

    Token   tok;

    if( GET_TOK(tok, wlex) == TOK_DOUBLE_COLON ) {
        Parse_Path(wlex, true, (mode_expr ? PATH_GENERIC_EXPR : PATH_GENERIC_TYPE));
    }
    else {
        // The token was read through (and recorded by) `wlex`, so it has to go back
        // into `wlex`. Returning it to `lex` would make the wrapper fetch it from the
        // input again and record it a second time.
        PUTBACK(tok, wlex);
        Parse_Path(wlex, false, (mode_expr ? PATH_GENERIC_EXPR : PATH_GENERIC_TYPE));
    }

    return wlex.get_output();
}

/// Parse a token tree expression
TokenTree Parse_TT_Expr(TokenStream& lex)
{
    TRACE_FUNCTION;
    TTLexer wlex(lex);
    SET_PARSE_FLAG(wlex, no_expand_macros);

    // discard result
    Parse_Expr1(wlex);

    return wlex.get_output();
}

/// Parse a pattern, returning the tokens it was made of
TokenTree Parse_TT_Pattern(TokenStream& lex)
{
    TRACE_FUNCTION;
    TTLexer wlex(lex);
    SET_PARSE_FLAG(wlex, no_expand_macros);

    // Allow a refutable pattern here
    Parse_Pattern(wlex, true);

    return wlex.get_output();
}

/// Parse a statement as a token tree (not yet implemented, always throws)
TokenTree Parse_TT_Stmt(TokenStream& lex)
{
    TRACE_FUNCTION;
    TTLexer wlex(lex);
    SET_PARSE_FLAG(wlex, no_expand_macros);

    throw ParseError::Todo("Parse_TT_Stmt");
}

/// Parse a block as a token tree (not yet implemented, always throws)
TokenTree Parse_TT_Block(TokenStream& lex)
{
    TRACE_FUNCTION;
    TTLexer wlex(lex);
    SET_PARSE_FLAG(wlex, no_expand_macros);

    throw ParseError::Todo("Parse_TT_Block");
}

/// Parse a meta item (attribute contents), returning the tokens it was made of
TokenTree Parse_TT_Meta(TokenStream& lex)
{
    TRACE_FUNCTION;
    TTLexer wlex(lex);
    SET_PARSE_FLAG(wlex, no_expand_macros);
    Parse_MetaItem(wlex);
    return wlex.get_output();
}