diff options
Diffstat (limited to 'gcc/rust/expand/rust-macro-builtins-asm.cc')
-rw-r--r-- | gcc/rust/expand/rust-macro-builtins-asm.cc | 1175 |
1 files changed, 1173 insertions, 2 deletions
diff --git a/gcc/rust/expand/rust-macro-builtins-asm.cc b/gcc/rust/expand/rust-macro-builtins-asm.cc index 62bb593..529ccc5 100644 --- a/gcc/rust/expand/rust-macro-builtins-asm.cc +++ b/gcc/rust/expand/rust-macro-builtins-asm.cc @@ -16,5 +16,1176 @@ // along with GCC; see the file COPYING3. If not see // <http://www.gnu.org/licenses/>. -#include "rust-macro-builtins.h" -#include "rust-macro-builtins-helpers.h" +#include "expected.h" +#include "rust-macro-builtins-asm.h" +#include "rust-ast-fragment.h" +#include "rust-ast.h" +#include "rust-fmt.h" +#include "rust-stmt.h" +#include "rust-parse.h" + +namespace Rust { +std::set<std::string> potentially_nonpromoted_keywords + = {"in", "out", "lateout", "inout", "inlateout", "const", "sym", "label"}; + +// Helper function strips the beginning and ending double quotes from a +// string. +std::string +strip_double_quotes (const std::string &str) +{ + std::string result = str; + + rust_assert (!str.empty ()); + + rust_assert (str.front () == '\"'); + rust_assert (str.back () == '\"'); + + // we have to special case empty strings which just contain a set of quotes + // so, if the string is "\"\"", just return "" + if (result.size () == 2) + return ""; + + rust_assert (result.size () >= 3); + + result.erase (0, 1); + result.erase (result.size () - 1, 1); + + return result; +} + +tl::expected<InlineAsmContext, InlineAsmParseError> +parse_clobber_abi (InlineAsmContext inline_asm_ctx) +{ + // clobber_abi := "clobber_abi(" <abi> *("," <abi>) [","] ")" + // PARSE EVERYTHING COMMITTEDLY IN THIS FUNCTION, WE CONFIRMED VIA clobber_abi + // identifier keyword + auto &parser = inline_asm_ctx.parser; + auto last_token_id = inline_asm_ctx.last_token_id; + auto &inline_asm = inline_asm_ctx.inline_asm; + auto token = parser.peek_current_token (); + if (!parser.skip_token (LEFT_PAREN)) + { + token = parser.peek_current_token (); + + // TODO: Error reporting shifted to the left 1 character, I'm not sure + // why. + if (token->get_id () == last_token_id) + { + rust_error_at (token->get_locus (), + "expected %<(%>, found end of macro arguments"); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + else + { + rust_error_at (token->get_locus (), "expected %<(%>, found %qs", + token->get_token_description ()); + } + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + + if (parser.skip_token (RIGHT_PAREN)) + { + rust_error_at ( + parser.peek_current_token ()->get_locus (), + "at least one abi must be provided as an argument to %<clobber_abi%>"); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + + std::vector<AST::TupleClobber> new_abis; + + token = parser.peek_current_token (); + + while (token->get_id () != last_token_id && token->get_id () != RIGHT_PAREN) + { + // Check if it is a string literal or not, codename: <ABI> in ABNF + if (token->get_id () == STRING_LITERAL) + { + // TODO: Caring for span in here. + new_abis.push_back ({token->as_string (), token->get_locus ()}); + } + else + { + // TODO: We encountered something that is not string literal, which + // should be illegal, please emit the correct error + // https://github.com/rust-lang/rust/blob/b92758a9aef1cef7b79e2b72c3d8ba113e547f89/compiler/rustc_builtin_macros/src/asm.rs#L387 + rust_unreachable (); + } + + if (parser.skip_token (RIGHT_PAREN)) + { + break; + } + + if (!parser.skip_token (COMMA)) + { + // TODO: If the skip of comma is unsuccessful, which should be + // illegal, pleaes emit the correct error. + rust_unreachable (); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + + token = parser.peek_current_token (); + } + + // Done processing the local clobber abis, push that to the main Args in + // argument + + for (auto abi : new_abis) + { + inline_asm.clobber_abi.push_back (abi); + } + + return inline_asm_ctx; +} + +tl::optional<AST::InlineAsmRegOrRegClass> +parse_reg (InlineAsmContext &inline_asm_ctx) +{ + using RegType = AST::InlineAsmRegOrRegClass::Type; + auto &parser = inline_asm_ctx.parser; + + if (!parser.skip_token (LEFT_PAREN)) + { + // TODO: we expect a left parenthesis here, please return the correct + // error. + rust_unreachable (); + return tl::nullopt; + } + + // after successful left parenthesis parsing, we should return ast of + // InlineAsmRegOrRegClass of reg or reg class + auto token = parser.peek_current_token (); + AST::InlineAsmRegOrRegClass reg_class; + if (parser.skip_token (IDENTIFIER)) + { + // construct a InlineAsmRegOrRegClass + reg_class.type = RegType::RegClass; + reg_class.reg_class.Symbol = token->as_string (); + } + else if (parser.skip_token (STRING_LITERAL)) + { + // TODO: there is STRING_LITERAL, and BYTE_STRING_LITERAL, should we check + // for both? + + // construct a InlineAsmRegOrRegClass + // parse_format_string + reg_class.type = RegType::Reg; + inline_asm_ctx.is_explicit = true; + reg_class.reg_class.Symbol = token->as_string (); + } + else + { + // TODO: This should emit error + // return + // Err(p.dcx().create_err(errors::ExpectedRegisterClassOrExplicitRegister + // { + // span: p.token.span, + // })); + rust_unreachable (); + } + if (!parser.skip_token (RIGHT_PAREN)) + { + // TODO: we expect a left parenthesis here, please return the correct + // error. + rust_unreachable (); + return tl::nullopt; + } + + return reg_class; +} + +// From rustc +tl::expected<InlineAsmContext, InlineAsmParseError> +parse_reg_operand (InlineAsmContext inline_asm_ctx) +{ + // let name = if p.token.is_ident() && p.look_ahead(1, |t| *t == token::Eq) { + // let (ident, _) = p.token.ident().unwrap(); + // p.bump(); + // p.expect(&token::Eq)?; + // allow_templates = false; + // Some(ident.name) + // } else { + // None + // }; + auto &parser = inline_asm_ctx.parser; + auto token = parser.peek_current_token (); + auto iden_token = parser.peek_current_token (); + + tl::optional<std::string> name = tl::nullopt; + if (check_identifier (parser, "")) + { + auto equal_token = parser.peek_current_token (); + + if (parser.skip_token (EQUAL)) + { + name = token->as_string (); + } + else + { + rust_error_at (token->get_locus (), + "expected operand, %s, options, or " + "additional template string", + "clobber_abi"); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + } + + int slot = inline_asm_ctx.inline_asm.operands.size (); + + // Here is all parse_reg_operand functions we're using in a for loop + auto parse_funcs = {parse_reg_operand_in, parse_reg_operand_out, + parse_reg_operand_lateout, parse_reg_operand_inout, + parse_reg_operand_const, parse_reg_operand_sym, + parse_reg_operand_unexpected}; + + // Loop over and execute the parsing functions, if the parser successfullly + // parses or if the parser fails to parse while it has committed to a token, + // we propogate the result. + tl::expected<InlineAsmContext, InlineAsmParseError> parsing_operand ( + inline_asm_ctx); + for (auto &parse_func : parse_funcs) + { + auto result = parsing_operand.and_then (parse_func); + + // Per rust's asm.rs's structure + // After we've parse successfully, we break out and do a local validation + // of named, positional & explicit register operands + + if (result.has_value ()) + { + inline_asm_ctx = *result; + break; + } + else if (result.error () == COMMITTED) + { + if (parse_func == parse_reg_operand_unexpected) + return inline_asm_ctx; + else + return result; + } + } + + auto &inline_asm = inline_asm_ctx.inline_asm; + + token = inline_asm_ctx.parser.peek_current_token (); + rust_debug_loc (token->get_locus (), "Here\n"); + if (inline_asm_ctx.is_explicit) + { + if (name != tl::nullopt) + { + rust_error_at (token->get_locus (), + "explicit register arguments cannot have names"); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + inline_asm.reg_args.insert (slot); + } + else if (name != tl::nullopt) + { + if (inline_asm.named_args.find (name.value ()) + != inline_asm.named_args.end ()) + { + rust_error_at (token->get_locus (), "duplicate argument named %qs", + name.value ().c_str ()); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + inline_asm.named_args[name.value ()] = slot; + } + else + { + if (!inline_asm.named_args.empty () || !inline_asm.reg_args.empty ()) + { + // positional arguments cannot follow named arguments or explicit + // register arguments + rust_error_at (token->get_locus (), + "positional arguments cannot follow named arguments " + "or explicit register arguments"); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + } + + return inline_asm_ctx; +} + +tl::expected<InlineAsmContext, InlineAsmParseError> +parse_reg_operand_in (InlineAsmContext inline_asm_ctx) +{ + // For the keyword IN, currently we count it as a seperate keyword called + // Rust::IN search for #define RS_TOKEN_LIST in code base. + auto &parser = inline_asm_ctx.parser; + location_t locus = parser.peek_current_token ()->get_locus (); + if (!inline_asm_ctx.is_global_asm () && parser.skip_token (IN)) + { + auto reg = parse_reg (inline_asm_ctx); + + if (parser.skip_token (UNDERSCORE)) + { + // We are sure to be failing a test here, based on asm.rs + // https://github.com/rust-lang/rust/blob/a330e49593ee890f9197727a3a558b6e6b37f843/compiler/rustc_builtin_macros/src/asm.rs#L112 + rust_unreachable (); + // return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + + auto expr = parser.parse_expr (); + + // TODO: When we've succesfully parse an expr, remember to clone_expr() + // instead of nullptr + AST::InlineAsmOperand::In in (reg, std::move (expr)); + inline_asm_ctx.inline_asm.operands.emplace_back (in, locus); + return inline_asm_ctx; + } + return tl::unexpected<InlineAsmParseError> (NONCOMMITED); +} + +tl::expected<InlineAsmContext, InlineAsmParseError> +parse_reg_operand_out (InlineAsmContext inline_asm_ctx) +{ + auto &parser = inline_asm_ctx.parser; + location_t locus = parser.peek_current_token ()->get_locus (); + if (!inline_asm_ctx.is_global_asm () && check_identifier (parser, "out")) + { + auto reg = parse_reg (inline_asm_ctx); + std::unique_ptr<AST::Expr> expr = parser.parse_expr (); + + rust_assert (expr != nullptr); + + /*auto expr_ptr = + std::make_unique<AST::Expr>(AST::LiteralExpr(Literal))*/ + + // TODO: When we've succesfully parse an expr, remember to clone_expr() + // instead of nullptr + AST::InlineAsmOperand::Out out (reg, false, std::move (expr)); + + inline_asm_ctx.inline_asm.operands.emplace_back (out, locus); + + return inline_asm_ctx; + } + + return tl::unexpected<InlineAsmParseError> (NONCOMMITED); +} + +tl::expected<InlineAsmContext, InlineAsmParseError> +parse_reg_operand_lateout (InlineAsmContext inline_asm_ctx) +{ + auto &parser = inline_asm_ctx.parser; + auto token = parser.peek_current_token (); + if (!inline_asm_ctx.is_global_asm () && check_identifier (parser, "lateout")) + { + rust_error_at (token->get_locus (), + "The lateout feature is not implemented"); + rust_unreachable (); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + + return tl::unexpected<InlineAsmParseError> (NONCOMMITED); +} + +tl::expected<InlineAsmContext, InlineAsmParseError> +parse_reg_operand_inout (InlineAsmContext inline_asm_ctx) +{ + auto &parser = inline_asm_ctx.parser; + auto token = parser.peek_current_token (); + + if (!inline_asm_ctx.is_global_asm () && check_identifier (parser, "inout")) + { + auto reg = parse_reg (inline_asm_ctx); + + if (parser.skip_token (UNDERSCORE)) + { + // We are sure to be failing a test here, based on asm.rs + // https://github.com/rust-lang/rust/blob/a330e49593ee890f9197727a3a558b6e6b37f843/compiler/rustc_builtin_macros/src/asm.rs#L112 + rust_error_at (token->get_locus (), + "The lateout feature is not implemented"); + rust_unreachable (); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + + // TODO: Is error propogation our top priority, the ? in rust's asm.rs is + // doing a lot of work. + // TODO: Not sure how to use parse_expr + if (!check_identifier (parser, "")) + rust_unreachable (); + // auto expr = parse_format_string (inline_asm_ctx); + + std::unique_ptr<AST::Expr> out_expr; + + if (parser.skip_token (MATCH_ARROW)) + { + if (!parser.skip_token (UNDERSCORE)) + { + // auto result = parse_format_string (inline_asm_ctx); + + if (!check_identifier (parser, "")) + rust_unreachable (); + // out_expr = parser.parse_expr(); + } + + // TODO: Rembmer to pass in clone_expr() instead of nullptr + // https://github.com/rust-lang/rust/blob/a3167859f2fd8ff2241295469876a2b687280bdc/compiler/rustc_builtin_macros/src/asm.rs#L135 + // RUST VERSION: ast::InlineAsmOperand::SplitInOut { reg, in_expr: + // expr, out_expr, late: false } + // struct AST::InlineAsmOperand::SplitInOut split_in_out (reg, + // false, nullptr, + // nullptr); + // inline_asm_ctx.inline_asm.operands.push_back (split_in_out); + + return inline_asm_ctx; + } + else + { + // https://github.com/rust-lang/rust/blob/a3167859f2fd8ff2241295469876a2b687280bdc/compiler/rustc_builtin_macros/src/asm.rs#L137 + // RUST VERSION: ast::InlineAsmOperand::InOut { reg, expr, late: false + // } + // struct AST::InlineAsmOperand::InOut inout (reg, false, + // nullptr); + // inline_asm_ctx.inline_asm.operands.push_back (inout); + return inline_asm_ctx; + } + } + + return tl::unexpected<InlineAsmParseError> (NONCOMMITED); +} + +tl::expected<InlineAsmContext, InlineAsmParseError> +parse_reg_operand_const (InlineAsmContext inline_asm_ctx) +{ + auto &parser = inline_asm_ctx.parser; + if (parser.peek_current_token ()->get_id () == CONST) + { + // TODO: Please handle const with parse_expr instead. + auto anon_const = parse_format_string (inline_asm_ctx); + rust_unreachable (); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + + return tl::unexpected<InlineAsmParseError> (NONCOMMITED); +} + +tl::expected<InlineAsmContext, InlineAsmParseError> +parse_reg_operand_sym (InlineAsmContext inline_asm_ctx) +{ + auto &parser = inline_asm_ctx.parser; + + if (check_identifier (parser, "sym")) + { + // TODO: Please handle sym, which needs ExprKind::Path in Rust's asm.rs + rust_unreachable (); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + return tl::unexpected<InlineAsmParseError> (NONCOMMITED); +} + +tl::expected<InlineAsmContext, InlineAsmParseError> +parse_reg_operand_unexpected (InlineAsmContext inline_asm_ctx) +{ + auto token = inline_asm_ctx.parser.peek_current_token (); + // TODO: It is weird that we can't seem to match any identifier, + // something must be wrong. consult compiler code in asm.rs or rust online + // compiler. + // rust_unreachable (); + + // rust_error_at (token->get_locus (), "ERROR RIGHT HERE"); + return tl::unexpected<InlineAsmParseError> (COMMITTED); +} + +void +check_and_set (InlineAsmContext &inline_asm_ctx, AST::InlineAsm::Option option) +{ + auto &parser = inline_asm_ctx.parser; + auto &inline_asm = inline_asm_ctx.inline_asm; + if (inline_asm.options.count (option) != 0) + { + // TODO: report an error of duplication + rust_error_at (parser.peek_current_token ()->get_locus (), + "the %qs option was already provided", + AST::InlineAsm::option_to_string (option).c_str ()); + return; + } + else + { + inline_asm.options.insert (option); + } +} +tl::expected<InlineAsmContext, InlineAsmParseError> +parse_options (InlineAsmContext &inline_asm_ctx) +{ + auto &parser = inline_asm_ctx.parser; + bool is_global_asm = inline_asm_ctx.inline_asm.is_global_asm; + // Parse everything commitedly + if (!parser.skip_token (LEFT_PAREN)) + { + auto local_token = parser.peek_current_token (); + rust_error_at (local_token->get_locus (), "expected %qs, found %qs", "(", + local_token->as_string ().c_str ()); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + + auto token = parser.peek_current_token (); + while (!parser.skip_token (RIGHT_PAREN)) + { + if (!is_global_asm && check_identifier (parser, "pure")) + { + check_and_set (inline_asm_ctx, AST::InlineAsm::Option::PURE); + } + else if (!is_global_asm && check_identifier (parser, "nomem")) + { + check_and_set (inline_asm_ctx, AST::InlineAsm::Option::NOMEM); + } + else if (!is_global_asm && check_identifier (parser, "readonly")) + { + check_and_set (inline_asm_ctx, AST::InlineAsm::Option::READONLY); + } + else if (!is_global_asm && check_identifier (parser, "preserves_flags")) + { + check_and_set (inline_asm_ctx, + AST::InlineAsm::Option::PRESERVES_FLAGS); + } + else if (!is_global_asm && check_identifier (parser, "noreturn")) + { + check_and_set (inline_asm_ctx, AST::InlineAsm::Option::NORETURN); + } + else if (!is_global_asm && check_identifier (parser, "nostack")) + { + check_and_set (inline_asm_ctx, AST::InlineAsm::Option::NOSTACK); + } + else if (!is_global_asm && check_identifier (parser, "may_unwind")) + { + check_and_set (inline_asm_ctx, AST::InlineAsm::Option::MAY_UNWIND); + } + else if (check_identifier (parser, "att_syntax")) + { + check_and_set (inline_asm_ctx, AST::InlineAsm::Option::ATT_SYNTAX); + } + else if (check_identifier (parser, "raw")) + { + check_and_set (inline_asm_ctx, AST::InlineAsm::Option::RAW); + } + else + { + rust_error_at (token->get_locus (), + "expected one of %qs, %qs, %qs, %qs, %qs, %qs, %qs, " + "%qs, %qs, or %qs, found %qs", + ")", "att_syntax", "may_unwind", "nomem", "noreturn", + "nostack", "preserves_flags", "pure", "raw", + "readonly", token->as_string ().c_str ()); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + if (parser.skip_token (RIGHT_PAREN)) + { + break; + } + + // Parse comma as optional + if (parser.skip_token (COMMA)) + continue; + else + { + rust_unreachable (); + token = parser.peek_current_token (); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + } + + // TODO: Per rust asm.rs regarding options_spans + // I'm guessing this has to do with some error reporting. + // let new_span = span_start.to(p.prev_token.span); + // args.options_spans.push(new_span); + + return inline_asm_ctx; +} + +bool +check_identifier (Parser<MacroInvocLexer> &p, std::string ident) +{ + auto token = p.peek_current_token (); + + if (token->get_id () == IDENTIFIER) + { + auto str = token->as_string (); + + // For non-promoted keywords, we need to also check for them. + + if (str == ident) + { + p.skip_token (); + return true; + } + if (ident == "") + { + if (potentially_nonpromoted_keywords.find (str) + == potentially_nonpromoted_keywords.end ()) + { + p.skip_token (); + return true; + } + return false; + } + } + + return false; +} + +tl::optional<std::string> +parse_format_string (InlineAsmContext &inline_asm_ctx) +{ + auto &parser = inline_asm_ctx.parser; + auto last_token_id = inline_asm_ctx.last_token_id; + auto token = parser.peek_current_token (); + + if (token->get_id () != last_token_id && token->get_id () == STRING_LITERAL) + { + // very nice, we got a supposedly formatted string. + parser.skip_token (); + return token->as_string (); + } + else + { + return tl::nullopt; + } +} + +tl::optional<AST::Fragment> +MacroBuiltin::asm_handler (location_t invoc_locus, AST::MacroInvocData &invoc, + AST::InvocKind semicolon, AST::AsmKind is_global_asm) +{ + return parse_asm (invoc_locus, invoc, semicolon, is_global_asm); +} + +tl::optional<AST::Fragment> +MacroBuiltin::llvm_asm_handler (location_t invoc_locus, + AST::MacroInvocData &invoc, + AST::InvocKind semicolon, + AST::AsmKind is_global_asm) +{ + return parse_llvm_asm (invoc_locus, invoc, semicolon, is_global_asm); +} + +tl::expected<InlineAsmContext, InlineAsmParseError> +parse_asm_arg (InlineAsmContext inline_asm_ctx) +{ + auto &parser = inline_asm_ctx.parser; + auto last_token_id = inline_asm_ctx.last_token_id; + auto token = parser.peek_current_token (); + tl::optional<std::string> fm_string; + while (token->get_id () != last_token_id) + { + token = parser.peek_current_token (); + + if (token->get_id () == COLON || token->get_id () == SCOPE_RESOLUTION) + { + rust_error_at ( + token->get_locus (), + "the legacy LLVM-style %<asm!%> syntax is no longer supported"); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + + // We accept a comma token here. + if (token->get_id () != COMMA + && inline_asm_ctx.consumed_comma_without_formatted_string) + { + // if it is not a comma, but we consumed it previously, this is fine + // but we have to set it to false tho. + inline_asm_ctx.consumed_comma_without_formatted_string = false; + } + else if (token->get_id () == COMMA + && !inline_asm_ctx.consumed_comma_without_formatted_string) + { + inline_asm_ctx.consumed_comma_without_formatted_string = false; + parser.skip_token (); + } + else if (token->get_id () == COMMA + && inline_asm_ctx.consumed_comma_without_formatted_string) + { + // We consumed comma, and there happens to also be a comma + // error should be: expected expression, found `,` + rust_error_at (token->get_locus (), "expected expression, found %qs", + ","); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + break; + } + + // And if that token comma is also the trailing comma, we break + token = parser.peek_current_token (); + if (token->get_id () == COMMA && token->get_id () == last_token_id) + { + parser.skip_token (); + break; + } + + // Ok after the left paren is good, we better be parsing correctly + // everything in here, which is operand in ABNF + + // Parse clobber abi, eat the identifier named "clobber_abi" if true + if (check_identifier (parser, "clobber_abi")) + { + auto expected = parse_clobber_abi (inline_asm_ctx); + if (expected.has_value ()) + continue; + else if (expected.error () == COMMITTED) + return expected; + + // The error type is definitely non-committed (we have checked above), + // we are allowed to keep on parsing + } + + if (check_identifier (parser, "options")) + { + auto expected = parse_options (inline_asm_ctx); + if (expected.has_value ()) + continue; + else if (expected.error () == COMMITTED) + return expected; + + // The error type is definitely non-committed (we have checked above), + // we are allowed to keep on parsing + } + + // Ok after we have check that neither clobber_abi nor options works, the + // only other logical choice is reg_operand + + auto expected = parse_reg_operand (inline_asm_ctx); + if (expected.has_value ()) + continue; + else if (expected.error () == COMMITTED) + return expected; + + // Since parse_reg_operand is the last thing we've considered, + // The non-committed parse error type means that we have exhausted our + // search path + + // We then should return the error of COMMITTED, even though we have not + // committed to anything So that the error bubbles up and we recover from + // this error gracefully + rust_error_at (token->get_locus (), + "expected operand, %s, options, or additional " + "template string", + "clobber_abi"); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + return tl::expected<InlineAsmContext, InlineAsmParseError> (inline_asm_ctx); +} + +tl::expected<InlineAsmContext, InlineAsmParseError> +expand_inline_asm_strings (InlineAsmContext inline_asm_ctx) +{ + auto &inline_asm = inline_asm_ctx.inline_asm; + + auto str_vec = inline_asm.get_template_strs (); + + decltype (str_vec) resulting_template_vec; + for (auto &template_str : str_vec) + { + /*std::cout << template_str.symbol << std::endl;*/ + + auto pieces = Fmt::Pieces::collect (template_str.symbol, false, + Fmt::ffi::ParseMode::InlineAsm); + auto pieces_vec = pieces.get_pieces (); + + std::string transformed_template_str = ""; + for (size_t i = 0; i < pieces_vec.size (); i++) + { + auto piece = pieces_vec[i]; + if (piece.tag == Fmt::ffi::Piece::Tag::String) + { + transformed_template_str += piece.string._0.to_string (); + } + else if (piece.tag == Fmt::ffi::Piece::Tag::NextArgument) + { + /* std::cout << " " << i << ": "*/ + /*<< piece.next_argument._0.to_string () << std::endl;*/ + + auto next_argument = piece.next_argument._0; + switch (piece.next_argument._0.position.tag) + { + case Fmt::ffi::Position::Tag::ArgumentImplicitlyIs: { + auto idx = next_argument.position.argument_implicitly_is._0; + /*auto trait = next_argument.format;*/ + /*auto arg = arguments.at (idx);*/ + + /* // FIXME(Arthur): This API sucks*/ + /* rust_assert (arg.get_kind ().kind*/ + /*== AST::FormatArgumentKind::Kind::Normal);*/ + /**/ + /* args.push_back ({arg.get_expr ().clone_expr (), + * trait});*/ + + transformed_template_str += "%" + std::to_string (idx); + // std::cout << "argument implicitly is: " << idx << + // std::endl; std::cout << "transformed template str is:" + // << transformed_template_str << std::endl; + /*std::cout << "trait: " << trait.to_string () << + * std::endl;*/ + /*std::cout << "arg: " << arg.to_string () << std::endl;*/ + } + break; + case Fmt::ffi::Position::Tag::ArgumentIs: + case Fmt::ffi::Position::Tag::ArgumentNamed: + rust_sorry_at (inline_asm.get_locus (), + "unhandled argument position specifier"); + break; + } + } + } + template_str.symbol = transformed_template_str; + } + + inline_asm.template_strs = str_vec; + return inline_asm_ctx; +} + +tl::optional<AST::Fragment> +parse_asm (location_t invoc_locus, AST::MacroInvocData &invoc, + AST::InvocKind semicolon, AST::AsmKind is_global_asm) +{ + // From the rule of asm. + // We first parse all formatted strings. If we fail, then we return + // tl::nullopt + + // We then parse the asm arguments. If we fail, then we return + // tl::nullopt + + // We then validate. If we fail, then we return tl::nullopt + + // Done + MacroInvocLexer lex (invoc.get_delim_tok_tree ().to_token_stream ()); + Parser<MacroInvocLexer> parser (lex); + auto last_token_id = macro_end_token (invoc.get_delim_tok_tree (), parser); + + AST::InlineAsm inline_asm (invoc_locus, + is_global_asm == AST::AsmKind::Global); + auto inline_asm_ctx = InlineAsmContext (inline_asm, parser, last_token_id); + + auto resulting_context = parse_format_strings (inline_asm_ctx) + .and_then (parse_asm_arg) + .and_then (validate) + .and_then (expand_inline_asm_strings); + + // TODO: I'm putting the validation here because the rust reference put + // it here Per Arthur's advice we would actually do the validation in a + // different stage. and visit on the InlineAsm AST instead of it's + // context. + if (resulting_context) + { + auto node = (*resulting_context).inline_asm.clone_expr_without_block (); + + std::vector<AST::SingleASTNode> single_vec = {}; + + // If the macro invocation has a semicolon (`asm!("...");`), then we + // need to make it a statement. This way, it will be expanded + // properly. + if (semicolon == AST::InvocKind::Semicoloned) + single_vec.emplace_back (AST::SingleASTNode ( + std::make_unique<AST::ExprStmt> (std::move (node), invoc_locus, + semicolon + == AST::InvocKind::Semicoloned))); + else + single_vec.emplace_back (AST::SingleASTNode (std::move (node))); + + AST::Fragment fragment_ast + = AST::Fragment (single_vec, + std::vector<std::unique_ptr<AST::Token>> ()); + return fragment_ast; + } + else + { + return tl::nullopt; + } +} + +tl::expected<InlineAsmContext, InlineAsmParseError> +parse_format_strings (InlineAsmContext inline_asm_ctx) +{ + // Parse the first ever formatted string, success or not, will skip 1 + // token + auto &parser = inline_asm_ctx.parser; + auto last_token_id = inline_asm_ctx.last_token_id; + auto fm_string = parse_format_string (inline_asm_ctx); + + auto &inline_asm = inline_asm_ctx.inline_asm; + auto token = parser.peek_current_token (); + if (fm_string == tl::nullopt) + { + rust_error_at (parser.peek_current_token ()->get_locus (), + "%s template must be a string literal", "asm"); + return tl::unexpected<InlineAsmParseError> (COMMITTED); + } + else + { + auto template_str + = AST::TupleTemplateStr (token->get_locus (), + strip_double_quotes (fm_string.value ())); + inline_asm.template_strs.push_back (template_str); + } + + // formatted string stream + + while (parser.peek_current_token ()->get_id () != last_token_id) + { + if (!parser.skip_token (COMMA)) + { + break; + } + // Ok after the comma is good, we better be parsing correctly + // everything in here, which is formatted string in ABNF + inline_asm_ctx.consumed_comma_without_formatted_string = false; + + token = parser.peek_current_token (); + fm_string = parse_format_string (inline_asm_ctx); + if (fm_string == tl::nullopt) + { + inline_asm_ctx.consumed_comma_without_formatted_string = true; + break; + } + else + { + auto template_str + = AST::TupleTemplateStr (token->get_locus (), + strip_double_quotes (fm_string.value ())); + inline_asm.template_strs.push_back (template_str); + } + } + + return inline_asm_ctx; +} + +// bool +// is_label (const std::string &potential_label) +// { + +// if (potential_label.empty () || potential_label.back () != ':') +// return false; + +// // Check if all characters before the last colon are digits +// for (size_t i = 0; i < potential_label.length () - 1; i++) +// { +// if (potential_label[i] < '0' || potential_label[i] > '9') +// return false; +// } + +// return true; +// } + +tl::expected<InlineAsmContext, InlineAsmParseError> +validate (InlineAsmContext inline_asm_ctx) +{ + return tl::expected<InlineAsmContext, InlineAsmParseError> (inline_asm_ctx); +} + +tl::optional<LlvmAsmContext> +parse_llvm_templates (LlvmAsmContext ctx) +{ + auto &parser = ctx.parser; + + auto token = parser.peek_current_token (); + + if (token->get_id () == ctx.last_token_id + || token->get_id () != STRING_LITERAL) + { + return tl::nullopt; + } + + ctx.llvm_asm.get_templates ().emplace_back (token->get_locus (), + strip_double_quotes ( + token->as_string ())); + ctx.parser.skip_token (); + + token = parser.peek_current_token (); + if (token->get_id () != ctx.last_token_id && token->get_id () != COLON + && token->get_id () != SCOPE_RESOLUTION) + { + // We do not handle multiple template string, we provide minimal support + // for the black_box intrinsics. + rust_unreachable (); + } + + return ctx; +} + +tl::optional<LlvmAsmContext> +parse_llvm_arguments (LlvmAsmContext ctx) +{ + auto &parser = ctx.parser; + enum State + { + Templates = 0, + Output, + Input, + Clobbers, + Options + } current_state + = State::Templates; + + while (parser.peek_current_token ()->get_id () != ctx.last_token_id + && parser.peek_current_token ()->get_id () != END_OF_FILE) + { + if (parser.peek_current_token ()->get_id () == SCOPE_RESOLUTION) + { + parser.skip_token (SCOPE_RESOLUTION); + current_state = static_cast<State> (current_state + 2); + } + else + { + parser.skip_token (COLON); + current_state = static_cast<State> (current_state + 1); + } + + switch (current_state) + { + case State::Output: + parse_llvm_outputs (ctx); + break; + case State::Input: + parse_llvm_inputs (ctx); + break; + case State::Clobbers: + parse_llvm_clobbers (ctx); + break; + case State::Options: + parse_llvm_options (ctx); + break; + case State::Templates: + default: + rust_unreachable (); + } + } + + return ctx; +} + +void +parse_llvm_operands (LlvmAsmContext &ctx, std::vector<AST::LlvmOperand> &result) +{ + auto &parser = ctx.parser; + auto token = parser.peek_current_token (); + while (token->get_id () != COLON && token->get_id () != SCOPE_RESOLUTION + && token->get_id () != ctx.last_token_id) + { + std::string constraint; + if (token->get_id () == STRING_LITERAL) + { + constraint = strip_double_quotes (token->as_string ()); + } + parser.skip_token (STRING_LITERAL); + parser.skip_token (LEFT_PAREN); + + token = parser.peek_current_token (); + + ParseRestrictions restrictions; + restrictions.expr_can_be_null = true; + auto expr = parser.parse_expr (); + + parser.skip_token (RIGHT_PAREN); + + result.emplace_back (constraint, std::move (expr)); + + if (parser.peek_current_token ()->get_id () == COMMA) + parser.skip_token (COMMA); + + token = parser.peek_current_token (); + } +} + +void +parse_llvm_outputs (LlvmAsmContext &ctx) +{ + parse_llvm_operands (ctx, ctx.llvm_asm.get_outputs ()); +} + +void +parse_llvm_inputs (LlvmAsmContext &ctx) +{ + parse_llvm_operands (ctx, ctx.llvm_asm.get_inputs ()); +} + +void +parse_llvm_clobbers (LlvmAsmContext &ctx) +{ + auto &parser = ctx.parser; + auto token = parser.peek_current_token (); + while (token->get_id () != COLON && token->get_id () != ctx.last_token_id) + { + if (token->get_id () == STRING_LITERAL) + { + ctx.llvm_asm.get_clobbers ().push_back ( + {strip_double_quotes (token->as_string ()), token->get_locus ()}); + } + parser.skip_token (STRING_LITERAL); + token = parser.peek_current_token (); + } +} + +void +parse_llvm_options (LlvmAsmContext &ctx) +{ + auto &parser = ctx.parser; + auto token = parser.peek_current_token (); + + while (token->get_id () != ctx.last_token_id) + { + if (token->get_id () == STRING_LITERAL) + { + auto token_str = strip_double_quotes (token->as_string ()); + + if (token_str == "volatile") + ctx.llvm_asm.set_volatile (true); + else if (token_str == "alignstack") + ctx.llvm_asm.set_align_stack (true); + else if (token_str == "intel") + ctx.llvm_asm.set_dialect (AST::LlvmInlineAsm::Dialect::Intel); + else + rust_error_at (token->get_locus (), + "Unknown llvm assembly option %qs", + token_str.c_str ()); + } + parser.skip_token (STRING_LITERAL); + + token = parser.peek_current_token (); + + if (token->get_id () == ctx.last_token_id) + continue; + parser.skip_token (COMMA); + } + + parser.skip_token (); +} + +tl::optional<AST::Fragment> +parse_llvm_asm (location_t invoc_locus, AST::MacroInvocData &invoc, + AST::InvocKind semicolon, AST::AsmKind is_global_asm) +{ + MacroInvocLexer lex (invoc.get_delim_tok_tree ().to_token_stream ()); + Parser<MacroInvocLexer> parser (lex); + auto last_token_id = macro_end_token (invoc.get_delim_tok_tree (), parser); + + AST::LlvmInlineAsm llvm_asm{invoc_locus}; + + auto asm_ctx = LlvmAsmContext (llvm_asm, parser, last_token_id); + + auto resulting_context + = parse_llvm_templates (asm_ctx).and_then (parse_llvm_arguments); + + if (resulting_context) + { + auto node = (*resulting_context).llvm_asm.clone_expr_without_block (); + + std::vector<AST::SingleASTNode> single_vec = {}; + + // If the macro invocation has a semicolon (`asm!("...");`), then we + // need to make it a statement. This way, it will be expanded + // properly. + if (semicolon == AST::InvocKind::Semicoloned) + single_vec.emplace_back (AST::SingleASTNode ( + std::make_unique<AST::ExprStmt> (std::move (node), invoc_locus, + semicolon + == AST::InvocKind::Semicoloned))); + else + single_vec.emplace_back (AST::SingleASTNode (std::move (node))); + + AST::Fragment fragment_ast + = AST::Fragment (single_vec, + std::vector<std::unique_ptr<AST::Token>> ()); + return fragment_ast; + } + return tl::nullopt; +} + +} // namespace Rust |