diff options
author | Tom Tromey <tom@tromey.com> | 2016-04-26 19:38:08 -0600 |
---|---|---|
committer | Tom Tromey <tom@tromey.com> | 2016-05-17 12:02:00 -0600 |
commit | c44af4ebc000f606d16b42224cba2cfe80391d5c (patch) | |
tree | 73839883edc5c0bd6f744024802b30f0bdd7b0e3 /gdb/rust-exp.y | |
parent | 00272ec4b0cc22c1b9d60d39ce7bf5b2d5512582 (diff) | |
download | gdb-c44af4ebc000f606d16b42224cba2cfe80391d5c.zip gdb-c44af4ebc000f606d16b42224cba2cfe80391d5c.tar.gz gdb-c44af4ebc000f606d16b42224cba2cfe80391d5c.tar.bz2 |
Add support for the Rust language
This patch adds support for the Rust language.
2016-05-17 Tom Tromey <tom@tromey.com>
Manish Goregaokar <manishsmail@gmail.com>
* symtab.c (symbol_find_demangled_name): Handle Rust.
* symfile.c (init_filename_language_table): Treat ".rs" as Rust.
* std-operator.def (STRUCTOP_ANONYMOUS, OP_RUST_ARRAY): New
constants.
* rust-lang.h: New file.
* rust-lang.c: New file.
* rust-exp.y: New file.
* dwarf2read.c (read_file_scope): Add Rust producer sniffing.
(dwarf2_compute_name, read_func_scope, read_structure_type)
(read_base_type, read_subrange_type, set_cu_language)
(new_symbol_full, determine_prefix): Handle Rust.
* defs.h (enum language) <language_rust>: New constant.
* Makefile.in (SFILES): Add rust-exp.y, rust-lang.c.
(COMMON_OBS): Add rust-exp.o, rust-lang.o.
2016-05-17 Tom Tromey <tom@tromey.com>
* gdb.base/default.exp (set language): Add rust.
Diffstat (limited to 'gdb/rust-exp.y')
-rw-r--r-- | gdb/rust-exp.y | 2752 |
1 files changed, 2752 insertions, 0 deletions
diff --git a/gdb/rust-exp.y b/gdb/rust-exp.y new file mode 100644 index 0000000..f0c4e6c --- /dev/null +++ b/gdb/rust-exp.y @@ -0,0 +1,2752 @@ +/* Bison parser for Rust expressions, for GDB. + Copyright (C) 2016 Free Software Foundation, Inc. + + This file is part of GDB. + + This program is free software; you can redistribute it and/or modify + it under the terms of the GNU General Public License as published by + the Free Software Foundation; either version 3 of the License, or + (at your option) any later version. + + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU General Public License for more details. + + You should have received a copy of the GNU General Public License + along with this program. If not, see <http://www.gnu.org/licenses/>. */ + +/* Removing the last conflict seems difficult. */ +%expect 1 + +%{ + +#include "defs.h" + +#include "block.h" +#include "charset.h" +#include "cp-support.h" +#include "f-lang.h" +#include "gdb_obstack.h" +#include "gdb_regex.h" +#include "rust-lang.h" +#include "parser-defs.h" +#include "selftest.h" +#include "value.h" +#include "vec.h" + +#define GDB_YY_REMAP_PREFIX rust +#include "yy-remap.h" + +#define RUSTSTYPE YYSTYPE + +extern initialize_file_ftype _initialize_rust_exp; + +struct rust_op; +typedef const struct rust_op *rust_op_ptr; +DEF_VEC_P (rust_op_ptr); + +/* A typed integer constant. */ + +struct typed_val_int +{ + LONGEST val; + struct type *type; +}; + +/* A typed floating point constant. */ + +struct typed_val_float +{ + DOUBLEST dval; + struct type *type; +}; + +/* An identifier and an expression. This is used to represent one + element of a struct initializer. */ + +struct set_field +{ + struct stoken name; + const struct rust_op *init; +}; + +typedef struct set_field set_field; + +DEF_VEC_O (set_field); + + +static int rustyylex (void); +static void rust_push_back (char c); +static const char *rust_copy_name (const char *, int); +static struct stoken rust_concat3 (const char *, const char *, const char *); +static struct stoken make_stoken (const char *); +static struct block_symbol rust_lookup_symbol (const char *name, + const struct block *block, + const domain_enum domain); +static struct type *rust_lookup_type (const char *name, + const struct block *block); +static struct type *rust_type (const char *name); + +static const struct rust_op *crate_name (const struct rust_op *name); +static const struct rust_op *super_name (const struct rust_op *name, + unsigned int n_supers); + +static const struct rust_op *ast_operation (enum exp_opcode opcode, + const struct rust_op *left, + const struct rust_op *right); +static const struct rust_op *ast_compound_assignment + (enum exp_opcode opcode, const struct rust_op *left, + const struct rust_op *rust_op); +static const struct rust_op *ast_literal (struct typed_val_int val); +static const struct rust_op *ast_dliteral (struct typed_val_float val); +static const struct rust_op *ast_structop (const struct rust_op *left, + const char *name, + int completing); +static const struct rust_op *ast_structop_anonymous + (const struct rust_op *left, struct typed_val_int number); +static const struct rust_op *ast_unary (enum exp_opcode opcode, + const struct rust_op *expr); +static const struct rust_op *ast_cast (const struct rust_op *expr, + const struct rust_op *type); +static const struct rust_op *ast_call_ish (enum exp_opcode opcode, + const struct rust_op *expr, + VEC (rust_op_ptr) **params); +static const struct rust_op *ast_path (struct stoken name, + VEC (rust_op_ptr) **params); +static const struct rust_op *ast_string (struct stoken str); +static const struct rust_op *ast_struct (const struct rust_op *name, + VEC (set_field) **fields); +static const struct rust_op *ast_range (const struct rust_op *lhs, + const struct rust_op *rhs); +static const struct rust_op *ast_array_type (const struct rust_op *lhs, + struct typed_val_int val); +static const struct rust_op *ast_slice_type (const struct rust_op *type); +static const struct rust_op *ast_reference_type (const struct rust_op *type); +static const struct rust_op *ast_pointer_type (const struct rust_op *type, + int is_mut); +static const struct rust_op *ast_function_type (const struct rust_op *result, + VEC (rust_op_ptr) **params); +static const struct rust_op *ast_tuple_type (VEC (rust_op_ptr) **params); + +/* The state of the parser, used internally when we are parsing the + expression. */ + +static struct parser_state *pstate = NULL; + +/* A regular expression for matching Rust numbers. This is split up + since it is very long and this gives us a way to comment the + sections. */ + +static const char *number_regex_text = + /* subexpression 1: allows use of alternation, otherwise uninteresting */ + "^(" + /* First comes floating point. */ + /* Recognize number after the decimal point, with optional + exponent and optional type suffix. + subexpression 2: allows "?", otherwise uninteresting + subexpression 3: if present, type suffix + */ + "[0-9][0-9_]*\\.[0-9][0-9_]*([eE][-+]?[0-9][0-9_]*)?(f32|f64)?" +#define FLOAT_TYPE1 3 + "|" + /* Recognize exponent without decimal point, with optional type + suffix. + subexpression 4: if present, type suffix + */ +#define FLOAT_TYPE2 4 + "[0-9][0-9_]*[eE][-+]?[0-9][0-9_]*(f32|f64)?" + "|" + /* "23." is a valid floating point number, but "23.e5" and + "23.f32" are not. So, handle the trailing-. case + separately. */ + "[0-9][0-9_]*\\." + "|" + /* Finally come integers. + subexpression 5: text of integer + subexpression 6: if present, type suffix + subexpression 7: allows use of alternation, otherwise uninteresting + */ +#define INT_TEXT 5 +#define INT_TYPE 6 + "(0x[a-fA-F0-9_]+|0o[0-7_]+|0b[01_]+|[0-9][0-9_]*)" + "([iu](size|8|16|32|64))?" + ")"; +/* The number of subexpressions to allocate space for, including the + "0th" whole match subexpression. */ +#define NUM_SUBEXPRESSIONS 8 + +/* The compiled number-matching regex. */ + +static regex_t number_regex; + +/* True if we're running unit tests. */ + +static int unit_testing; + +/* Obstack for data temporarily allocated during parsing. */ + +static struct obstack work_obstack; + +/* Result of parsing. Points into work_obstack. */ + +static const struct rust_op *rust_ast; + +%} + +%union +{ + /* A typed integer constant. */ + struct typed_val_int typed_val_int; + + /* A typed floating point constant. */ + struct typed_val_float typed_val_float; + + /* An identifier or string. */ + struct stoken sval; + + /* A token representing an opcode, like "==". */ + enum exp_opcode opcode; + + /* A list of expressions; for example, the arguments to a function + call. */ + VEC (rust_op_ptr) **params; + + /* A list of field initializers. */ + VEC (set_field) **field_inits; + + /* A single field initializer. */ + struct set_field one_field_init; + + /* An expression. */ + const struct rust_op *op; + + /* A plain integer, for example used to count the number of + "super::" prefixes on a path. */ + unsigned int depth; +} + +%{ + + /* Rust AST operations. We build a tree of these; then lower them + to gdb expressions when parsing has completed. */ + +struct rust_op +{ + /* The opcode. */ + enum exp_opcode opcode; + /* If OPCODE is OP_TYPE, then this holds information about what type + is described by this node. */ + enum type_code typecode; + /* Indicates whether OPCODE actually represents a compound + assignment. For example, if OPCODE is GTGT and this is false, + then this rust_op represents an ordinary ">>"; but if this is + true, then this rust_op represents ">>=". Unused in other + cases. */ + unsigned int compound_assignment : 1; + /* Only used by a field expression; if set, indicates that the field + name occurred at the end of the expression and is eligible for + completion. */ + unsigned int completing : 1; + /* Operands of expression. Which one is used and how depends on the + particular opcode. */ + RUSTSTYPE left; + RUSTSTYPE right; +}; + +%} + +%token <sval> GDBVAR +%token <sval> IDENT +%token <sval> COMPLETE +%token <typed_val_int> INTEGER +%token <typed_val_int> DECIMAL_INTEGER +%token <sval> STRING +%token <sval> BYTESTRING +%token <typed_val_float> FLOAT +%token <opcode> COMPOUND_ASSIGN + +/* Keyword tokens. */ +%token <voidval> KW_AS +%token <voidval> KW_IF +%token <voidval> KW_TRUE +%token <voidval> KW_FALSE +%token <voidval> KW_SUPER +%token <voidval> KW_SELF +%token <voidval> KW_MUT +%token <voidval> KW_EXTERN +%token <voidval> KW_CONST +%token <voidval> KW_FN + +/* Operator tokens. */ +%token <voidval> DOTDOT +%token <voidval> OROR +%token <voidval> ANDAND +%token <voidval> EQEQ +%token <voidval> NOTEQ +%token <voidval> LTEQ +%token <voidval> GTEQ +%token <voidval> LSH RSH +%token <voidval> COLONCOLON +%token <voidval> ARROW + +%type <op> type +%type <op> path_for_expr +%type <op> identifier_path_for_expr +%type <op> path_for_type +%type <op> identifier_path_for_type +%type <op> just_identifiers_for_type + +%type <params> maybe_type_list +%type <params> type_list + +%type <depth> super_path + +%type <op> literal +%type <op> expr +%type <op> field_expr +%type <op> idx_expr +%type <op> unop_expr +%type <op> binop_expr +%type <op> binop_expr_expr +%type <op> type_cast_expr +%type <op> assignment_expr +%type <op> compound_assignment_expr +%type <op> paren_expr +%type <op> call_expr +%type <op> path_expr +%type <op> tuple_expr +%type <op> unit_expr +%type <op> struct_expr +%type <op> array_expr +%type <op> range_expr + +%type <params> expr_list +%type <params> maybe_expr_list +%type <params> paren_expr_list + +%type <field_inits> struct_expr_list +%type <one_field_init> struct_expr_tail + +/* Precedence. */ +%nonassoc DOTDOT +%right '=' COMPOUND_ASSIGN +%left OROR +%left ANDAND +%nonassoc EQEQ NOTEQ '<' '>' LTEQ GTEQ +%left '|' +%left '^' +%left '&' +%left LSH RSH +%left '@' +%left '+' '-' +%left '*' '/' '%' +/* These could be %precedence in Bison, but that isn't a yacc + feature. */ +%left KW_AS +%left UNARY +%left '[' '.' '(' + +%% + +start: + expr + { + /* If we are completing and see a valid parse, + rust_ast will already have been set. */ + if (rust_ast == NULL) + rust_ast = $1; + } +; + +/* Note that the Rust grammar includes a method_call_expr, but we + handle this differently, to avoid a shift/reduce conflict with + call_expr. */ +expr: + literal +| path_expr +| tuple_expr +| unit_expr +| struct_expr +| field_expr +| array_expr +| idx_expr +| range_expr +| unop_expr +| binop_expr +| paren_expr +| call_expr +; + +tuple_expr: + '(' expr ',' maybe_expr_list ')' + { + VEC_safe_insert (rust_op_ptr, *$4, 0, $2); + error (_("Tuple expressions not supported yet")); + } +; + +unit_expr: + '(' ')' + { + struct typed_val_int val; + + val.type + = language_lookup_primitive_type (parse_language (pstate), + parse_gdbarch (pstate), + "()"); + val.val = 0; + $$ = ast_literal (val); + } +; + +/* To avoid a shift/reduce conflict with call_expr, we don't handle + tuple struct expressions here, but instead when examining the + AST. */ +struct_expr: + path_for_expr '{' struct_expr_list '}' + { $$ = ast_struct ($1, $3); } +; + +struct_expr_tail: + DOTDOT expr + { + struct set_field sf; + + sf.name.ptr = NULL; + sf.name.length = 0; + sf.init = $2; + + $$ = sf; + } +| IDENT ':' expr + { + struct set_field sf; + + sf.name = $1; + sf.init = $3; + $$ = sf; + } +; + +/* S{} is documented as valid but seems to be an unstable feature, so + it is left out here. */ +struct_expr_list: + struct_expr_tail + { + VEC (set_field) **result + = OBSTACK_ZALLOC (&work_obstack, VEC (set_field) *); + + make_cleanup (VEC_cleanup (set_field), result); + VEC_safe_push (set_field, *result, &$1); + + $$ = result; + } +| IDENT ':' expr ',' struct_expr_list + { + struct set_field sf; + + sf.name = $1; + sf.init = $3; + VEC_safe_push (set_field, *$5, &sf); + $$ = $5; + } +; + +array_expr: + '[' KW_MUT expr_list ']' + { $$ = ast_call_ish (OP_ARRAY, NULL, $3); } +| '[' expr_list ']' + { $$ = ast_call_ish (OP_ARRAY, NULL, $2); } +| '[' KW_MUT expr ';' expr ']' + { $$ = ast_operation (OP_RUST_ARRAY, $3, $5); } +| '[' expr ';' expr ']' + { $$ = ast_operation (OP_RUST_ARRAY, $2, $4); } +; + +range_expr: + expr DOTDOT + { $$ = ast_range ($1, NULL); } +| expr DOTDOT expr + { $$ = ast_range ($1, $3); } +| DOTDOT expr + { $$ = ast_range (NULL, $2); } +| DOTDOT + { $$ = ast_range (NULL, NULL); } +; + +literal: + INTEGER + { $$ = ast_literal ($1); } +| DECIMAL_INTEGER + { $$ = ast_literal ($1); } +| FLOAT + { $$ = ast_dliteral ($1); } +| STRING + { + const struct rust_op *str = ast_string ($1); + VEC (set_field) **fields; + struct set_field field; + struct typed_val_int val; + struct stoken token; + + fields = OBSTACK_ZALLOC (&work_obstack, VEC (set_field) *); + make_cleanup (VEC_cleanup (set_field), fields); + + /* Wrap the raw string in the &str struct. */ + field.name.ptr = "data_ptr"; + field.name.length = strlen (field.name.ptr); + field.init = ast_unary (UNOP_ADDR, ast_string ($1)); + VEC_safe_push (set_field, *fields, &field); + + val.type = rust_type ("usize"); + val.val = $1.length; + + field.name.ptr = "length"; + field.name.length = strlen (field.name.ptr); + field.init = ast_literal (val); + VEC_safe_push (set_field, *fields, &field); + + token.ptr = "&str"; + token.length = strlen (token.ptr); + $$ = ast_struct (ast_path (token, NULL), fields); + } +| BYTESTRING + { $$ = ast_string ($1); } +| KW_TRUE + { + struct typed_val_int val; + + val.type = language_bool_type (parse_language (pstate), + parse_gdbarch (pstate)); + val.val = 1; + $$ = ast_literal (val); + } +| KW_FALSE + { + struct typed_val_int val; + + val.type = language_bool_type (parse_language (pstate), + parse_gdbarch (pstate)); + val.val = 0; + $$ = ast_literal (val); + } +; + +field_expr: + expr '.' IDENT + { $$ = ast_structop ($1, $3.ptr, 0); } +| expr '.' COMPLETE + { + $$ = ast_structop ($1, $3.ptr, 1); + rust_ast = $$; + } +| expr '.' DECIMAL_INTEGER + { $$ = ast_structop_anonymous ($1, $3); } +; + +idx_expr: + expr '[' expr ']' + { $$ = ast_operation (BINOP_SUBSCRIPT, $1, $3); } +; + +unop_expr: + '+' expr %prec UNARY + { $$ = ast_unary (UNOP_PLUS, $2); } + +| '-' expr %prec UNARY + { $$ = ast_unary (UNOP_NEG, $2); } + +| '!' expr %prec UNARY + { + /* Note that we provide a Rust-specific evaluator + override for UNOP_COMPLEMENT, so it can do the + right thing for both bool and integral + values. */ + $$ = ast_unary (UNOP_COMPLEMENT, $2); + } + +| '*' expr %prec UNARY + { $$ = ast_unary (UNOP_IND, $2); } + +| '&' expr %prec UNARY + { $$ = ast_unary (UNOP_ADDR, $2); } + +| '&' KW_MUT expr %prec UNARY + { $$ = ast_unary (UNOP_ADDR, $3); } + +; + +binop_expr: + binop_expr_expr +| type_cast_expr +| assignment_expr +| compound_assignment_expr +; + +binop_expr_expr: + expr '*' expr + { $$ = ast_operation (BINOP_MUL, $1, $3); } + +| expr '@' expr + { $$ = ast_operation (BINOP_REPEAT, $1, $3); } + +| expr '/' expr + { $$ = ast_operation (BINOP_DIV, $1, $3); } + +| expr '%' expr + { $$ = ast_operation (BINOP_REM, $1, $3); } + +| expr '<' expr + { $$ = ast_operation (BINOP_LESS, $1, $3); } + +| expr '>' expr + { $$ = ast_operation (BINOP_GTR, $1, $3); } + +| expr '&' expr + { $$ = ast_operation (BINOP_BITWISE_AND, $1, $3); } + +| expr '|' expr + { $$ = ast_operation (BINOP_BITWISE_IOR, $1, $3); } + +| expr '^' expr + { $$ = ast_operation (BINOP_BITWISE_XOR, $1, $3); } + +| expr '+' expr + { $$ = ast_operation (BINOP_ADD, $1, $3); } + +| expr '-' expr + { $$ = ast_operation (BINOP_SUB, $1, $3); } + +| expr OROR expr + { $$ = ast_operation (BINOP_LOGICAL_OR, $1, $3); } + +| expr ANDAND expr + { $$ = ast_operation (BINOP_LOGICAL_AND, $1, $3); } + +| expr EQEQ expr + { $$ = ast_operation (BINOP_EQUAL, $1, $3); } + +| expr NOTEQ expr + { $$ = ast_operation (BINOP_NOTEQUAL, $1, $3); } + +| expr LTEQ expr + { $$ = ast_operation (BINOP_LEQ, $1, $3); } + +| expr GTEQ expr + { $$ = ast_operation (BINOP_GEQ, $1, $3); } + +| expr LSH expr + { $$ = ast_operation (BINOP_LSH, $1, $3); } + +| expr RSH expr + { $$ = ast_operation (BINOP_RSH, $1, $3); } +; + +type_cast_expr: + expr KW_AS type + { $$ = ast_cast ($1, $3); } +; + +assignment_expr: + expr '=' expr + { $$ = ast_operation (BINOP_ASSIGN, $1, $3); } +; + +compound_assignment_expr: + expr COMPOUND_ASSIGN expr + { $$ = ast_compound_assignment ($2, $1, $3); } + +; + +paren_expr: + '(' expr ')' + { $$ = $2; } +; + +expr_list: + expr + { + $$ = OBSTACK_ZALLOC (&work_obstack, VEC (rust_op_ptr) *); + make_cleanup (VEC_cleanup (rust_op_ptr), $$); + VEC_safe_push (rust_op_ptr, *$$, $1); + } +| expr_list ',' expr + { + VEC_safe_push (rust_op_ptr, *$1, $3); + $$ = $1; + } +; + +maybe_expr_list: + /* %empty */ + { + /* The result can't be NULL. */ + $$ = OBSTACK_ZALLOC (&work_obstack, VEC (rust_op_ptr) *); + make_cleanup (VEC_cleanup (rust_op_ptr), $$); + } +| expr_list + { $$ = $1; } +; + +paren_expr_list: + '(' + maybe_expr_list + ')' + { $$ = $2; } +; + +call_expr: + expr paren_expr_list + { $$ = ast_call_ish (OP_FUNCALL, $1, $2); } +; + +maybe_self_path: + /* %empty */ +| KW_SELF COLONCOLON +; + +super_path: + KW_SUPER COLONCOLON + { $$ = 1; } +| super_path KW_SUPER COLONCOLON + { $$ = $1 + 1; } +; + +path_expr: + path_for_expr + { $$ = $1; } +| GDBVAR + { $$ = ast_path ($1, NULL); } +| KW_SELF + { $$ = ast_path (make_stoken ("self"), NULL); } +; + +path_for_expr: + identifier_path_for_expr +| KW_SELF COLONCOLON identifier_path_for_expr + { $$ = super_name ($3, 0); } +| maybe_self_path super_path identifier_path_for_expr + { $$ = super_name ($3, $2); } +| COLONCOLON identifier_path_for_expr + { $$ = crate_name ($2); } +| KW_EXTERN identifier_path_for_expr + { + /* This is a gdb extension to make it possible to + refer to items in other crates. It just bypasses + adding the current crate to the front of the + name. */ + $$ = ast_path (rust_concat3 ("::", $2->left.sval.ptr, NULL), + $2->right.params); + } +; + +identifier_path_for_expr: + IDENT + { $$ = ast_path ($1, NULL); } +| identifier_path_for_expr COLONCOLON IDENT + { + $$ = ast_path (rust_concat3 ($1->left.sval.ptr, "::", + $3.ptr), + NULL); + } +| identifier_path_for_expr COLONCOLON '<' type_list '>' + { $$ = ast_path ($1->left.sval, $4); } +| identifier_path_for_expr COLONCOLON '<' type_list RSH + { + $$ = ast_path ($1->left.sval, $4); + rust_push_back ('>'); + } +; + +path_for_type: + identifier_path_for_type +| KW_SELF COLONCOLON identifier_path_for_type + { $$ = super_name ($3, 0); } +| maybe_self_path super_path identifier_path_for_type + { $$ = super_name ($3, $2); } +| COLONCOLON identifier_path_for_type + { $$ = crate_name ($2); } +| KW_EXTERN identifier_path_for_type + { + /* This is a gdb extension to make it possible to + refer to items in other crates. It just bypasses + adding the current crate to the front of the + name. */ + $$ = ast_path (rust_concat3 ("::", $2->left.sval.ptr, NULL), + $2->right.params); + } +; + +just_identifiers_for_type: + IDENT + { $$ = ast_path ($1, NULL); } +| just_identifiers_for_type COLONCOLON IDENT + { + $$ = ast_path (rust_concat3 ($1->left.sval.ptr, "::", + $3.ptr), + NULL); + } +; + +identifier_path_for_type: + just_identifiers_for_type +| just_identifiers_for_type '<' type_list '>' + { $$ = ast_path ($1->left.sval, $3); } +| just_identifiers_for_type '<' type_list RSH + { + $$ = ast_path ($1->left.sval, $3); + rust_push_back ('>'); + } +; + +type: + path_for_type +| '[' type ';' INTEGER ']' + { $$ = ast_array_type ($2, $4); } +| '[' type ';' DECIMAL_INTEGER ']' + { $$ = ast_array_type ($2, $4); } +| '&' '[' type ']' + { $$ = ast_slice_type ($3); } +| '&' type + { $$ = ast_reference_type ($2); } +| '*' KW_MUT type + { $$ = ast_pointer_type ($3, 1); } +| '*' KW_CONST type + { $$ = ast_pointer_type ($3, 0); } +| KW_FN '(' maybe_type_list ')' ARROW type + { $$ = ast_function_type ($6, $3); } +| '(' maybe_type_list ')' + { $$ = ast_tuple_type ($2); } +; + +maybe_type_list: + /* %empty */ + { $$ = NULL; } +| type_list + { $$ = $1; } +; + +type_list: + type + { + VEC (rust_op_ptr) **result + = OBSTACK_ZALLOC (&work_obstack, VEC (rust_op_ptr) *); + + make_cleanup (VEC_cleanup (rust_op_ptr), result); + VEC_safe_push (rust_op_ptr, *result, $1); + $$ = result; + } +| type_list ',' type + { + VEC_safe_push (rust_op_ptr, *$1, $3); + $$ = $1; + } +; + +%% + +/* A struct of this type is used to describe a token. */ + +struct token_info +{ + const char *name; + int value; + enum exp_opcode opcode; +}; + +/* Identifier tokens. */ + +static const struct token_info identifier_tokens[] = +{ + { "as", KW_AS, OP_NULL }, + { "false", KW_FALSE, OP_NULL }, + { "if", 0, OP_NULL }, + { "mut", KW_MUT, OP_NULL }, + { "const", KW_CONST, OP_NULL }, + { "self", KW_SELF, OP_NULL }, + { "super", KW_SUPER, OP_NULL }, + { "true", KW_TRUE, OP_NULL }, + { "extern", KW_EXTERN, OP_NULL }, + { "fn", KW_FN, OP_NULL }, +}; + +/* Operator tokens, sorted longest first. */ + +static const struct token_info operator_tokens[] = +{ + { ">>=", COMPOUND_ASSIGN, BINOP_RSH }, + { "<<=", COMPOUND_ASSIGN, BINOP_LSH }, + + { "<<", LSH, OP_NULL }, + { ">>", RSH, OP_NULL }, + { "&&", ANDAND, OP_NULL }, + { "||", OROR, OP_NULL }, + { "==", EQEQ, OP_NULL }, + { "!=", NOTEQ, OP_NULL }, + { "<=", LTEQ, OP_NULL }, + { ">=", GTEQ, OP_NULL }, + { "+=", COMPOUND_ASSIGN, BINOP_ADD }, + { "-=", COMPOUND_ASSIGN, BINOP_SUB }, + { "*=", COMPOUND_ASSIGN, BINOP_MUL }, + { "/=", COMPOUND_ASSIGN, BINOP_DIV }, + { "%=", COMPOUND_ASSIGN, BINOP_REM }, + { "&=", COMPOUND_ASSIGN, BINOP_BITWISE_AND }, + { "|=", COMPOUND_ASSIGN, BINOP_BITWISE_IOR }, + { "^=", COMPOUND_ASSIGN, BINOP_BITWISE_XOR }, + + { "::", COLONCOLON, OP_NULL }, + { "..", DOTDOT, OP_NULL }, + { "->", ARROW, OP_NULL } +}; + +/* Helper function to copy to the name obstack. */ + +static const char * +rust_copy_name (const char *name, int len) +{ + return (const char *) obstack_copy0 (&work_obstack, name, len); +} + +/* Helper function to make an stoken from a C string. */ + +static struct stoken +make_stoken (const char *p) +{ + struct stoken result; + + result.ptr = p; + result.length = strlen (result.ptr); + return result; +} + +/* Helper function to concatenate three strings on the name + obstack. */ + +static struct stoken +rust_concat3 (const char *s1, const char *s2, const char *s3) +{ + return make_stoken (obconcat (&work_obstack, s1, s2, s3, (char *) NULL)); +} + +/* Return an AST node referring to NAME, but relative to the crate's + name. */ + +static const struct rust_op * +crate_name (const struct rust_op *name) +{ + char *crate = rust_crate_for_block (expression_context_block); + struct stoken result; + + gdb_assert (name->opcode == OP_VAR_VALUE); + + if (crate == NULL) + error (_("Could not find crate for current location")); + result = make_stoken (obconcat (&work_obstack, "::", crate, "::", + name->left.sval.ptr, (char *) NULL)); + xfree (crate); + + return ast_path (result, name->right.params); +} + +/* Create an AST node referring to a "super::" qualified name. IDENT + is the base name and N_SUPERS is how many "super::"s were + provided. N_SUPERS can be zero. */ + +static const struct rust_op * +super_name (const struct rust_op *ident, unsigned int n_supers) +{ + const char *scope = block_scope (expression_context_block); + int offset; + + gdb_assert (ident->opcode == OP_VAR_VALUE); + + if (scope[0] == '\0') + error (_("Couldn't find namespace scope for self::")); + + if (n_supers > 0) + { + int i; + int len; + VEC (int) *offsets = NULL; + unsigned int current_len, previous_len; + struct cleanup *cleanup; + + cleanup = make_cleanup (VEC_cleanup (int), &offsets); + current_len = cp_find_first_component (scope); + previous_len = 0; + while (scope[current_len] != '\0') + { + VEC_safe_push (int, offsets, current_len); + gdb_assert (scope[current_len] == ':'); + previous_len = current_len; + /* The "::". */ + current_len += 2; + current_len += cp_find_first_component (scope + + current_len); + } + + len = VEC_length (int, offsets); + if (n_supers >= len) + error (_("Too many super:: uses from '%s'"), scope); + + offset = VEC_index (int, offsets, len - n_supers); + + do_cleanups (cleanup); + } + else + offset = strlen (scope); + + obstack_grow (&work_obstack, "::", 2); + obstack_grow (&work_obstack, scope, offset); + obstack_grow (&work_obstack, "::", 2); + obstack_grow0 (&work_obstack, ident->left.sval.ptr, ident->left.sval.length); + + return ast_path (make_stoken ((const char *) obstack_finish (&work_obstack)), + ident->right.params); +} + +/* A helper that updates innermost_block as appropriate. */ + +static void +update_innermost_block (struct block_symbol sym) +{ + if (symbol_read_needs_frame (sym.symbol) + && (innermost_block == NULL + || contained_in (sym.block, innermost_block))) + innermost_block = sym.block; +} + +/* A helper to look up a Rust type, or fail. This only works for + types defined by rust_language_arch_info. */ + +static struct type * +rust_type (const char *name) +{ + struct type *type; + + /* When unit testing, we don't bother checking the types, so avoid a + possibly-failing lookup here. */ + if (unit_testing) + return NULL; + + type = language_lookup_primitive_type (parse_language (pstate), + parse_gdbarch (pstate), + name); + if (type == NULL) + error (_("Could not find Rust type %s"), name); + return type; +} + +/* Lex a hex number with at least MIN digits and at most MAX + digits. */ + +static uint32_t +lex_hex (int min, int max) +{ + uint32_t result = 0; + int len = 0; + /* We only want to stop at MAX if we're lexing a byte escape. */ + int check_max = min == max; + + while ((check_max ? len <= max : 1) + && ((lexptr[0] >= 'a' && lexptr[0] <= 'f') + || (lexptr[0] >= 'A' && lexptr[0] <= 'F') + || (lexptr[0] >= '0' && lexptr[0] <= '9'))) + { + result *= 16; + if (lexptr[0] >= 'a' && lexptr[0] <= 'f') + result = result + 10 + lexptr[0] - 'a'; + else if (lexptr[0] >= 'A' && lexptr[0] <= 'F') + result = result + 10 + lexptr[0] - 'A'; + else + result = result + lexptr[0] - '0'; + ++lexptr; + ++len; + } + + if (len < min) + error (_("Not enough hex digits seen")); + if (len > max) + { + gdb_assert (min != max); + error (_("Overlong hex escape")); + } + + return result; +} + +/* Lex an escape. IS_BYTE is true if we're lexing a byte escape; + otherwise we're lexing a character escape. */ + +static uint32_t +lex_escape (int is_byte) +{ + uint32_t result; + + gdb_assert (lexptr[0] == '\\'); + ++lexptr; + switch (lexptr[0]) + { + case 'x': + ++lexptr; + result = lex_hex (2, 2); + break; + + case 'u': + if (is_byte) + error (_("Unicode escape in byte literal")); + ++lexptr; + if (lexptr[0] != '{') + error (_("Missing '{' in Unicode escape")); + ++lexptr; + result = lex_hex (1, 6); + /* Could do range checks here. */ + if (lexptr[0] != '}') + error (_("Missing '}' in Unicode escape")); + ++lexptr; + break; + + case 'n': + result = '\n'; + ++lexptr; + break; + case 'r': + result = '\r'; + ++lexptr; + break; + case 't': + result = '\t'; + ++lexptr; + break; + case '\\': + result = '\\'; + ++lexptr; + break; + case '0': + result = '\0'; + ++lexptr; + break; + case '\'': + result = '\''; + ++lexptr; + break; + case '"': + result = '"'; + ++lexptr; + break; + + default: + error (_("Invalid escape \\%c in literal"), lexptr[0]); + } + + return result; +} + +/* Lex a character constant. */ + +static int +lex_character (void) +{ + int is_byte = 0; + uint32_t value; + + if (lexptr[0] == 'b') + { + is_byte = 1; + ++lexptr; + } + gdb_assert (lexptr[0] == '\''); + ++lexptr; + /* This should handle UTF-8 here. */ + if (lexptr[0] == '\\') + value = lex_escape (is_byte); + else + { + value = lexptr[0] & 0xff; + ++lexptr; + } + + if (lexptr[0] != '\'') + error (_("Unterminated character literal")); + ++lexptr; + + rustyylval.typed_val_int.val = value; + rustyylval.typed_val_int.type = rust_type (is_byte ? "u8" : "char"); + + return INTEGER; +} + +/* Return the offset of the double quote if STR looks like the start + of a raw string, or 0 if STR does not start a raw string. */ + +static int +starts_raw_string (const char *str) +{ + const char *save = str; + + if (str[0] != 'r') + return 0; + ++str; + while (str[0] == '#') + ++str; + if (str[0] == '"') + return str - save; + return 0; +} + +/* Return true if STR looks like the end of a raw string that had N + hashes at the start. */ + +static int +ends_raw_string (const char *str, int n) +{ + int i; + + gdb_assert (str[0] == '"'); + for (i = 0; i < n; ++i) + if (str[i + 1] != '#') + return 0; + return 1; +} + +/* Lex a string constant. */ + +static int +lex_string (void) +{ + int is_byte = lexptr[0] == 'b'; + int raw_length; + int len_in_chars = 0; + + if (is_byte) + ++lexptr; + raw_length = starts_raw_string (lexptr); + lexptr += raw_length; + gdb_assert (lexptr[0] == '"'); + ++lexptr; + + while (1) + { + uint32_t value; + + if (raw_length > 0) + { + if (lexptr[0] == '"' && ends_raw_string (lexptr, raw_length - 1)) + { + /* Exit with lexptr pointing after the final "#". */ + lexptr += raw_length; + break; + } + else if (lexptr[0] == '\0') + error (_("Unexpected EOF in string")); + + value = lexptr[0] & 0xff; + if (is_byte && value > 127) + error (_("Non-ASCII value in raw byte string")); + obstack_1grow (&work_obstack, value); + + ++lexptr; + } + else if (lexptr[0] == '"') + { + /* Make sure to skip the quote. */ + ++lexptr; + break; + } + else if (lexptr[0] == '\\') + { + value = lex_escape (is_byte); + + if (is_byte) + obstack_1grow (&work_obstack, value); + else + convert_between_encodings ("UTF-32", "UTF-8", (gdb_byte *) &value, + sizeof (value), sizeof (value), + &work_obstack, translit_none); + } + else if (lexptr[0] == '\0') + error (_("Unexpected EOF in string")); + else + { + value = lexptr[0] & 0xff; + if (is_byte && value > 127) + error (_("Non-ASCII value in byte string")); + obstack_1grow (&work_obstack, value); + ++lexptr; + } + } + + rustyylval.sval.length = obstack_object_size (&work_obstack); + rustyylval.sval.ptr = (const char *) obstack_finish (&work_obstack); + return is_byte ? BYTESTRING : STRING; +} + +/* Return true if STRING starts with whitespace followed by a digit. */ + +static int +space_then_number (const char *string) +{ + const char *p = string; + + while (p[0] == ' ' || p[0] == '\t') + ++p; + if (p == string) + return 0; + + return *p >= '0' && *p <= '9'; +} + +/* Return true if C can start an identifier. */ + +static int +rust_identifier_start_p (char c) +{ + return ((c >= 'a' && c <= 'z') + || (c >= 'A' && c <= 'Z') + || c == '_' + || c == '$'); +} + +/* Lex an identifier. */ + +static int +lex_identifier (void) +{ + const char *start = lexptr; + unsigned int length; + const struct token_info *token; + int i; + int is_gdb_var = lexptr[0] == '$'; + + gdb_assert (rust_identifier_start_p (lexptr[0])); + + ++lexptr; + + /* For the time being this doesn't handle Unicode rules. Non-ASCII + identifiers are gated anyway. */ + while ((lexptr[0] >= 'a' && lexptr[0] <= 'z') + || (lexptr[0] >= 'A' && lexptr[0] <= 'Z') + || lexptr[0] == '_' + || (is_gdb_var && lexptr[0] == '$') + || (lexptr[0] >= '0' && lexptr[0] <= '9')) + ++lexptr; + + + length = lexptr - start; + token = NULL; + for (i = 0; i < ARRAY_SIZE (identifier_tokens); ++i) + { + if (length == strlen (identifier_tokens[i].name) + && strncmp (identifier_tokens[i].name, start, length) == 0) + { + token = &identifier_tokens[i]; + break; + } + } + + if (token != NULL) + { + if (token->value == 0) + { + /* Leave the terminating token alone. */ + lexptr = start; + return 0; + } + } + else if (token == NULL + && (strncmp (start, "thread", length) == 0 + || strncmp (start, "task", length) == 0) + && space_then_number (lexptr)) + { + /* "task" or "thread" followed by a number terminates the + parse, per gdb rules. */ + lexptr = start; + return 0; + } + + if (token == NULL || (parse_completion && lexptr[0] == '\0')) + rustyylval.sval = make_stoken (rust_copy_name (start, length)); + + if (parse_completion && lexptr[0] == '\0') + { + /* Prevent rustyylex from returning two COMPLETE tokens. */ + prev_lexptr = lexptr; + return COMPLETE; + } + + if (token != NULL) + return token->value; + if (is_gdb_var) + return GDBVAR; + return IDENT; +} + +/* Lex an operator. */ + +static int +lex_operator (void) +{ + const struct token_info *token = NULL; + int i; + + for (i = 0; i < ARRAY_SIZE (operator_tokens); ++i) + { + if (strncmp (operator_tokens[i].name, lexptr, + strlen (operator_tokens[i].name)) == 0) + { + lexptr += strlen (operator_tokens[i].name); + token = &operator_tokens[i]; + break; + } + } + + if (token != NULL) + { + rustyylval.opcode = token->opcode; + return token->value; + } + + return *lexptr++; +} + +/* Lex a number. */ + +static int +lex_number (void) +{ + regmatch_t subexps[NUM_SUBEXPRESSIONS]; + int match; + int is_integer = 0; + int could_be_decimal = 1; + char *type_name = NULL; + struct type *type; + int end_index; + int type_index = -1; + int i, out; + char *number; + struct cleanup *cleanup = make_cleanup (null_cleanup, NULL); + + match = regexec (&number_regex, lexptr, ARRAY_SIZE (subexps), subexps, 0); + /* Failure means the regexp is broken. */ + gdb_assert (match == 0); + + if (subexps[INT_TEXT].rm_so != -1) + { + /* Integer part matched. */ + is_integer = 1; + end_index = subexps[INT_TEXT].rm_eo; + if (subexps[INT_TYPE].rm_so == -1) + type_name = "i32"; + else + { + type_index = INT_TYPE; + could_be_decimal = 0; + } + } + else if (subexps[FLOAT_TYPE1].rm_so != -1) + { + /* Found floating point type suffix. */ + end_index = subexps[FLOAT_TYPE1].rm_so; + type_index = FLOAT_TYPE1; + } + else if (subexps[FLOAT_TYPE2].rm_so != -1) + { + /* Found floating point type suffix. */ + end_index = subexps[FLOAT_TYPE2].rm_so; + type_index = FLOAT_TYPE2; + } + else + { + /* Any other floating point match. */ + end_index = subexps[0].rm_eo; + type_name = "f64"; + } + + /* We need a special case if the final character is ".". In this + case we might need to parse an integer. For example, "23.f()" is + a request for a trait method call, not a syntax error involving + the floating point number "23.". */ + gdb_assert (subexps[0].rm_eo > 0); + if (lexptr[subexps[0].rm_eo - 1] == '.') + { + const char *next = skip_spaces_const (&lexptr[subexps[0].rm_eo]); + + if (rust_identifier_start_p (*next) || *next == '.') + { + --subexps[0].rm_eo; + is_integer = 1; + end_index = subexps[0].rm_eo; + type_name = "i32"; + could_be_decimal = 1; + } + } + + /* Compute the type name if we haven't already. */ + if (type_name == NULL) + { + gdb_assert (type_index != -1); + type_name = xstrndup (lexptr + subexps[type_index].rm_so, + (subexps[type_index].rm_eo + - subexps[type_index].rm_so)); + make_cleanup (xfree, type_name); + } + + /* Look up the type. */ + type = rust_type (type_name); + + /* Copy the text of the number and remove the "_"s. */ + number = xstrndup (lexptr, end_index); + make_cleanup (xfree, number); + for (i = out = 0; number[i]; ++i) + { + if (number[i] == '_') + could_be_decimal = 0; + else + number[out++] = number[i]; + } + number[out] = '\0'; + + /* Advance past the match. */ + lexptr += subexps[0].rm_eo; + + /* Parse the number. */ + if (is_integer) + { + int radix = 10; + if (number[0] == '0') + { + if (number[1] == 'x') + radix = 16; + else if (number[1] == 'o') + radix = 8; + else if (number[1] == 'b') + radix = 2; + if (radix != 10) + { + number += 2; + could_be_decimal = 0; + } + } + rustyylval.typed_val_int.val = strtoul (number, NULL, radix); + rustyylval.typed_val_int.type = type; + } + else + { + rustyylval.typed_val_float.dval = strtod (number, NULL); + rustyylval.typed_val_float.type = type; + } + + do_cleanups (cleanup); + return is_integer ? (could_be_decimal ? DECIMAL_INTEGER : INTEGER) : FLOAT; +} + +/* The lexer. */ + +static int +rustyylex (void) +{ + /* Skip all leading whitespace. */ + while (lexptr[0] == ' ' || lexptr[0] == '\t' || lexptr[0] == '\r' + || lexptr[0] == '\n') + ++lexptr; + + /* If we hit EOF and we're completing, then return COMPLETE -- maybe + we're completing an empty string at the end of a field_expr. + But, we don't want to return two COMPLETE tokens in a row. */ + if (lexptr[0] == '\0' && lexptr == prev_lexptr) + return 0; + prev_lexptr = lexptr; + if (lexptr[0] == '\0') + { + if (parse_completion) + { + rustyylval.sval = make_stoken (""); + return COMPLETE; + } + return 0; + } + + if (lexptr[0] >= '0' && lexptr[0] <= '9') + return lex_number (); + else if (lexptr[0] == 'b' && lexptr[1] == '\'') + return lex_character (); + else if (lexptr[0] == 'b' && lexptr[1] == '"') + return lex_string (); + else if (lexptr[0] == 'b' && starts_raw_string (lexptr + 1)) + return lex_string (); + else if (starts_raw_string (lexptr)) + return lex_string (); + else if (rust_identifier_start_p (lexptr[0])) + return lex_identifier (); + else if (lexptr[0] == '"') + return lex_string (); + else if (lexptr[0] == '\'') + return lex_character (); + else if (lexptr[0] == '}' || lexptr[0] == ']') + { + /* Falls through to lex_operator. */ + --paren_depth; + } + else if (lexptr[0] == '(' || lexptr[0] == '{') + { + /* Falls through to lex_operator. */ + ++paren_depth; + } + else if (lexptr[0] == ',' && comma_terminates && paren_depth == 0) + return 0; + + return lex_operator (); +} + +/* Push back a single character to be re-lexed. */ + +static void +rust_push_back (char c) +{ + /* Can't be called before any lexing. */ + gdb_assert (prev_lexptr != NULL); + + --lexptr; + gdb_assert (*lexptr == c); +} + + + +/* Make an arbitrary operation and fill in the fields. */ + +static const struct rust_op * +ast_operation (enum exp_opcode opcode, const struct rust_op *left, + const struct rust_op *right) +{ + struct rust_op *result = OBSTACK_ZALLOC (&work_obstack, struct rust_op); + + result->opcode = opcode; + result->left.op = left; + result->right.op = right; + + return result; +} + +/* Make a compound assignment operation. */ + +static const struct rust_op * +ast_compound_assignment (enum exp_opcode opcode, const struct rust_op *left, + const struct rust_op *right) +{ + struct rust_op *result = OBSTACK_ZALLOC (&work_obstack, struct rust_op); + + result->opcode = opcode; + result->compound_assignment = 1; + result->left.op = left; + result->right.op = right; + + return result; +} + +/* Make a typed integer literal operation. */ + +static const struct rust_op * +ast_literal (struct typed_val_int val) +{ + struct rust_op *result = OBSTACK_ZALLOC (&work_obstack, struct rust_op); + + result->opcode = OP_LONG; + result->left.typed_val_int = val; + + return result; +} + +/* Make a typed floating point literal operation. */ + +static const struct rust_op * +ast_dliteral (struct typed_val_float val) +{ + struct rust_op *result = OBSTACK_ZALLOC (&work_obstack, struct rust_op); + + result->opcode = OP_DOUBLE; + result->left.typed_val_float = val; + + return result; +} + +/* Make a unary operation. */ + +static const struct rust_op * +ast_unary (enum exp_opcode opcode, const struct rust_op *expr) +{ + return ast_operation (opcode, expr, NULL); +} + +/* Make a cast operation. */ + +static const struct rust_op * +ast_cast (const struct rust_op *expr, const struct rust_op *type) +{ + struct rust_op *result = OBSTACK_ZALLOC (&work_obstack, struct rust_op); + + result->opcode = UNOP_CAST; + result->left.op = expr; + result->right.op = type; + + return result; +} + +/* Make a call-like operation. This is nominally a function call, but + when lowering we may discover that it actually represents the + creation of a tuple struct. */ + +static const struct rust_op * +ast_call_ish (enum exp_opcode opcode, const struct rust_op *expr, + VEC (rust_op_ptr) **params) +{ + struct rust_op *result = OBSTACK_ZALLOC (&work_obstack, struct rust_op); + + result->opcode = opcode; + result->left.op = expr; + result->right.params = params; + + return result; +} + +/* Make a structure creation operation. */ + +static const struct rust_op * +ast_struct (const struct rust_op *name, VEC (set_field) **fields) +{ + struct rust_op *result = OBSTACK_ZALLOC (&work_obstack, struct rust_op); + + result->opcode = OP_AGGREGATE; + result->left.op = name; + result->right.field_inits = fields; + + return result; +} + +/* Make an identifier path. */ + +static const struct rust_op * +ast_path (struct stoken path, VEC (rust_op_ptr) **params) +{ + struct rust_op *result = OBSTACK_ZALLOC (&work_obstack, struct rust_op); + + result->opcode = OP_VAR_VALUE; + result->left.sval = path; + result->right.params = params; + + return result; +} + +/* Make a string constant operation. */ + +static const struct rust_op * +ast_string (struct stoken str) +{ + struct rust_op *result = OBSTACK_ZALLOC (&work_obstack, struct rust_op); + + result->opcode = OP_STRING; + result->left.sval = str; + + return result; +} + +/* Make a field expression. */ + +static const struct rust_op * +ast_structop (const struct rust_op *left, const char *name, int completing) +{ + struct rust_op *result = OBSTACK_ZALLOC (&work_obstack, struct rust_op); + + result->opcode = STRUCTOP_STRUCT; + result->completing = completing; + result->left.op = left; + result->right.sval = make_stoken (name); + + return result; +} + +/* Make an anonymous struct operation, like 'x.0'. */ + +static const struct rust_op * +ast_structop_anonymous (const struct rust_op *left, + struct typed_val_int number) +{ + struct rust_op *result = OBSTACK_ZALLOC (&work_obstack, struct rust_op); + + result->opcode = STRUCTOP_ANONYMOUS; + result->left.op = left; + result->right.typed_val_int = number; + + return result; +} + +/* Make a range operation. */ + +static const struct rust_op * +ast_range (const struct rust_op *lhs, const struct rust_op *rhs) +{ + struct rust_op *result = OBSTACK_ZALLOC (&work_obstack, struct rust_op); + + result->opcode = OP_F90_RANGE; + result->left.op = lhs; + result->right.op = rhs; + + return result; +} + +/* A helper function to make a type-related AST node. */ + +static struct rust_op * +ast_basic_type (enum type_code typecode) +{ + struct rust_op *result = OBSTACK_ZALLOC (&work_obstack, struct rust_op); + + result->opcode = OP_TYPE; + result->typecode = typecode; + return result; +} + +/* Create an AST node describing an array type. */ + +static const struct rust_op * +ast_array_type (const struct rust_op *lhs, struct typed_val_int val) +{ + struct rust_op *result = ast_basic_type (TYPE_CODE_ARRAY); + + result->left.op = lhs; + result->right.typed_val_int = val; + return result; +} + +/* Create an AST node describing a reference type. */ + +static const struct rust_op * +ast_slice_type (const struct rust_op *type) +{ + /* Use TYPE_CODE_COMPLEX just because it is handy. */ + struct rust_op *result = ast_basic_type (TYPE_CODE_COMPLEX); + + result->left.op = type; + return result; +} + +/* Create an AST node describing a reference type. */ + +static const struct rust_op * +ast_reference_type (const struct rust_op *type) +{ + struct rust_op *result = ast_basic_type (TYPE_CODE_REF); + + result->left.op = type; + return result; +} + +/* Create an AST node describing a pointer type. */ + +static const struct rust_op * +ast_pointer_type (const struct rust_op *type, int is_mut) +{ + struct rust_op *result = ast_basic_type (TYPE_CODE_PTR); + + result->left.op = type; + /* For the time being we ignore is_mut. */ + return result; +} + +/* Create an AST node describing a function type. */ + +static const struct rust_op * +ast_function_type (const struct rust_op *rtype, VEC (rust_op_ptr) **params) +{ + struct rust_op *result = ast_basic_type (TYPE_CODE_FUNC); + + result->left.op = rtype; + result->right.params = params; + return result; +} + +/* Create an AST node describing a tuple type. */ + +static const struct rust_op * +ast_tuple_type (VEC (rust_op_ptr) **params) +{ + struct rust_op *result = ast_basic_type (TYPE_CODE_STRUCT); + + result->left.params = params; + return result; +} + +/* A helper to appropriately munge NAME and BLOCK depending on the + presence of a leading "::". */ + +static void +munge_name_and_block (const char **name, const struct block **block) +{ + /* If it is a global reference, skip the current block in favor of + the static block. */ + if (strncmp (*name, "::", 2) == 0) + { + *name += 2; + *block = block_static_block (*block); + } +} + +/* Like lookup_symbol, but handles Rust namespace conventions, and + doesn't require field_of_this_result. */ + +static struct block_symbol +rust_lookup_symbol (const char *name, const struct block *block, + const domain_enum domain) +{ + struct block_symbol result; + + munge_name_and_block (&name, &block); + + result = lookup_symbol (name, block, domain, NULL); + if (result.symbol != NULL) + update_innermost_block (result); + return result; +} + +/* Look up a type, following Rust namespace conventions. */ + +static struct type * +rust_lookup_type (const char *name, const struct block *block) +{ + struct block_symbol result; + struct type *type; + + munge_name_and_block (&name, &block); + + result = lookup_symbol (name, block, STRUCT_DOMAIN, NULL); + if (result.symbol != NULL) + { + update_innermost_block (result); + return SYMBOL_TYPE (result.symbol); + } + + type = lookup_typename (parse_language (pstate), parse_gdbarch (pstate), + name, NULL, 1); + if (type != NULL) + return type; + + /* Last chance, try a built-in type. */ + return language_lookup_primitive_type (parse_language (pstate), + parse_gdbarch (pstate), + name); +} + +static struct type *convert_ast_to_type (struct parser_state *state, + const struct rust_op *operation); +static const char *convert_name (struct parser_state *state, + const struct rust_op *operation); + +/* Convert a vector of rust_ops representing types to a vector of + types. */ + +static VEC (type_ptr) * +convert_params_to_types (struct parser_state *state, VEC (rust_op_ptr) *params) +{ + int i; + const struct rust_op *op; + VEC (type_ptr) *result = NULL; + struct cleanup *cleanup = make_cleanup (VEC_cleanup (type_ptr), &result); + + for (i = 0; VEC_iterate (rust_op_ptr, params, i, op); ++i) + VEC_safe_push (type_ptr, result, convert_ast_to_type (state, op)); + + discard_cleanups (cleanup); + return result; +} + +/* Convert a rust_op representing a type to a struct type *. */ + +static struct type * +convert_ast_to_type (struct parser_state *state, + const struct rust_op *operation) +{ + struct type *type, *result = NULL; + + if (operation->opcode == OP_VAR_VALUE) + { + const char *varname = convert_name (state, operation); + + result = rust_lookup_type (varname, expression_context_block); + if (result == NULL) + error (_("No typed name '%s' in current context"), varname); + return result; + } + + gdb_assert (operation->opcode == OP_TYPE); + + switch (operation->typecode) + { + case TYPE_CODE_ARRAY: + type = convert_ast_to_type (state, operation->left.op); + if (operation->right.typed_val_int.val < 0) + error (_("Negative array length")); + result = lookup_array_range_type (type, 0, + operation->right.typed_val_int.val - 1); + break; + + case TYPE_CODE_COMPLEX: + { + struct type *usize = rust_type ("usize"); + + type = convert_ast_to_type (state, operation->left.op); + result = rust_slice_type ("&[*gdb*]", type, usize); + } + break; + + case TYPE_CODE_REF: + case TYPE_CODE_PTR: + /* For now we treat &x and *x identically. */ + type = convert_ast_to_type (state, operation->left.op); + result = lookup_pointer_type (type); + break; + + case TYPE_CODE_FUNC: + { + VEC (type_ptr) *args + = convert_params_to_types (state, *operation->right.params); + struct cleanup *cleanup + = make_cleanup (VEC_cleanup (type_ptr), &args); + struct type **argtypes = NULL; + + type = convert_ast_to_type (state, operation->left.op); + if (!VEC_empty (type_ptr, args)) + argtypes = VEC_address (type_ptr, args); + + result + = lookup_function_type_with_arguments (type, + VEC_length (type_ptr, args), + argtypes); + result = lookup_pointer_type (result); + + do_cleanups (cleanup); + } + break; + + case TYPE_CODE_STRUCT: + { + VEC (type_ptr) *args + = convert_params_to_types (state, *operation->left.params); + struct cleanup *cleanup + = make_cleanup (VEC_cleanup (type_ptr), &args); + int i; + struct type *type; + const char *name; + + obstack_1grow (&work_obstack, '('); + for (i = 0; VEC_iterate (type_ptr, args, i, type); ++i) + { + char *type_name = type_to_string (type); + + if (i > 0) + obstack_1grow (&work_obstack, ','); + obstack_grow_str (&work_obstack, type_name); + + xfree (type_name); + } + + obstack_grow_str0 (&work_obstack, ")"); + name = (const char *) obstack_finish (&work_obstack); + + /* We don't allow creating new tuple types (yet), but we do + allow looking up existing tuple types. */ + result = rust_lookup_type (name, expression_context_block); + if (result == NULL) + error (_("could not find tuple type '%s'"), name); + + do_cleanups (cleanup); + } + break; + + default: + gdb_assert_not_reached ("unhandled opcode in convert_ast_to_type"); + } + + gdb_assert (result != NULL); + return result; +} + +/* A helper function to turn a rust_op representing a name into a full + name. This applies generic arguments as needed. The returned name + is allocated on the work obstack. */ + +static const char * +convert_name (struct parser_state *state, const struct rust_op *operation) +{ + VEC (type_ptr) *types; + struct cleanup *cleanup; + int i; + struct type *type; + + gdb_assert (operation->opcode == OP_VAR_VALUE); + + if (operation->right.params == NULL) + return operation->left.sval.ptr; + + types = convert_params_to_types (state, *operation->right.params); + cleanup = make_cleanup (VEC_cleanup (type_ptr), &types); + + obstack_grow_str (&work_obstack, operation->left.sval.ptr); + obstack_1grow (&work_obstack, '<'); + for (i = 0; VEC_iterate (type_ptr, types, i, type); ++i) + { + char *type_name = type_to_string (type); + + if (i > 0) + obstack_1grow (&work_obstack, ','); + + obstack_grow_str (&work_obstack, type_name); + xfree (type_name); + } + obstack_grow_str0 (&work_obstack, ">"); + + do_cleanups (cleanup); + + return (const char *) obstack_finish (&work_obstack); +} + +static void convert_ast_to_expression (struct parser_state *state, + const struct rust_op *operation, + const struct rust_op *top); + +/* A helper function that converts a vec of rust_ops to a gdb + expression. */ + +static void +convert_params_to_expression (struct parser_state *state, + VEC (rust_op_ptr) *params, + const struct rust_op *top) +{ + int i; + rust_op_ptr elem; + + for (i = 0; VEC_iterate (rust_op_ptr, params, i, elem); ++i) + convert_ast_to_expression (state, elem, top); +} + +/* Lower a rust_op to a gdb expression. STATE is the parser state. + OPERATION is the operation to lower. TOP is a pointer to the + top-most operation; it is used to handle the special case where the + top-most expression is an identifier and can be optionally lowered + to OP_TYPE. */ + +static void +convert_ast_to_expression (struct parser_state *state, + const struct rust_op *operation, + const struct rust_op *top) +{ + switch (operation->opcode) + { + case OP_LONG: + write_exp_elt_opcode (state, OP_LONG); + write_exp_elt_type (state, operation->left.typed_val_int.type); + write_exp_elt_longcst (state, operation->left.typed_val_int.val); + write_exp_elt_opcode (state, OP_LONG); + break; + + case OP_DOUBLE: + write_exp_elt_opcode (state, OP_DOUBLE); + write_exp_elt_type (state, operation->left.typed_val_float.type); + write_exp_elt_dblcst (state, operation->left.typed_val_float.dval); + write_exp_elt_opcode (state, OP_DOUBLE); + break; + + case STRUCTOP_STRUCT: + { + convert_ast_to_expression (state, operation->left.op, top); + + if (operation->completing) + mark_struct_expression (state); + write_exp_elt_opcode (state, STRUCTOP_STRUCT); + write_exp_string (state, operation->right.sval); + write_exp_elt_opcode (state, STRUCTOP_STRUCT); + } + break; + + case STRUCTOP_ANONYMOUS: + { + convert_ast_to_expression (state, operation->left.op, top); + + write_exp_elt_opcode (state, STRUCTOP_ANONYMOUS); + write_exp_elt_longcst (state, operation->right.typed_val_int.val); + write_exp_elt_opcode (state, STRUCTOP_ANONYMOUS); + } + break; + + case UNOP_PLUS: + case UNOP_NEG: + case UNOP_COMPLEMENT: + case UNOP_IND: + case UNOP_ADDR: + convert_ast_to_expression (state, operation->left.op, top); + write_exp_elt_opcode (state, operation->opcode); + break; + + case BINOP_SUBSCRIPT: + case BINOP_MUL: + case BINOP_REPEAT: + case BINOP_DIV: + case BINOP_REM: + case BINOP_LESS: + case BINOP_GTR: + case BINOP_BITWISE_AND: + case BINOP_BITWISE_IOR: + case BINOP_BITWISE_XOR: + case BINOP_ADD: + case BINOP_SUB: + case BINOP_LOGICAL_OR: + case BINOP_LOGICAL_AND: + case BINOP_EQUAL: + case BINOP_NOTEQUAL: + case BINOP_LEQ: + case BINOP_GEQ: + case BINOP_LSH: + case BINOP_RSH: + case BINOP_ASSIGN: + case OP_RUST_ARRAY: + convert_ast_to_expression (state, operation->left.op, top); + convert_ast_to_expression (state, operation->right.op, top); + if (operation->compound_assignment) + { + write_exp_elt_opcode (state, BINOP_ASSIGN_MODIFY); + write_exp_elt_opcode (state, operation->opcode); + write_exp_elt_opcode (state, BINOP_ASSIGN_MODIFY); + } + else + write_exp_elt_opcode (state, operation->opcode); + + if (operation->compound_assignment + || operation->opcode == BINOP_ASSIGN) + { + struct type *type; + + type = language_lookup_primitive_type (parse_language (state), + parse_gdbarch (state), + "()"); + + write_exp_elt_opcode (state, OP_LONG); + write_exp_elt_type (state, type); + write_exp_elt_longcst (state, 0); + write_exp_elt_opcode (state, OP_LONG); + + write_exp_elt_opcode (state, BINOP_COMMA); + } + break; + + case UNOP_CAST: + { + struct type *type = convert_ast_to_type (state, operation->right.op); + + convert_ast_to_expression (state, operation->left.op, top); + write_exp_elt_opcode (state, UNOP_CAST); + write_exp_elt_type (state, type); + write_exp_elt_opcode (state, UNOP_CAST); + } + break; + + case OP_FUNCALL: + { + if (operation->left.op->opcode == OP_VAR_VALUE) + { + struct type *type; + const char *varname = convert_name (state, operation->left.op); + + type = rust_lookup_type (varname, expression_context_block); + if (type != NULL) + { + /* This is actually a tuple struct expression, not a + call expression. */ + rust_op_ptr elem; + int i; + VEC (rust_op_ptr) *params = *operation->right.params; + + if (TYPE_CODE (type) != TYPE_CODE_NAMESPACE) + { + if (!rust_tuple_struct_type_p (type)) + error (_("Type %s is not a tuple struct"), varname); + + for (i = 0; + VEC_iterate (rust_op_ptr, params, i, elem); + ++i) + { + char *cell = get_print_cell (); + + xsnprintf (cell, PRINT_CELL_SIZE, "__%d", i); + write_exp_elt_opcode (state, OP_NAME); + write_exp_string (state, make_stoken (cell)); + write_exp_elt_opcode (state, OP_NAME); + + convert_ast_to_expression (state, elem, top); + } + + write_exp_elt_opcode (state, OP_AGGREGATE); + write_exp_elt_type (state, type); + write_exp_elt_longcst (state, + 2 * VEC_length (rust_op_ptr, + params)); + write_exp_elt_opcode (state, OP_AGGREGATE); + break; + } + } + } + convert_ast_to_expression (state, operation->left.op, top); + convert_params_to_expression (state, *operation->right.params, top); + write_exp_elt_opcode (state, OP_FUNCALL); + write_exp_elt_longcst (state, VEC_length (rust_op_ptr, + *operation->right.params)); + write_exp_elt_longcst (state, OP_FUNCALL); + } + break; + + case OP_ARRAY: + gdb_assert (operation->left.op == NULL); + convert_params_to_expression (state, *operation->right.params, top); + write_exp_elt_opcode (state, OP_ARRAY); + write_exp_elt_longcst (state, 0); + write_exp_elt_longcst (state, VEC_length (rust_op_ptr, + *operation->right.params) - 1); + write_exp_elt_longcst (state, OP_ARRAY); + break; + + case OP_VAR_VALUE: + { + struct block_symbol sym; + const char *varname; + + if (operation->left.sval.ptr[0] == '$') + { + write_dollar_variable (state, operation->left.sval); + break; + } + + varname = convert_name (state, operation); + sym = rust_lookup_symbol (varname, expression_context_block, + VAR_DOMAIN); + if (sym.symbol != NULL) + { + write_exp_elt_opcode (state, OP_VAR_VALUE); + write_exp_elt_block (state, sym.block); + write_exp_elt_sym (state, sym.symbol); + write_exp_elt_opcode (state, OP_VAR_VALUE); + } + else + { + struct type *type; + + type = rust_lookup_type (varname, expression_context_block); + if (type == NULL) + error (_("No symbol '%s' in current context"), varname); + + if (TYPE_CODE (type) == TYPE_CODE_STRUCT + && TYPE_NFIELDS (type) == 0) + { + /* A unit-like struct. */ + write_exp_elt_opcode (state, OP_AGGREGATE); + write_exp_elt_type (state, type); + write_exp_elt_longcst (state, 0); + write_exp_elt_opcode (state, OP_AGGREGATE); + } + else if (operation == top) + { + write_exp_elt_opcode (state, OP_TYPE); + write_exp_elt_type (state, type); + write_exp_elt_opcode (state, OP_TYPE); + break; + } + } + } + break; + + case OP_AGGREGATE: + { + int i; + int length; + struct set_field *init; + VEC (set_field) *fields = *operation->right.field_inits; + struct type *type; + const char *name; + + length = 0; + for (i = 0; VEC_iterate (set_field, fields, i, init); ++i) + { + if (init->name.ptr != NULL) + { + write_exp_elt_opcode (state, OP_NAME); + write_exp_string (state, init->name); + write_exp_elt_opcode (state, OP_NAME); + ++length; + } + + convert_ast_to_expression (state, init->init, top); + ++length; + + if (init->name.ptr == NULL) + { + /* This is handled differently from Ada in our + evaluator. */ + write_exp_elt_opcode (state, OP_OTHERS); + } + } + + name = convert_name (state, operation->left.op); + type = rust_lookup_type (name, expression_context_block); + if (type == NULL) + error (_("Could not find type '%s'"), operation->left.sval.ptr); + + if (TYPE_CODE (type) != TYPE_CODE_STRUCT + || rust_tuple_type_p (type) + || rust_tuple_struct_type_p (type)) + error (_("Struct expression applied to non-struct type")); + + write_exp_elt_opcode (state, OP_AGGREGATE); + write_exp_elt_type (state, type); + write_exp_elt_longcst (state, length); + write_exp_elt_opcode (state, OP_AGGREGATE); + } + break; + + case OP_STRING: + { + write_exp_elt_opcode (state, OP_STRING); + write_exp_string (state, operation->left.sval); + write_exp_elt_opcode (state, OP_STRING); + } + break; + + case OP_F90_RANGE: + { + enum f90_range_type kind = BOTH_BOUND_DEFAULT; + + if (operation->left.op != NULL) + { + convert_ast_to_expression (state, operation->left.op, top); + kind = HIGH_BOUND_DEFAULT; + } + if (operation->right.op != NULL) + { + convert_ast_to_expression (state, operation->right.op, top); + if (kind == BOTH_BOUND_DEFAULT) + kind = LOW_BOUND_DEFAULT; + else + { + gdb_assert (kind == HIGH_BOUND_DEFAULT); + kind = NONE_BOUND_DEFAULT; + } + } + write_exp_elt_opcode (state, OP_F90_RANGE); + write_exp_elt_longcst (state, kind); + write_exp_elt_opcode (state, OP_F90_RANGE); + } + break; + + default: + gdb_assert_not_reached ("unhandled opcode in convert_ast_to_expression"); + } +} + + + +/* The parser as exposed to gdb. */ + +int +rust_parse (struct parser_state *state) +{ + int result; + struct cleanup *cleanup; + + obstack_init (&work_obstack); + cleanup = make_cleanup_obstack_free (&work_obstack); + rust_ast = NULL; + + pstate = state; + result = rustyyparse (); + + if (!result || (parse_completion && rust_ast != NULL)) + { + const struct rust_op *ast = rust_ast; + + rust_ast = NULL; + gdb_assert (ast != NULL); + convert_ast_to_expression (state, ast, ast); + } + + do_cleanups (cleanup); + return result; +} + +/* The parser error handler. */ + +void +rustyyerror (char *msg) +{ + const char *where = prev_lexptr ? prev_lexptr : lexptr; + error (_("%s in expression, near `%s'."), (msg ? msg : "Error"), where); +} + + + +#if GDB_SELF_TEST + +/* Initialize the lexer for testing. */ + +static void +rust_lex_test_init (const char *input) +{ + prev_lexptr = NULL; + lexptr = input; + paren_depth = 0; +} + +/* A test helper that lexes a string, expecting a single token. It + returns the lexer data for this token. */ + +static RUSTSTYPE +rust_lex_test_one (const char *input, int expected) +{ + int token; + RUSTSTYPE result; + + rust_lex_test_init (input); + + token = rustyylex (); + SELF_CHECK (token == expected); + result = rustyylval; + + if (token) + { + token = rustyylex (); + SELF_CHECK (token == 0); + } + + return result; +} + +/* Test that INPUT lexes as the integer VALUE. */ + +static void +rust_lex_int_test (const char *input, int value, int kind) +{ + RUSTSTYPE result = rust_lex_test_one (input, kind); + SELF_CHECK (result.typed_val_int.val == value); +} + +/* Test that INPUT throws an exception with text ERR. */ + +static void +rust_lex_exception_test (const char *input, const char *err) +{ + TRY + { + /* The "kind" doesn't matter. */ + rust_lex_test_one (input, DECIMAL_INTEGER); + SELF_CHECK (0); + } + CATCH (except, RETURN_MASK_ERROR) + { + SELF_CHECK (strcmp (except.message, err) == 0); + } + END_CATCH +} + +/* Test that INPUT lexes as the identifier, string, or byte-string + VALUE. KIND holds the expected token kind. */ + +static void +rust_lex_stringish_test (const char *input, const char *value, int kind) +{ + RUSTSTYPE result = rust_lex_test_one (input, kind); + SELF_CHECK (result.sval.length == strlen (value)); + SELF_CHECK (strncmp (result.sval.ptr, value, result.sval.length) == 0); +} + +/* Helper to test that a string parses as a given token sequence. */ + +static void +rust_lex_test_sequence (const char *input, int len, const int expected[]) +{ + int i; + + lexptr = input; + paren_depth = 0; + + for (i = 0; i < len; ++i) + { + int token = rustyylex (); + + SELF_CHECK (token == expected[i]); + } +} + +/* Tests for an integer-parsing corner case. */ + +static void +rust_lex_test_trailing_dot (void) +{ + const int expected1[] = { DECIMAL_INTEGER, '.', IDENT, '(', ')', 0 }; + const int expected2[] = { INTEGER, '.', IDENT, '(', ')', 0 }; + const int expected3[] = { FLOAT, EQEQ, '(', ')', 0 }; + const int expected4[] = { DECIMAL_INTEGER, DOTDOT, DECIMAL_INTEGER, 0 }; + + rust_lex_test_sequence ("23.g()", ARRAY_SIZE (expected1), expected1); + rust_lex_test_sequence ("23_0.g()", ARRAY_SIZE (expected2), expected2); + rust_lex_test_sequence ("23.==()", ARRAY_SIZE (expected3), expected3); + rust_lex_test_sequence ("23..25", ARRAY_SIZE (expected4), expected4); +} + +/* Tests of completion. */ + +static void +rust_lex_test_completion (void) +{ + const int expected[] = { IDENT, '.', COMPLETE, 0 }; + + parse_completion = 1; + + rust_lex_test_sequence ("something.wha", ARRAY_SIZE (expected), expected); + rust_lex_test_sequence ("something.", ARRAY_SIZE (expected), expected); + + parse_completion = 0; +} + +/* Test pushback. */ + +static void +rust_lex_test_push_back (void) +{ + int token; + + rust_lex_test_init (">>="); + + token = rustyylex (); + SELF_CHECK (token == COMPOUND_ASSIGN); + SELF_CHECK (rustyylval.opcode == BINOP_RSH); + + rust_push_back ('='); + + token = rustyylex (); + SELF_CHECK (token == '='); + + token = rustyylex (); + SELF_CHECK (token == 0); +} + +/* Unit test the lexer. */ + +static void +rust_lex_tests (void) +{ + int i; + + obstack_init (&work_obstack); + unit_testing = 1; + + rust_lex_test_one ("", 0); + rust_lex_test_one (" \t \n \r ", 0); + rust_lex_test_one ("thread 23", 0); + rust_lex_test_one ("task 23", 0); + rust_lex_test_one ("th 104", 0); + rust_lex_test_one ("ta 97", 0); + + rust_lex_int_test ("'z'", 'z', INTEGER); + rust_lex_int_test ("'\\xff'", 0xff, INTEGER); + rust_lex_int_test ("'\\u{1016f}'", 0x1016f, INTEGER); + rust_lex_int_test ("b'z'", 'z', INTEGER); + rust_lex_int_test ("b'\\xfe'", 0xfe, INTEGER); + rust_lex_int_test ("b'\\xFE'", 0xfe, INTEGER); + rust_lex_int_test ("b'\\xfE'", 0xfe, INTEGER); + + /* Test all escapes in both modes. */ + rust_lex_int_test ("'\\n'", '\n', INTEGER); + rust_lex_int_test ("'\\r'", '\r', INTEGER); + rust_lex_int_test ("'\\t'", '\t', INTEGER); + rust_lex_int_test ("'\\\\'", '\\', INTEGER); + rust_lex_int_test ("'\\0'", '\0', INTEGER); + rust_lex_int_test ("'\\''", '\'', INTEGER); + rust_lex_int_test ("'\\\"'", '"', INTEGER); + + rust_lex_int_test ("b'\\n'", '\n', INTEGER); + rust_lex_int_test ("b'\\r'", '\r', INTEGER); + rust_lex_int_test ("b'\\t'", '\t', INTEGER); + rust_lex_int_test ("b'\\\\'", '\\', INTEGER); + rust_lex_int_test ("b'\\0'", '\0', INTEGER); + rust_lex_int_test ("b'\\''", '\'', INTEGER); + rust_lex_int_test ("b'\\\"'", '"', INTEGER); + + rust_lex_exception_test ("'z", "Unterminated character literal"); + rust_lex_exception_test ("b'\\x0'", "Not enough hex digits seen"); + rust_lex_exception_test ("b'\\u{0}'", "Unicode escape in byte literal"); + rust_lex_exception_test ("'\\x0'", "Not enough hex digits seen"); + rust_lex_exception_test ("'\\u0'", "Missing '{' in Unicode escape"); + rust_lex_exception_test ("'\\u{0", "Missing '}' in Unicode escape"); + rust_lex_exception_test ("'\\u{0000007}", "Overlong hex escape"); + rust_lex_exception_test ("'\\u{}", "Not enough hex digits seen"); + rust_lex_exception_test ("'\\Q'", "Invalid escape \\Q in literal"); + rust_lex_exception_test ("b'\\Q'", "Invalid escape \\Q in literal"); + + rust_lex_int_test ("23", 23, DECIMAL_INTEGER); + rust_lex_int_test ("2_344__29", 234429, INTEGER); + rust_lex_int_test ("0x1f", 0x1f, INTEGER); + rust_lex_int_test ("23usize", 23, INTEGER); + rust_lex_int_test ("23i32", 23, INTEGER); + rust_lex_int_test ("0x1_f", 0x1f, INTEGER); + rust_lex_int_test ("0b1_101011__", 0x6b, INTEGER); + rust_lex_int_test ("0o001177i64", 639, INTEGER); + + rust_lex_test_trailing_dot (); + + rust_lex_test_one ("23.", FLOAT); + rust_lex_test_one ("23.99f32", FLOAT); + rust_lex_test_one ("23e7", FLOAT); + rust_lex_test_one ("23E-7", FLOAT); + rust_lex_test_one ("23e+7", FLOAT); + rust_lex_test_one ("23.99e+7f64", FLOAT); + rust_lex_test_one ("23.82f32", FLOAT); + + rust_lex_stringish_test ("hibob", "hibob", IDENT); + rust_lex_stringish_test ("hibob__93", "hibob__93", IDENT); + rust_lex_stringish_test ("thread", "thread", IDENT); + + rust_lex_stringish_test ("\"string\"", "string", STRING); + rust_lex_stringish_test ("\"str\\ting\"", "str\ting", STRING); + rust_lex_stringish_test ("\"str\\\"ing\"", "str\"ing", STRING); + rust_lex_stringish_test ("r\"str\\ing\"", "str\\ing", STRING); + rust_lex_stringish_test ("r#\"str\\ting\"#", "str\\ting", STRING); + rust_lex_stringish_test ("r###\"str\\\"ing\"###", "str\\\"ing", STRING); + + rust_lex_stringish_test ("b\"string\"", "string", BYTESTRING); + rust_lex_stringish_test ("b\"\x73tring\"", "string", BYTESTRING); + rust_lex_stringish_test ("b\"str\\\"ing\"", "str\"ing", BYTESTRING); + rust_lex_stringish_test ("br####\"\\x73tring\"####", "\\x73tring", + BYTESTRING); + + for (i = 0; i < ARRAY_SIZE (identifier_tokens); ++i) + rust_lex_test_one (identifier_tokens[i].name, identifier_tokens[i].value); + + for (i = 0; i < ARRAY_SIZE (operator_tokens); ++i) + rust_lex_test_one (operator_tokens[i].name, operator_tokens[i].value); + + rust_lex_test_completion (); + rust_lex_test_push_back (); + + obstack_free (&work_obstack, NULL); + unit_testing = 0; +} + +#endif /* GDB_SELF_TEST */ + +void +_initialize_rust_exp (void) +{ + int code = regcomp (&number_regex, number_regex_text, REG_EXTENDED); + /* If the regular expression was incorrect, it was a programming + error. */ + gdb_assert (code == 0); + +#if GDB_SELF_TEST + register_self_test (rust_lex_tests); +#endif +} |