This patch removes the `VALUE flags` member from the `rb_ast_t` structure making `rb_ast_t` no longer an IMEMO object. ## Background We are trying to make the Ruby parser generated from parse.y a universal parser that can be used by other implementations such as mruby. To achieve this, it is necessary to exclude VALUE and IMEMO from parse.y, AST, and NODE. ## Summary (file by file) - `rubyparser.h` - Remove the `VALUE flags` member from `rb_ast_t` - `ruby_parser.c` and `internal/ruby_parser.h` - Use TypedData_Make_Struct VALUE which wraps `rb_ast_t` `in ast_alloc()` so that GC can manage it - You can retrieve `rb_ast_t` from the VALUE by `rb_ruby_ast_data_get()` - Change the return type of `rb_parser_compile_XXXX()` functions from `rb_ast_t *` to `VALUE` - rb_ruby_ast_new() which internally `calls ast_alloc()` is to create VALUE vast outside ruby_parser.c - `iseq.c` and `vm_core.h` - Amend the first parameter of `rb_iseq_new_XXXX()` functions from `rb_ast_body_t *` to `VALUE` - This keeps the VALUE of AST on the machine stack to prevent being removed by GC - `ast.c` - Almost all change is replacement `rb_ast_t *ast` with `VALUE vast` (sorry for the big diff) - Fix `node_memsize()` - Now it includes `rb_ast_local_table_link`, `tokens` and script_lines - `compile.c`, `load.c`, `node.c`, `parse.y`, `proc.c`, `ruby.c`, `template/prelude.c.tmpl`, `vm.c` and `vm_eval.c` - Follow-up due to the above changes - `imemo.{c|h}` - If an object with `imemo_ast` appears, considers it a bug Co-authored-by: Nobuyoshi Nakada <nobu@ruby-lang.org>
104 lines
3.8 KiB
C
104 lines
3.8 KiB
C
#ifndef INTERNAL_RUBY_PARSE_H
|
|
#define INTERNAL_RUBY_PARSE_H
|
|
|
|
#include "internal.h"
|
|
#include "internal/bignum.h"
|
|
#include "internal/compilers.h"
|
|
#include "internal/complex.h"
|
|
#include "internal/parse.h"
|
|
#include "internal/rational.h"
|
|
#include "rubyparser.h"
|
|
#include "vm.h"
|
|
|
|
struct lex_pointer_string {
|
|
VALUE str;
|
|
long ptr;
|
|
};
|
|
|
|
RUBY_SYMBOL_EXPORT_BEGIN
|
|
#ifdef UNIVERSAL_PARSER
|
|
const rb_parser_config_t *rb_ruby_parser_config(void);
|
|
rb_parser_t *rb_parser_params_new(void);
|
|
#endif
|
|
VALUE rb_parser_set_context(VALUE, const struct rb_iseq_struct *, int);
|
|
VALUE rb_parser_new(void);
|
|
VALUE rb_parser_compile_string_path(VALUE vparser, VALUE fname, VALUE src, int line);
|
|
VALUE rb_str_new_parser_string(rb_parser_string_t *str);
|
|
VALUE rb_str_new_mutable_parser_string(rb_parser_string_t *str);
|
|
VALUE rb_parser_lex_get_str(struct lex_pointer_string *ptr_str);
|
|
|
|
VALUE rb_node_str_string_val(const NODE *);
|
|
VALUE rb_node_sym_string_val(const NODE *);
|
|
VALUE rb_node_dstr_string_val(const NODE *);
|
|
VALUE rb_node_regx_string_val(const NODE *);
|
|
VALUE rb_node_dregx_string_val(const NODE *);
|
|
VALUE rb_node_line_lineno_val(const NODE *);
|
|
VALUE rb_node_file_path_val(const NODE *);
|
|
VALUE rb_node_encoding_val(const NODE *);
|
|
|
|
VALUE rb_node_integer_literal_val(const NODE *);
|
|
VALUE rb_node_float_literal_val(const NODE *);
|
|
VALUE rb_node_rational_literal_val(const NODE *);
|
|
VALUE rb_node_imaginary_literal_val(const NODE *);
|
|
RUBY_SYMBOL_EXPORT_END
|
|
|
|
VALUE rb_parser_end_seen_p(VALUE);
|
|
VALUE rb_parser_encoding(VALUE);
|
|
VALUE rb_parser_set_yydebug(VALUE, VALUE);
|
|
VALUE rb_parser_build_script_lines_from(rb_parser_ary_t *script_lines);
|
|
void rb_parser_aset_script_lines_for(VALUE path, rb_parser_ary_t *script_lines);
|
|
void rb_parser_set_options(VALUE, int, int, int, int);
|
|
VALUE rb_parser_load_file(VALUE parser, VALUE name);
|
|
void rb_parser_set_script_lines(VALUE vparser);
|
|
void rb_parser_error_tolerant(VALUE vparser);
|
|
void rb_parser_keep_tokens(VALUE vparser);
|
|
|
|
VALUE rb_parser_compile_string(VALUE, const char*, VALUE, int);
|
|
VALUE rb_parser_compile_file_path(VALUE vparser, VALUE fname, VALUE input, int line);
|
|
VALUE rb_parser_compile_generic(VALUE vparser, rb_parser_lex_gets_func *lex_gets, VALUE fname, VALUE input, int line);
|
|
VALUE rb_parser_compile_array(VALUE vparser, VALUE fname, VALUE array, int start);
|
|
|
|
enum lex_state_bits {
|
|
EXPR_BEG_bit, /* ignore newline, +/- is a sign. */
|
|
EXPR_END_bit, /* newline significant, +/- is an operator. */
|
|
EXPR_ENDARG_bit, /* ditto, and unbound braces. */
|
|
EXPR_ENDFN_bit, /* ditto, and unbound braces. */
|
|
EXPR_ARG_bit, /* newline significant, +/- is an operator. */
|
|
EXPR_CMDARG_bit, /* newline significant, +/- is an operator. */
|
|
EXPR_MID_bit, /* newline significant, +/- is an operator. */
|
|
EXPR_FNAME_bit, /* ignore newline, no reserved words. */
|
|
EXPR_DOT_bit, /* right after `.', `&.' or `::', no reserved words. */
|
|
EXPR_CLASS_bit, /* immediate after `class', no here document. */
|
|
EXPR_LABEL_bit, /* flag bit, label is allowed. */
|
|
EXPR_LABELED_bit, /* flag bit, just after a label. */
|
|
EXPR_FITEM_bit, /* symbol literal as FNAME. */
|
|
EXPR_MAX_STATE
|
|
};
|
|
/* examine combinations */
|
|
enum lex_state_e {
|
|
#define DEF_EXPR(n) EXPR_##n = (1 << EXPR_##n##_bit)
|
|
DEF_EXPR(BEG),
|
|
DEF_EXPR(END),
|
|
DEF_EXPR(ENDARG),
|
|
DEF_EXPR(ENDFN),
|
|
DEF_EXPR(ARG),
|
|
DEF_EXPR(CMDARG),
|
|
DEF_EXPR(MID),
|
|
DEF_EXPR(FNAME),
|
|
DEF_EXPR(DOT),
|
|
DEF_EXPR(CLASS),
|
|
DEF_EXPR(LABEL),
|
|
DEF_EXPR(LABELED),
|
|
DEF_EXPR(FITEM),
|
|
EXPR_VALUE = EXPR_BEG,
|
|
EXPR_BEG_ANY = (EXPR_BEG | EXPR_MID | EXPR_CLASS),
|
|
EXPR_ARG_ANY = (EXPR_ARG | EXPR_CMDARG),
|
|
EXPR_END_ANY = (EXPR_END | EXPR_ENDARG | EXPR_ENDFN),
|
|
EXPR_NONE = 0
|
|
};
|
|
|
|
VALUE rb_ruby_ast_new(const NODE *const root, rb_parser_ary_t *script_lines);
|
|
rb_ast_t *rb_ruby_ast_data_get(VALUE vast);
|
|
|
|
#endif /* INTERNAL_RUBY_PARSE_H */
|