dc/d1f/yjit_8c_source.html

// This part of YJIT helps interfacing with the rest of CRuby and with the OS.

// Sometimes our FFI binding generation tool gives undesirable outputs when it

// sees C features that Rust doesn't support well. We mitigate that by binding

// functions which have simple parameter types. The boilerplate C functions for

// that purpose are in this file.

// Similarly, we wrap OS facilities we need in simple functions to help with

// FFI and to avoid the need to use external crates.io Rust libraries.


#include "internal.h"

#include "internal/sanitizers.h"

#include "internal/string.h"

#include "internal/hash.h"

#include "internal/variable.h"

#include "internal/compile.h"

#include "internal/class.h"

#include "internal/fixnum.h"

#include "internal/numeric.h"

#include "internal/gc.h"

#include "vm_core.h"

#include "vm_callinfo.h"

#include "builtin.h"

#include "insns.inc"

#include "insns_info.inc"

#include "vm_sync.h"

#include "yjit.h"

#include "vm_insnhelper.h"

#include "probes.h"

#include "probes_helper.h"

#include "iseq.h"

#include "ruby/debug.h"

#include "internal/cont.h"


// For mmapp(), sysconf()

#ifndef _WIN32

#include <unistd.h>

#include <sys/mman.h>

#endif


#include <errno.h>


// Field offsets for the RObject struct

enum robject_offsets {

    ROBJECT_OFFSET_AS_HEAP_IVPTR = offsetof(struct RObject, as.heap.ivptr),

    ROBJECT_OFFSET_AS_ARY = offsetof(struct RObject, as.ary),

};


// Field offsets for the RString struct

enum rstring_offsets {

    RUBY_OFFSET_RSTRING_LEN = offsetof(struct RString, len)

};


// We need size_t to have a known size to simplify code generation and FFI.

// TODO(alan): check this in configure.ac to fail fast on 32 bit platforms.

STATIC_ASSERT(64b_size_t, SIZE_MAX == UINT64_MAX);

// I don't know any C implementation that has uint64_t and puts padding bits

// into size_t but the standard seems to allow it.

STATIC_ASSERT(size_t_no_padding_bits, sizeof(size_t) == sizeof(uint64_t));


// This build config impacts the pointer tagging scheme and we only want to

// support one scheme for simplicity.

STATIC_ASSERT(pointer_tagging_scheme, USE_FLONUM);


// NOTE: We can trust that uint8_t has no "padding bits" since the C spec

// guarantees it. Wording about padding bits is more explicit in C11 compared

// to C99. See C11 7.20.1.1p2. All this is to say we have _some_ standards backing to

// use a Rust `*mut u8` to represent a C `uint8_t *`.

//

// If we don't want to trust that we can interpreter the C standard correctly, we

// could outsource that work to the Rust standard library by sticking to fundamental

// types in C such as int, long, etc. and use `std::os::raw::c_long` and friends on

// the Rust side.

//

// What's up with the long prefix? Even though we build with `-fvisibility=hidden`

// we are sometimes a static library where the option doesn't prevent name collision.

// The "_yjit_" part is for trying to be informative. We might want different

// suffixes for symbols meant for Rust and symbols meant for broader CRuby.


bool

rb_yjit_mark_writable(void *mem_block, uint32_t mem_size)

{

    return mprotect(mem_block, mem_size, PROT_READ | PROT_WRITE) == 0;

}


void

rb_yjit_mark_executable(void *mem_block, uint32_t mem_size)

{

    // Do not call mprotect when mem_size is zero. Some platforms may return

    // an error for it. https://github.com/Shopify/ruby/issues/450

    if (mem_size == 0) {

        return;

    }

    if (mprotect(mem_block, mem_size, PROT_READ | PROT_EXEC)) {

        rb_bug("Couldn't make JIT page (%p, %lu bytes) executable, errno: %s",

            mem_block, (unsigned long)mem_size, strerror(errno));

    }

}


// Free the specified memory block.

bool

rb_yjit_mark_unused(void *mem_block, uint32_t mem_size)

{

    // On Linux, you need to use madvise MADV_DONTNEED to free memory.

    // We might not need to call this on macOS, but it's not really documented.

    // We generally prefer to do the same thing on both to ease testing too.

    madvise(mem_block, mem_size, MADV_DONTNEED);


    // On macOS, mprotect PROT_NONE seems to reduce RSS.

    // We also call this on Linux to avoid executing unused pages.

    return mprotect(mem_block, mem_size, PROT_NONE) == 0;

}


long

rb_yjit_array_len(VALUE a)

{

    return rb_array_len(a);

}


// `start` is inclusive and `end` is exclusive.

void

rb_yjit_icache_invalidate(void *start, void *end)

{

    // Clear/invalidate the instruction cache. Compiles to nothing on x86_64

    // but required on ARM before running freshly written code.

    // On Darwin it's the same as calling sys_icache_invalidate().

#ifdef __GNUC__

    __builtin___clear_cache(start, end);

#elif defined(__aarch64__)

#error No instruction cache clear available with this compiler on Aarch64!

#endif

}


# define PTR2NUM(x)   (rb_int2inum((intptr_t)(void *)(x)))


// For a given raw_sample (frame), set the hash with the caller's

// name, file, and line number. Return the  hash with collected frame_info.

static void

rb_yjit_add_frame(VALUE hash, VALUE frame)

{

    VALUE frame_id = PTR2NUM(frame);


    if (RTEST(rb_hash_aref(hash, frame_id))) {

        return;

    }

    else {

        VALUE frame_info = rb_hash_new();

        // Full label for the frame

        VALUE name = rb_profile_frame_full_label(frame);

        // Absolute path of the frame from rb_iseq_realpath

        VALUE file = rb_profile_frame_absolute_path(frame);

        // Line number of the frame

        VALUE line = rb_profile_frame_first_lineno(frame);


        // If absolute path isn't available use the rb_iseq_path

        if (NIL_P(file)) {

            file = rb_profile_frame_path(frame);

        }


        rb_hash_aset(frame_info, ID2SYM(rb_intern("name")), name);

        rb_hash_aset(frame_info, ID2SYM(rb_intern("file")), file);

        rb_hash_aset(frame_info, ID2SYM(rb_intern("samples")), INT2NUM(0));

        rb_hash_aset(frame_info, ID2SYM(rb_intern("total_samples")), INT2NUM(0));

        rb_hash_aset(frame_info, ID2SYM(rb_intern("edges")), rb_hash_new());

        rb_hash_aset(frame_info, ID2SYM(rb_intern("lines")), rb_hash_new());


        if (line != INT2FIX(0)) {

            rb_hash_aset(frame_info, ID2SYM(rb_intern("line")), line);

        }


       rb_hash_aset(hash, frame_id, frame_info);

    }

}


// Parses the YjitExitLocations raw_samples and line_samples collected by

// rb_yjit_record_exit_stack and turns them into 3 hashes (raw, lines, and frames) to

// be used by RubyVM::YJIT.exit_locations. yjit_raw_samples represents the raw frames information

// (without name, file, and line), and yjit_line_samples represents the line information

// of the iseq caller.

VALUE

rb_yjit_exit_locations_dict(VALUE *yjit_raw_samples, int *yjit_line_samples, int samples_len)

{

    VALUE result = rb_hash_new();

    VALUE raw_samples = rb_ary_new_capa(samples_len);

    VALUE line_samples = rb_ary_new_capa(samples_len);

    VALUE frames = rb_hash_new();

    int idx = 0;


    // While the index is less than samples_len, parse yjit_raw_samples and

    // yjit_line_samples, then add casted values to raw_samples and line_samples array.

    while (idx < samples_len) {

        int num = (int)yjit_raw_samples[idx];

        int line_num = (int)yjit_line_samples[idx];

        idx++;


        // + 1 as we append an additional sample for the insn

        rb_ary_push(raw_samples, SIZET2NUM(num + 1));

        rb_ary_push(line_samples, INT2NUM(line_num + 1));


        // Loop through the length of samples_len and add data to the

        // frames hash. Also push the current value onto the raw_samples

        // and line_samples array respectively.

        for (int o = 0; o < num; o++) {

            rb_yjit_add_frame(frames, yjit_raw_samples[idx]);

            rb_ary_push(raw_samples, SIZET2NUM(yjit_raw_samples[idx]));

            rb_ary_push(line_samples, INT2NUM(yjit_line_samples[idx]));

            idx++;

        }


        rb_ary_push(raw_samples, SIZET2NUM(yjit_raw_samples[idx]));

        rb_ary_push(line_samples, INT2NUM(yjit_line_samples[idx]));

        idx++;


        rb_ary_push(raw_samples, SIZET2NUM(yjit_raw_samples[idx]));

        rb_ary_push(line_samples, INT2NUM(yjit_line_samples[idx]));

        idx++;

    }


    // Set add the raw_samples, line_samples, and frames to the results

    // hash.

    rb_hash_aset(result, ID2SYM(rb_intern("raw")), raw_samples);

    rb_hash_aset(result, ID2SYM(rb_intern("lines")), line_samples);

    rb_hash_aset(result, ID2SYM(rb_intern("frames")), frames);


    return result;

}


uint32_t

rb_yjit_get_page_size(void)

{

#if defined(_SC_PAGESIZE)

    long page_size = sysconf(_SC_PAGESIZE);

    if (page_size <= 0) rb_bug("yjit: failed to get page size");


    // 1 GiB limit. x86 CPUs with PDPE1GB can do this and anything larger is unexpected.

    // Though our design sort of assume we have fine grained control over memory protection

    // which require small page sizes.

    if (page_size > 0x40000000l) rb_bug("yjit page size too large");


    return (uint32_t)page_size;

#else

#error "YJIT supports POSIX only for now"

#endif

}


#if defined(MAP_FIXED_NOREPLACE) && defined(_SC_PAGESIZE)

// Align the current write position to a multiple of bytes

static uint8_t *

align_ptr(uint8_t *ptr, uint32_t multiple)

{

    // Compute the pointer modulo the given alignment boundary

    uint32_t rem = ((uint32_t)(uintptr_t)ptr) % multiple;


    // If the pointer is already aligned, stop

    if (rem == 0)

        return ptr;


    // Pad the pointer by the necessary amount to align it

    uint32_t pad = multiple - rem;


    return ptr + pad;

}

#endif


// Address space reservation. Memory pages are mapped on an as needed basis.

// See the Rust mm module for details.

uint8_t *

rb_yjit_reserve_addr_space(uint32_t mem_size)

{

#ifndef _WIN32

    uint8_t *mem_block;


    // On Linux

    #if defined(MAP_FIXED_NOREPLACE) && defined(_SC_PAGESIZE)

        uint32_t const page_size = (uint32_t)sysconf(_SC_PAGESIZE);

        uint8_t *const cfunc_sample_addr = (void *)(uintptr_t)&rb_yjit_reserve_addr_space;

        uint8_t *const probe_region_end = cfunc_sample_addr + INT32_MAX;

        // Align the requested address to page size

        uint8_t *req_addr = align_ptr(cfunc_sample_addr, page_size);


        // Probe for addresses close to this function using MAP_FIXED_NOREPLACE

        // to improve odds of being in range for 32-bit relative call instructions.

        do {

            mem_block = mmap(

                req_addr,

                mem_size,

                PROT_NONE,

                MAP_PRIVATE | MAP_ANONYMOUS | MAP_FIXED_NOREPLACE,

                -1,

                0

            );


            // If we succeeded, stop

            if (mem_block != MAP_FAILED) {

                ruby_annotate_mmap(mem_block, mem_size, "Ruby:rb_yjit_reserve_addr_space");

                break;

            }


            // -4MiB. Downwards to probe away from the heap. (On x86/A64 Linux

            // main_code_addr < heap_addr, and in case we are in a shared

            // library mapped higher than the heap, downwards is still better

            // since it's towards the end of the heap rather than the stack.)

            req_addr -= 4 * 1024 * 1024;

        } while (req_addr < probe_region_end);


    // On MacOS and other platforms

    #else

        // Try to map a chunk of memory as executable

        mem_block = mmap(

            (void *)rb_yjit_reserve_addr_space,

            mem_size,

            PROT_NONE,

            MAP_PRIVATE | MAP_ANONYMOUS,

            -1,

            0

        );

    #endif


    // Fallback

    if (mem_block == MAP_FAILED) {

        // Try again without the address hint (e.g., valgrind)

        mem_block = mmap(

            NULL,

            mem_size,

            PROT_NONE,

            MAP_PRIVATE | MAP_ANONYMOUS,

            -1,

            0

        );


        if (mem_block != MAP_FAILED) {

            ruby_annotate_mmap(mem_block, mem_size, "Ruby:rb_yjit_reserve_addr_space:fallback");

        }

    }


    // Check that the memory mapping was successful

    if (mem_block == MAP_FAILED) {

        perror("ruby: yjit: mmap:");

        if(errno == ENOMEM) {

            // No crash report if it's only insufficient memory

            exit(EXIT_FAILURE);

        }

        rb_bug("mmap failed");

    }


    return mem_block;

#else

    // Windows not supported for now

    return NULL;

#endif

}


// Is anyone listening for :c_call and :c_return event currently?

bool

rb_c_method_tracing_currently_enabled(const rb_execution_context_t *ec)

{

    rb_event_flag_t tracing_events;

    if (rb_multi_ractor_p()) {

        tracing_events = ruby_vm_event_enabled_global_flags;

    }

    else {

        // At the time of writing, events are never removed from

        // ruby_vm_event_enabled_global_flags so always checking using it would

        // mean we don't compile even after tracing is disabled.

        tracing_events = rb_ec_ractor_hooks(ec)->events;

    }


    return tracing_events & (RUBY_EVENT_C_CALL | RUBY_EVENT_C_RETURN);

}


// The code we generate in gen_send_cfunc() doesn't fire the c_return TracePoint event

// like the interpreter. When tracing for c_return is enabled, we patch the code after

// the C method return to call into this to fire the event.

void

rb_full_cfunc_return(rb_execution_context_t *ec, VALUE return_value)

{

    rb_control_frame_t *cfp = ec->cfp;

    RUBY_ASSERT_ALWAYS(cfp == GET_EC()->cfp);

    const rb_callable_method_entry_t *me = rb_vm_frame_method_entry(cfp);


    RUBY_ASSERT_ALWAYS(RUBYVM_CFUNC_FRAME_P(cfp));

    RUBY_ASSERT_ALWAYS(me->def->type == VM_METHOD_TYPE_CFUNC);


    // CHECK_CFP_CONSISTENCY("full_cfunc_return"); TODO revive this


    // Pop the C func's frame and fire the c_return TracePoint event

    // Note that this is the same order as vm_call_cfunc_with_frame().

    rb_vm_pop_frame(ec);

    EXEC_EVENT_HOOK(ec, RUBY_EVENT_C_RETURN, cfp->self, me->def->original_id, me->called_id, me->owner, return_value);

    // Note, this deviates from the interpreter in that users need to enable

    // a c_return TracePoint for this DTrace hook to work. A reasonable change

    // since the Ruby return event works this way as well.

    RUBY_DTRACE_CMETHOD_RETURN_HOOK(ec, me->owner, me->def->original_id);


    // Push return value into the caller's stack. We know that it's a frame that

    // uses cfp->sp because we are patching a call done with gen_send_cfunc().

    ec->cfp->sp[0] = return_value;

    ec->cfp->sp++;

}


unsigned int

rb_iseq_encoded_size(const rb_iseq_t *iseq)

{

    return iseq->body->iseq_size;

}


// TODO(alan): consider using an opaque pointer for the payload rather than a void pointer

void *

rb_iseq_get_yjit_payload(const rb_iseq_t *iseq)

{

    RUBY_ASSERT_ALWAYS(IMEMO_TYPE_P(iseq, imemo_iseq));

    if (iseq->body) {

        return iseq->body->yjit_payload;

    }

    else {

        // Body is NULL when constructing the iseq.

        return NULL;

    }

}


void

rb_iseq_set_yjit_payload(const rb_iseq_t *iseq, void *payload)

{

    RUBY_ASSERT_ALWAYS(IMEMO_TYPE_P(iseq, imemo_iseq));

    RUBY_ASSERT_ALWAYS(iseq->body);

    RUBY_ASSERT_ALWAYS(NULL == iseq->body->yjit_payload);

    iseq->body->yjit_payload = payload;

}


void

rb_iseq_reset_jit_func(const rb_iseq_t *iseq)

{

    RUBY_ASSERT_ALWAYS(IMEMO_TYPE_P(iseq, imemo_iseq));

    iseq->body->jit_entry = NULL;

    iseq->body->jit_exception = NULL;

    // Enable re-compiling this ISEQ. Event when it's invalidated for TracePoint,

    // we'd like to re-compile ISEQs that haven't been converted to trace_* insns.

    iseq->body->jit_entry_calls = 0;

    iseq->body->jit_exception_calls = 0;

}


// Get the PC for a given index in an iseq

VALUE *

rb_iseq_pc_at_idx(const rb_iseq_t *iseq, uint32_t insn_idx)

{

    RUBY_ASSERT_ALWAYS(IMEMO_TYPE_P(iseq, imemo_iseq));

    RUBY_ASSERT_ALWAYS(insn_idx < iseq->body->iseq_size);

    VALUE *encoded = iseq->body->iseq_encoded;

    VALUE *pc = &encoded[insn_idx];

    return pc;

}


// Get the opcode given a program counter. Can return trace opcode variants.

int

rb_iseq_opcode_at_pc(const rb_iseq_t *iseq, const VALUE *pc)

{

    // YJIT should only use iseqs after AST to bytecode compilation

    RUBY_ASSERT_ALWAYS(FL_TEST_RAW((VALUE)iseq, ISEQ_TRANSLATED));


    const VALUE at_pc = *pc;

    return rb_vm_insn_addr2opcode((const void *)at_pc);

}


unsigned long

rb_RSTRING_LEN(VALUE str)

{

    return RSTRING_LEN(str);

}


char *

rb_RSTRING_PTR(VALUE str)

{

    return RSTRING_PTR(str);

}


rb_proc_t *

rb_yjit_get_proc_ptr(VALUE procv)

{

    rb_proc_t *proc;

    GetProcPtr(procv, proc);

    return proc;

}


// This is defined only as a named struct inside rb_iseq_constant_body.

// By giving it a separate typedef, we make it nameable by rust-bindgen.

// Bindgen's temp/anon name isn't guaranteed stable.

typedef struct rb_iseq_param_keyword rb_seq_param_keyword_struct;


const char *

rb_insn_name(VALUE insn)

{

    return insn_name(insn);

}


unsigned int

rb_vm_ci_argc(const struct rb_callinfo *ci)

{

    return vm_ci_argc(ci);

}


ID

rb_vm_ci_mid(const struct rb_callinfo *ci)

{

    return vm_ci_mid(ci);

}


unsigned int

rb_vm_ci_flag(const struct rb_callinfo *ci)

{

    return vm_ci_flag(ci);

}


const struct rb_callinfo_kwarg *

rb_vm_ci_kwarg(const struct rb_callinfo *ci)

{

    return vm_ci_kwarg(ci);

}


int

rb_get_cikw_keyword_len(const struct rb_callinfo_kwarg *cikw)

{

    return cikw->keyword_len;

}


VALUE

rb_get_cikw_keywords_idx(const struct rb_callinfo_kwarg *cikw, int idx)

{

    return cikw->keywords[idx];

}


rb_method_visibility_t

rb_METHOD_ENTRY_VISI(const rb_callable_method_entry_t *me)

{

    return METHOD_ENTRY_VISI(me);

}


rb_method_type_t

rb_get_cme_def_type(const rb_callable_method_entry_t *cme)

{

    if (UNDEFINED_METHOD_ENTRY_P(cme)) {

        return VM_METHOD_TYPE_UNDEF;

    }

    else {

        return cme->def->type;

    }

}


ID

rb_get_cme_def_body_attr_id(const rb_callable_method_entry_t *cme)

{

    return cme->def->body.attr.id;

}


ID rb_get_symbol_id(VALUE namep);


enum method_optimized_type

rb_get_cme_def_body_optimized_type(const rb_callable_method_entry_t *cme)

{

    return cme->def->body.optimized.type;

}


unsigned int

rb_get_cme_def_body_optimized_index(const rb_callable_method_entry_t *cme)

{

    return cme->def->body.optimized.index;

}


rb_method_cfunc_t *

rb_get_cme_def_body_cfunc(const rb_callable_method_entry_t *cme)

{

    return UNALIGNED_MEMBER_PTR(cme->def, body.cfunc);

}


uintptr_t

rb_get_def_method_serial(const rb_method_definition_t *def)

{

    return def->method_serial;

}


ID

rb_get_def_original_id(const rb_method_definition_t *def)

{

    return def->original_id;

}


int

rb_get_mct_argc(const rb_method_cfunc_t *mct)

{

    return mct->argc;

}


void *

rb_get_mct_func(const rb_method_cfunc_t *mct)

{

    return (void*)(uintptr_t)mct->func; // this field is defined as type VALUE (*func)(ANYARGS)

}


const rb_iseq_t *

rb_get_def_iseq_ptr(rb_method_definition_t *def)

{

    return def_iseq_ptr(def);

}


VALUE

rb_get_def_bmethod_proc(rb_method_definition_t *def)

{

    RUBY_ASSERT(def->type == VM_METHOD_TYPE_BMETHOD);

    return def->body.bmethod.proc;

}


const rb_iseq_t *

rb_get_iseq_body_local_iseq(const rb_iseq_t *iseq)

{

    return iseq->body->local_iseq;

}


const rb_iseq_t *

rb_get_iseq_body_parent_iseq(const rb_iseq_t *iseq)

{

    return iseq->body->parent_iseq;

}


unsigned int

rb_get_iseq_body_local_table_size(const rb_iseq_t *iseq)

{

    return iseq->body->local_table_size;

}


VALUE *

rb_get_iseq_body_iseq_encoded(const rb_iseq_t *iseq)

{

    return iseq->body->iseq_encoded;

}


unsigned

rb_get_iseq_body_stack_max(const rb_iseq_t *iseq)

{

    return iseq->body->stack_max;

}


enum rb_iseq_type

rb_get_iseq_body_type(const rb_iseq_t *iseq)

{

    return iseq->body->type;

}


bool

rb_get_iseq_flags_has_lead(const rb_iseq_t *iseq)

{

    return iseq->body->param.flags.has_lead;

}


bool

rb_get_iseq_flags_has_opt(const rb_iseq_t *iseq)

{

    return iseq->body->param.flags.has_opt;

}


bool

rb_get_iseq_flags_has_kw(const rb_iseq_t *iseq)

{

    return iseq->body->param.flags.has_kw;

}


bool

rb_get_iseq_flags_has_post(const rb_iseq_t *iseq)

{

    return iseq->body->param.flags.has_post;

}


bool

rb_get_iseq_flags_has_kwrest(const rb_iseq_t *iseq)

{

    return iseq->body->param.flags.has_kwrest;

}


bool

rb_get_iseq_flags_anon_kwrest(const rb_iseq_t *iseq)

{

    return iseq->body->param.flags.anon_kwrest;

}


bool

rb_get_iseq_flags_has_rest(const rb_iseq_t *iseq)

{

    return iseq->body->param.flags.has_rest;

}


bool

rb_get_iseq_flags_ruby2_keywords(const rb_iseq_t *iseq)

{

    return iseq->body->param.flags.ruby2_keywords;

}


bool

rb_get_iseq_flags_has_block(const rb_iseq_t *iseq)

{

    return iseq->body->param.flags.has_block;

}


bool

rb_get_iseq_flags_ambiguous_param0(const rb_iseq_t *iseq)

{

    return iseq->body->param.flags.ambiguous_param0;

}


bool

rb_get_iseq_flags_accepts_no_kwarg(const rb_iseq_t *iseq)

{

    return iseq->body->param.flags.accepts_no_kwarg;

}


bool

rb_get_iseq_flags_forwardable(const rb_iseq_t *iseq)

{

    return iseq->body->param.flags.forwardable;

}


const rb_seq_param_keyword_struct *

rb_get_iseq_body_param_keyword(const rb_iseq_t *iseq)

{

    return iseq->body->param.keyword;

}


unsigned

rb_get_iseq_body_param_size(const rb_iseq_t *iseq)

{

    return iseq->body->param.size;

}


int

rb_get_iseq_body_param_lead_num(const rb_iseq_t *iseq)

{

    return iseq->body->param.lead_num;

}


int

rb_get_iseq_body_param_opt_num(const rb_iseq_t *iseq)

{

    return iseq->body->param.opt_num;

}


const VALUE *

rb_get_iseq_body_param_opt_table(const rb_iseq_t *iseq)

{

    return iseq->body->param.opt_table;

}


VALUE

rb_optimized_call(VALUE *recv, rb_execution_context_t *ec, int argc, VALUE *argv, int kw_splat, VALUE block_handler)

{

    rb_proc_t *proc;

    GetProcPtr(recv, proc);

    return rb_vm_invoke_proc(ec, proc, argc, argv, kw_splat, block_handler);

}


unsigned int

rb_yjit_iseq_builtin_attrs(const rb_iseq_t *iseq)

{

    return iseq->body->builtin_attrs;

}


// If true, the iseq has only opt_invokebuiltin_delegate(_leave) and leave insns.

static bool

invokebuiltin_delegate_leave_p(const rb_iseq_t *iseq)

{

    int insn1 = rb_vm_insn_addr2opcode((void *)iseq->body->iseq_encoded[0]);

    if ((int)iseq->body->iseq_size != insn_len(insn1) + insn_len(BIN(leave))) {

        return false;

    }

    int insn2 = rb_vm_insn_addr2opcode((void *)iseq->body->iseq_encoded[insn_len(insn1)]);

    return (insn1 == BIN(opt_invokebuiltin_delegate) || insn1 == BIN(opt_invokebuiltin_delegate_leave)) &&

            insn2 == BIN(leave);

}


// Return an rb_builtin_function if the iseq contains only that builtin function.

const struct rb_builtin_function *

rb_yjit_builtin_function(const rb_iseq_t *iseq)

{

    if (invokebuiltin_delegate_leave_p(iseq)) {

        return (const struct rb_builtin_function *)iseq->body->iseq_encoded[1];

    }

    else {

        return NULL;

    }

}


VALUE

rb_yjit_str_simple_append(VALUE str1, VALUE str2)

{

    return rb_str_cat(str1, RSTRING_PTR(str2), RSTRING_LEN(str2));

}


struct rb_control_frame_struct *

rb_get_ec_cfp(const rb_execution_context_t *ec)

{

    return ec->cfp;

}


const rb_iseq_t *

rb_get_cfp_iseq(struct rb_control_frame_struct *cfp)

{

    return cfp->iseq;

}


VALUE *

rb_get_cfp_pc(struct rb_control_frame_struct *cfp)

{

    return (VALUE*)cfp->pc;

}


VALUE *

rb_get_cfp_sp(struct rb_control_frame_struct *cfp)

{

    return cfp->sp;

}


void

rb_set_cfp_pc(struct rb_control_frame_struct *cfp, const VALUE *pc)

{

    cfp->pc = pc;

}


void

rb_set_cfp_sp(struct rb_control_frame_struct *cfp, VALUE *sp)

{

    cfp->sp = sp;

}


VALUE

rb_get_cfp_self(struct rb_control_frame_struct *cfp)

{

    return cfp->self;

}


VALUE *

rb_get_cfp_ep(struct rb_control_frame_struct *cfp)

{

    return (VALUE*)cfp->ep;

}


const VALUE *

rb_get_cfp_ep_level(struct rb_control_frame_struct *cfp, uint32_t lv)

{

    uint32_t i;

    const VALUE *ep = (VALUE*)cfp->ep;

    for (i = 0; i < lv; i++) {

        ep = VM_ENV_PREV_EP(ep);

    }

    return ep;

}


extern VALUE *rb_vm_base_ptr(struct rb_control_frame_struct *cfp);


VALUE

rb_yarv_class_of(VALUE obj)

{

    return rb_class_of(obj);

}


// YJIT needs this function to never allocate and never raise

VALUE

rb_yarv_str_eql_internal(VALUE str1, VALUE str2)

{

    // We wrap this since it's static inline

    return rb_str_eql_internal(str1, str2);

}


VALUE

rb_str_neq_internal(VALUE str1, VALUE str2)

{

    return rb_str_eql_internal(str1, str2) == Qtrue ? Qfalse : Qtrue;

}


// YJIT needs this function to never allocate and never raise

VALUE

rb_yarv_ary_entry_internal(VALUE ary, long offset)

{

    return rb_ary_entry_internal(ary, offset);

}


extern VALUE rb_ary_unshift_m(int argc, VALUE *argv, VALUE ary);


VALUE

rb_yjit_rb_ary_subseq_length(VALUE ary, long beg)

{

    long len = RARRAY_LEN(ary);

    return rb_ary_subseq(ary, beg, len);

}


VALUE

rb_yjit_fix_div_fix(VALUE recv, VALUE obj)

{

    return rb_fix_div_fix(recv, obj);

}


VALUE

rb_yjit_fix_mod_fix(VALUE recv, VALUE obj)

{

    return rb_fix_mod_fix(recv, obj);

}


// Return non-zero when `obj` is an array and its last item is a

// `ruby2_keywords` hash. We don't support this kind of splat.

size_t

rb_yjit_ruby2_keywords_splat_p(VALUE obj)

{

    if (!RB_TYPE_P(obj, T_ARRAY)) return 0;

    long len = RARRAY_LEN(obj);

    if (len == 0) return 0;

    VALUE last = RARRAY_AREF(obj, len - 1);

    if (!RB_TYPE_P(last, T_HASH)) return 0;

    return FL_TEST_RAW(last, RHASH_PASS_AS_KEYWORDS);

}


// Checks to establish preconditions for rb_yjit_splat_varg_cfunc()

VALUE

rb_yjit_splat_varg_checks(VALUE *sp, VALUE splat_array, rb_control_frame_t *cfp)

{

    // We inserted a T_ARRAY guard before this call

    long len = RARRAY_LEN(splat_array);


    // Large splat arrays need a separate allocation

    if (len < 0 || len > VM_ARGC_STACK_MAX) return Qfalse;


    // Would we overflow if we put the contents of the array onto the stack?

    if (sp + len > (VALUE *)(cfp - 2)) return Qfalse;


    // Reject keywords hash since that requires duping it sometimes

    if (len > 0) {

        VALUE last_hash = RARRAY_AREF(splat_array, len - 1);

        if (RB_TYPE_P(last_hash, T_HASH) &&

                FL_TEST_RAW(last_hash, RHASH_PASS_AS_KEYWORDS)) {

            return Qfalse;

        }

    }


    return Qtrue;

}


// Push array elements to the stack for a C method that has a variable number

// of parameters. Returns the number of arguments the splat array contributes.

int

rb_yjit_splat_varg_cfunc(VALUE *stack_splat_array)

{

    VALUE splat_array = *stack_splat_array;

    int len;


    // We already checked that length fits in `int`

    RUBY_ASSERT(RB_TYPE_P(splat_array, T_ARRAY));

    len = (int)RARRAY_LEN(splat_array);


    // Push the contents of the array onto the stack

    MEMCPY(stack_splat_array, RARRAY_CONST_PTR(splat_array), VALUE, len);


    return len;

}


// Print the Ruby source location of some ISEQ for debugging purposes

void

rb_yjit_dump_iseq_loc(const rb_iseq_t *iseq, uint32_t insn_idx)

{

    char *ptr;

    long len;

    VALUE path = rb_iseq_path(iseq);

    RSTRING_GETMEM(path, ptr, len);

    fprintf(stderr, "%s %.*s:%u\n", __func__, (int)len, ptr, rb_iseq_line_no(iseq, insn_idx));

}


// Get the number of digits required to print an integer

static int

num_digits(int integer)

{

    int num = 1;

    while (integer /= 10) {

        num++;

    }

    return num;

}


// Allocate a C string that formats an ISEQ label like iseq_inspect()

char *

rb_yjit_iseq_inspect(const rb_iseq_t *iseq)

{

    const char *label = RSTRING_PTR(iseq->body->location.label);

    const char *path = RSTRING_PTR(rb_iseq_path(iseq));

    int lineno = iseq->body->location.code_location.beg_pos.lineno;


    char *buf = ZALLOC_N(char, strlen(label) + strlen(path) + num_digits(lineno) + 3);

    sprintf(buf, "%s@%s:%d", label, path, lineno);

    return buf;

}


// The FL_TEST() macro

VALUE

rb_FL_TEST(VALUE obj, VALUE flags)

{

    return RB_FL_TEST(obj, flags);

}


// The FL_TEST_RAW() macro, normally an internal implementation detail

VALUE

rb_FL_TEST_RAW(VALUE obj, VALUE flags)

{

    return FL_TEST_RAW(obj, flags);

}


// The RB_TYPE_P macro

bool

rb_RB_TYPE_P(VALUE obj, enum ruby_value_type t)

{

    return RB_TYPE_P(obj, t);

}


long

rb_RSTRUCT_LEN(VALUE st)

{

    return RSTRUCT_LEN(st);

}


// There are RSTRUCT_SETs in ruby/internal/core/rstruct.h and internal/struct.h

// with different types (int vs long) for k. Here we use the one from ruby/internal/core/rstruct.h,

// which takes an int.

void

rb_RSTRUCT_SET(VALUE st, int k, VALUE v)

{

    RSTRUCT_SET(st, k, v);

}


const struct rb_callinfo *

rb_get_call_data_ci(const struct rb_call_data *cd)

{

    return cd->ci;

}


bool

rb_BASIC_OP_UNREDEFINED_P(enum ruby_basic_operators bop, uint32_t klass)

{

    return BASIC_OP_UNREDEFINED_P(bop, klass);

}


VALUE

rb_RCLASS_ORIGIN(VALUE c)

{

    return RCLASS_ORIGIN(c);

}


// Return the string encoding index

int

rb_ENCODING_GET(VALUE obj)

{

    return RB_ENCODING_GET(obj);

}


bool

rb_yjit_multi_ractor_p(void)

{

    return rb_multi_ractor_p();

}


// For debug builds

void

rb_assert_iseq_handle(VALUE handle)

{

    RUBY_ASSERT_ALWAYS(IMEMO_TYPE_P(handle, imemo_iseq));

}


int

rb_IMEMO_TYPE_P(VALUE imemo, enum imemo_type imemo_type)

{

    return IMEMO_TYPE_P(imemo, imemo_type);

}


bool

rb_yjit_constcache_shareable(const struct iseq_inline_constant_cache_entry *ice)

{

    return (ice->flags & IMEMO_CONST_CACHE_SHAREABLE) != 0;

}


void

rb_assert_cme_handle(VALUE handle)

{

    RUBY_ASSERT_ALWAYS(!rb_objspace_garbage_object_p(handle));

    RUBY_ASSERT_ALWAYS(IMEMO_TYPE_P(handle, imemo_ment));

}


// Used for passing a callback and other data over rb_objspace_each_objects


struct iseq_callback_data {

    rb_iseq_callback callback;

    void *data;

};


// Heap-walking callback for rb_yjit_for_each_iseq().

static int

for_each_iseq_i(void *vstart, void *vend, size_t stride, void *data)

{

    const struct iseq_callback_data *callback_data = (struct iseq_callback_data *)data;

    VALUE v = (VALUE)vstart;

    for (; v != (VALUE)vend; v += stride) {

        void *ptr = rb_asan_poisoned_object_p(v);

        rb_asan_unpoison_object(v, false);


        if (rb_obj_is_iseq(v)) {

            rb_iseq_t *iseq = (rb_iseq_t *)v;

            callback_data->callback(iseq, callback_data->data);

        }


        asan_poison_object_if(ptr, v);

    }

    return 0;

}


// Iterate through the whole GC heap and invoke a callback for each iseq.

// Used for global code invalidation.

void

rb_yjit_for_each_iseq(rb_iseq_callback callback, void *data)

{

    struct iseq_callback_data callback_data = { .callback = callback, .data = data };

    rb_objspace_each_objects(for_each_iseq_i, (void *)&callback_data);

}


// For running write barriers from Rust. Required when we add a new edge in the

// object graph from `old` to `young`.

void

rb_yjit_obj_written(VALUE old, VALUE young, const char *file, int line)

{

    rb_obj_written(old, Qundef, young, file, line);

}


// Acquire the VM lock and then signal all other Ruby threads (ractors) to

// contend for the VM lock, putting them to sleep. YJIT uses this to evict

// threads running inside generated code so among other things, it can

// safely change memory protection of regions housing generated code.

void

rb_yjit_vm_lock_then_barrier(unsigned int *recursive_lock_level, const char *file, int line)

{

    rb_vm_lock_enter(recursive_lock_level, file, line);

    rb_vm_barrier();

}


// Release the VM lock. The lock level must point to the same integer used to

// acquire the lock.

void

rb_yjit_vm_unlock(unsigned int *recursive_lock_level, const char *file, int line)

{

    rb_vm_lock_leave(recursive_lock_level, file, line);

}


void

rb_yjit_compile_iseq(const rb_iseq_t *iseq, rb_execution_context_t *ec, bool jit_exception)

{

    RB_VM_LOCK_ENTER();

    rb_vm_barrier();


    // Compile a block version starting at the current instruction

    uint8_t *rb_yjit_iseq_gen_entry_point(const rb_iseq_t *iseq, rb_execution_context_t *ec, bool jit_exception); // defined in Rust

    uintptr_t code_ptr = (uintptr_t)rb_yjit_iseq_gen_entry_point(iseq, ec, jit_exception);


    if (jit_exception) {

        iseq->body->jit_exception = (rb_jit_func_t)code_ptr;

    }

    else {

        iseq->body->jit_entry = (rb_jit_func_t)code_ptr;

    }


    RB_VM_LOCK_LEAVE();

}


// GC root for interacting with the GC


struct yjit_root_struct {

    bool unused; // empty structs are not legal in C99

};


// For dealing with refinements

void

rb_yjit_invalidate_all_method_lookup_assumptions(void)

{

    // It looks like Module#using actually doesn't need to invalidate all the

    // method caches, so we do nothing here for now.

}


// Number of object shapes, which might be useful for investigating YJIT exit reasons.

VALUE

rb_object_shape_count(void)

{

    // next_shape_id starts from 0, so it's the same as the count

    return ULONG2NUM((unsigned long)GET_SHAPE_TREE()->next_shape_id);

}


// Assert that we have the VM lock. Relevant mostly for multi ractor situations.

// The GC takes the lock before calling us, and this asserts that it indeed happens.

void

rb_yjit_assert_holding_vm_lock(void)

{

    ASSERT_vm_locking();

}


// The number of stack slots that vm_sendish() pops for send and invokesuper.

size_t

rb_yjit_sendish_sp_pops(const struct rb_callinfo *ci)

{

    return 1 - sp_inc_of_sendish(ci); // + 1 to ignore return value push

}


// The number of stack slots that vm_sendish() pops for invokeblock.

size_t

rb_yjit_invokeblock_sp_pops(const struct rb_callinfo *ci)

{

    return 1 - sp_inc_of_invokeblock(ci); // + 1 to ignore return value push

}


// Setup jit_return to avoid returning a non-Qundef value on a non-FINISH frame.

// See [jit_compile_exception] for details.

void

rb_yjit_set_exception_return(rb_control_frame_t *cfp, void *leave_exit, void *leave_exception)

{

    if (VM_FRAME_FINISHED_P(cfp)) {

        // If it's a FINISH frame, just normally exit with a non-Qundef value.

        cfp->jit_return = leave_exit;

    }

    else if (cfp->jit_return) {

        while (!VM_FRAME_FINISHED_P(cfp)) {

            if (cfp->jit_return == leave_exit) {

                // Unlike jit_exec(), leave_exit is not safe on a non-FINISH frame on

                // jit_exec_exception(). See [jit_exec] and [jit_exec_exception] for

                // details. Exit to the interpreter with Qundef to let it keep executing

                // other Ruby frames.

                cfp->jit_return = leave_exception;

                return;

            }

            cfp = RUBY_VM_PREVIOUS_CONTROL_FRAME(cfp);

        }

    }

    else {

        // If the caller was not JIT code, exit to the interpreter with Qundef

        // to keep executing Ruby frames with the interpreter.

        cfp->jit_return = leave_exception;

    }

}


// Primitives used by yjit.rb

VALUE rb_yjit_stats_enabled_p(rb_execution_context_t *ec, VALUE self);

VALUE rb_yjit_print_stats_p(rb_execution_context_t *ec, VALUE self);

VALUE rb_yjit_log_enabled_p(rb_execution_context_t *c, VALUE self);

VALUE rb_yjit_print_log_p(rb_execution_context_t *c, VALUE self);

VALUE rb_yjit_trace_exit_locations_enabled_p(rb_execution_context_t *ec, VALUE self);

VALUE rb_yjit_get_stats(rb_execution_context_t *ec, VALUE self, VALUE key);

VALUE rb_yjit_reset_stats_bang(rb_execution_context_t *ec, VALUE self);

VALUE rb_yjit_get_log(rb_execution_context_t *ec, VALUE self);

VALUE rb_yjit_disasm_iseq(rb_execution_context_t *ec, VALUE self, VALUE iseq);

VALUE rb_yjit_insns_compiled(rb_execution_context_t *ec, VALUE self, VALUE iseq);

VALUE rb_yjit_code_gc(rb_execution_context_t *ec, VALUE self);

VALUE rb_yjit_simulate_oom_bang(rb_execution_context_t *ec, VALUE self);

VALUE rb_yjit_get_exit_locations(rb_execution_context_t *ec, VALUE self);

VALUE rb_yjit_enable(rb_execution_context_t *ec, VALUE self, VALUE gen_stats, VALUE print_stats, VALUE gen_compilation_log, VALUE print_compilation_log, VALUE mem_size, VALUE call_threshold);

VALUE rb_yjit_c_builtin_p(rb_execution_context_t *ec, VALUE self);


// Allow YJIT_C_BUILTIN macro to force --yjit-c-builtin

#ifdef YJIT_C_BUILTIN

static VALUE yjit_c_builtin_p(rb_execution_context_t *ec, VALUE self) { return Qtrue; }

#else

#define yjit_c_builtin_p rb_yjit_c_builtin_p

#endif


// Preprocessed yjit.rb generated during build

#include "yjit.rbinc"

RUBY_ASSERT_ALWAYS
#define RUBY_ASSERT_ALWAYS(expr,...)
A variant of RUBY_ASSERT that does not interface with RUBY_DEBUG.
Definition assert.h:199

RUBY_ASSERT
#define RUBY_ASSERT(...)
Asserts that the given expression is truthy if and only if RUBY_DEBUG is truthy.
Definition assert.h:219

debug.h

rb_profile_frame_full_label
VALUE rb_profile_frame_full_label(VALUE frame)
Identical to rb_profile_frame_label(), except it returns a qualified result.
Definition vm_backtrace.c:1972

rb_profile_frame_absolute_path
VALUE rb_profile_frame_absolute_path(VALUE frame)
Identical to rb_profile_frame_path(), except it tries to expand the returning path.
Definition vm_backtrace.c:1852

rb_profile_frame_path
VALUE rb_profile_frame_path(VALUE frame)
Queries the path of the passed backtrace.
Definition vm_backtrace.c:1820

rb_profile_frame_first_lineno
VALUE rb_profile_frame_first_lineno(VALUE frame)
Queries the first line of the method of the passed frame pointer.
Definition vm_backtrace.c:1881

RUBY_EVENT_C_CALL
#define RUBY_EVENT_C_CALL
A method, written in C, is called.
Definition event.h:43

RUBY_EVENT_C_RETURN
#define RUBY_EVENT_C_RETURN
Return from a method, written in C.
Definition event.h:44

rb_event_flag_t
uint32_t rb_event_flag_t
Represents event(s).
Definition event.h:108

RB_FL_TEST
static VALUE RB_FL_TEST(VALUE obj, VALUE flags)
Tests if the given flag(s) are set or not.
Definition fl_type.h:495

Qundef
#define Qundef
Old name of RUBY_Qundef.
Definition special_consts.h:62

INT2FIX
#define INT2FIX
Old name of RB_INT2FIX.
Definition long.h:48

ID2SYM
#define ID2SYM
Old name of RB_ID2SYM.
Definition symbol.h:44

ULONG2NUM
#define ULONG2NUM
Old name of RB_ULONG2NUM.
Definition long.h:60

SIZET2NUM
#define SIZET2NUM
Old name of RB_SIZE2NUM.
Definition size_t.h:62

ZALLOC_N
#define ZALLOC_N
Old name of RB_ZALLOC_N.
Definition memory.h:401

T_HASH
#define T_HASH
Old name of RUBY_T_HASH.
Definition value_type.h:65

FL_TEST_RAW
#define FL_TEST_RAW
Old name of RB_FL_TEST_RAW.
Definition fl_type.h:132

Qtrue
#define Qtrue
Old name of RUBY_Qtrue.
Definition special_consts.h:61

INT2NUM
#define INT2NUM
Old name of RB_INT2NUM.
Definition int.h:43

Qfalse
#define Qfalse
Old name of RUBY_Qfalse.
Definition special_consts.h:59

T_ARRAY
#define T_ARRAY
Old name of RUBY_T_ARRAY.
Definition value_type.h:56

NIL_P
#define NIL_P
Old name of RB_NIL_P.
Definition special_consts.h:55

rb_class_of
static VALUE rb_class_of(VALUE obj)
Object to class mapping function.
Definition globals.h:172

RB_ENCODING_GET
static int RB_ENCODING_GET(VALUE obj)
Just another name of rb_enc_get_index.
Definition encoding.h:195

builtin.h
Defines RBIMPL_HAS_BUILTIN.

rb_str_cat
VALUE rb_str_cat(VALUE dst, const char *src, long srclen)
Destructively appends the passed contents to the string.
Definition string.c:3836

len
int len
Length of the buffer.
Definition io.h:8

MEMCPY
#define MEMCPY(p1, p2, type, n)
Handy macro to call memcpy.
Definition memory.h:372

RARRAY_LEN
#define RARRAY_LEN
Just another name of rb_array_len.
Definition rarray.h:51

rb_array_len
static long rb_array_len(VALUE a)
Queries the length of the array.
Definition rarray.h:255

RARRAY_AREF
#define RARRAY_AREF(a, i)
Definition rarray.h:403

RARRAY_CONST_PTR
#define RARRAY_CONST_PTR
Just another name of rb_array_const_ptr.
Definition rarray.h:52

RSTRING_GETMEM
#define RSTRING_GETMEM(str, ptrvar, lenvar)
Convenient macro to obtain the contents and length at once.
Definition rstring.h:488

errno
#define errno
Ractor-aware version of errno.
Definition ruby.h:388

RTEST
#define RTEST
This is an old name of RB_TEST.
Definition special_consts.h:51

USE_FLONUM
#define USE_FLONUM
Definition special_consts.h:45

RObject
Ruby's ordinal objects.
Definition robject.h:83

RObject::ivptr
VALUE * ivptr
Pointer to a C array that holds instance variables.
Definition robject.h:97

RObject::heap
struct RObject::@50::@51 heap
Object that use separated memory region for instance variables use this pattern.

RString
Ruby's String.
Definition rstring.h:196

iseq_callback_data
Definition yjit.c:1086

iseq_inline_constant_cache_entry
Definition vm_core.h:259

rb_builtin_function
Definition builtin.h:6

rb_call_data
Definition vm_callinfo.h:559

rb_callable_method_entry_struct
Definition method.h:63

rb_callinfo_kwarg
Definition vm_callinfo.h:48

rb_callinfo
Definition vm_callinfo.h:65

rb_control_frame_struct
Definition vm_core.h:893

rb_execution_context_struct
Definition vm_core.h:1015

rb_iseq_constant_body::param
struct rb_iseq_constant_body::@155 param
parameter information

rb_iseq_struct
Definition vm_core.h:563

rb_method_cfunc_struct
Definition method.h:141

rb_method_definition_struct
Definition method.h:180

rb_proc_t
Definition vm_core.h:1258

yjit_root_struct
Definition yjit.c:1168

ID
uintptr_t ID
Type that represents a Ruby identifier such as a variable name.
Definition value.h:52

VALUE
uintptr_t VALUE
Type that represents a Ruby object.
Definition value.h:40

RB_TYPE_P
static bool RB_TYPE_P(VALUE obj, enum ruby_value_type t)
Queries if the given object is of given type.
Definition value_type.h:376

ruby_value_type
ruby_value_type
C-level type of an object.
Definition value_type.h:113