mirror of
https://github.com/ruby/ruby.git
synced 2022-11-09 12:17:21 -05:00
b91b3bc771
Redo of34a2acdac7
and931138b006
which were reverted. GitHub PR #4340. This change implements a cache for class variables. Previously there was no cache for cvars. Cvar access is slow due to needing to travel all the way up th ancestor tree before returning the cvar value. The deeper the ancestor tree the slower cvar access will be. The benefits of the cache are more visible with a higher number of included modules due to the way Ruby looks up class variables. The benchmark here includes 26 modules and shows with the cache, this branch is 6.5x faster when accessing class variables. ``` compare-ruby: ruby 3.1.0dev (2021-03-15T06:22:34Z master9e5105c
) [x86_64-darwin19] built-ruby: ruby 3.1.0dev (2021-03-15T12:12:44Z add-cache-for-clas.. c6be009) [x86_64-darwin19] | |compare-ruby|built-ruby| |:--------|-----------:|---------:| |vm_cvar | 5.681M| 36.980M| | | -| 6.51x| ``` Benchmark.ips calling `ActiveRecord::Base.logger` from within a Rails application. ActiveRecord::Base.logger has 71 ancestors. The more ancestors a tree has, the more clear the speed increase. IE if Base had only one ancestor we'd see no improvement. This benchmark is run on a vanilla Rails application. Benchmark code: ```ruby require "benchmark/ips" require_relative "config/environment" Benchmark.ips do |x| x.report "logger" do ActiveRecord::Base.logger end end ``` Ruby 3.0 master / Rails 6.1: ``` Warming up -------------------------------------- logger 155.251k i/100ms Calculating ------------------------------------- ``` Ruby 3.0 with cvar cache / Rails 6.1: ``` Warming up -------------------------------------- logger 1.546M i/100ms Calculating ------------------------------------- logger 14.857M (± 4.8%) i/s - 74.198M in 5.006202s ``` Lastly we ran a benchmark to demonstate the difference between master and our cache when the number of modules increases. This benchmark measures 1 ancestor, 30 ancestors, and 100 ancestors. Ruby 3.0 master: ``` Warming up -------------------------------------- 1 module 1.231M i/100ms 30 modules 432.020k i/100ms 100 modules 145.399k i/100ms Calculating ------------------------------------- 1 module 12.210M (± 2.1%) i/s - 61.553M in 5.043400s 30 modules 4.354M (± 2.7%) i/s - 22.033M in 5.063839s 100 modules 1.434M (± 2.9%) i/s - 7.270M in 5.072531s Comparison: 1 module: 12209958.3 i/s 30 modules: 4354217.8 i/s - 2.80x (± 0.00) slower 100 modules: 1434447.3 i/s - 8.51x (± 0.00) slower ``` Ruby 3.0 with cvar cache: ``` Warming up -------------------------------------- 1 module 1.641M i/100ms 30 modules 1.655M i/100ms 100 modules 1.620M i/100ms Calculating ------------------------------------- 1 module 16.279M (± 3.8%) i/s - 82.038M in 5.046923s 30 modules 15.891M (± 3.9%) i/s - 79.459M in 5.007958s 100 modules 16.087M (± 3.6%) i/s - 81.005M in 5.041931s Comparison: 1 module: 16279458.0 i/s 100 modules: 16087484.6 i/s - same-ish: difference falls within error 30 modules: 15891406.2 i/s - same-ish: difference falls within error ``` Co-authored-by: Aaron Patterson <tenderlove@ruby-lang.org>
467 lines
16 KiB
C
467 lines
16 KiB
C
/**********************************************************************
|
|
|
|
debug_counter.h -
|
|
|
|
created at: Tue Feb 21 16:51:18 2017
|
|
|
|
Copyright (C) 2017 Koichi Sasada
|
|
|
|
**********************************************************************/
|
|
|
|
#ifndef USE_DEBUG_COUNTER
|
|
#define USE_DEBUG_COUNTER 0
|
|
#endif
|
|
|
|
#ifdef RB_DEBUG_COUNTER
|
|
|
|
// method cache (IMC: inline method cache)
|
|
RB_DEBUG_COUNTER(mc_inline_hit) // IMC hit
|
|
RB_DEBUG_COUNTER(mc_inline_miss_klass) // IMC miss by different class
|
|
RB_DEBUG_COUNTER(mc_inline_miss_invalidated) // IMC miss by invalidated ME
|
|
RB_DEBUG_COUNTER(mc_inline_miss_empty) // IMC miss because prev is empty slot
|
|
RB_DEBUG_COUNTER(mc_inline_miss_same_cc) // IMC miss, but same CC
|
|
RB_DEBUG_COUNTER(mc_inline_miss_same_cme) // IMC miss, but same CME
|
|
RB_DEBUG_COUNTER(mc_inline_miss_same_def) // IMC miss, but same definition
|
|
RB_DEBUG_COUNTER(mc_inline_miss_diff) // IMC miss, different methods
|
|
|
|
RB_DEBUG_COUNTER(cvar_write_inline_hit) // cvar cache hit on write
|
|
RB_DEBUG_COUNTER(cvar_read_inline_hit) // cvar cache hit on read
|
|
RB_DEBUG_COUNTER(cvar_inline_miss) // miss inline cache
|
|
RB_DEBUG_COUNTER(cvar_class_invalidate) // invalidate cvar cache when define a cvar that's defined on a subclass
|
|
RB_DEBUG_COUNTER(cvar_include_invalidate) // invalidate cvar cache on module include or prepend
|
|
|
|
RB_DEBUG_COUNTER(mc_cme_complement) // number of acquiring complement CME
|
|
RB_DEBUG_COUNTER(mc_cme_complement_hit) // number of cache hit for complemented CME
|
|
|
|
RB_DEBUG_COUNTER(mc_search) // count for method lookup in class tree
|
|
RB_DEBUG_COUNTER(mc_search_notfound) // method lookup, but not found
|
|
RB_DEBUG_COUNTER(mc_search_super) // total traversed classes
|
|
|
|
// callinfo
|
|
RB_DEBUG_COUNTER(ci_packed) // number of packed CI
|
|
RB_DEBUG_COUNTER(ci_kw) // non-packed CI w/ keywords
|
|
RB_DEBUG_COUNTER(ci_nokw) // non-packed CI w/o keywords
|
|
RB_DEBUG_COUNTER(ci_runtime) // creating temporary CI
|
|
|
|
// callcache
|
|
RB_DEBUG_COUNTER(cc_new) // number of CC
|
|
RB_DEBUG_COUNTER(cc_temp) // dummy CC (stack-allocated)
|
|
RB_DEBUG_COUNTER(cc_found_in_ccs) // count for CC lookup success in CCS
|
|
RB_DEBUG_COUNTER(cc_not_found_in_ccs) // count for CC lookup success in CCS
|
|
|
|
RB_DEBUG_COUNTER(cc_ent_invalidate) // count for invalidating cc (cc->klass = 0)
|
|
RB_DEBUG_COUNTER(cc_cme_invalidate) // count for invalidating CME
|
|
|
|
RB_DEBUG_COUNTER(cc_invalidate_leaf) // count for invalidating klass if klass has no-subclasses
|
|
RB_DEBUG_COUNTER(cc_invalidate_leaf_ccs) // corresponding CCS
|
|
RB_DEBUG_COUNTER(cc_invalidate_leaf_callable) // complimented cache (no-subclasses)
|
|
RB_DEBUG_COUNTER(cc_invalidate_tree) // count for invalidating klass if klass has subclasses
|
|
RB_DEBUG_COUNTER(cc_invalidate_tree_cme) // cme if cme is found in this class or superclasses
|
|
RB_DEBUG_COUNTER(cc_invalidate_tree_callable) // complimented cache (subclasses)
|
|
RB_DEBUG_COUNTER(cc_invalidate_negative) // count for invalidating negative cache
|
|
|
|
RB_DEBUG_COUNTER(ccs_free) // count for free'ing ccs
|
|
RB_DEBUG_COUNTER(ccs_maxlen) // maximum length of ccs
|
|
RB_DEBUG_COUNTER(ccs_found) // count for finding corresponding ccs on method lookup
|
|
RB_DEBUG_COUNTER(ccs_not_found) // count for not found corresponding ccs on method lookup
|
|
|
|
// vm_eval.c
|
|
RB_DEBUG_COUNTER(call0_public)
|
|
RB_DEBUG_COUNTER(call0_other)
|
|
RB_DEBUG_COUNTER(gccct_hit)
|
|
RB_DEBUG_COUNTER(gccct_miss)
|
|
RB_DEBUG_COUNTER(gccct_null)
|
|
|
|
// iseq
|
|
RB_DEBUG_COUNTER(iseq_num) // number of total created iseq
|
|
RB_DEBUG_COUNTER(iseq_cd_num) // number of total created cd (call_data)
|
|
|
|
/*
|
|
* call cache fastpath usage
|
|
*/
|
|
RB_DEBUG_COUNTER(ccf_general)
|
|
RB_DEBUG_COUNTER(ccf_iseq_setup)
|
|
RB_DEBUG_COUNTER(ccf_iseq_setup_0start)
|
|
RB_DEBUG_COUNTER(ccf_iseq_setup_tailcall_0start)
|
|
RB_DEBUG_COUNTER(ccf_iseq_fix) /* several functions created with tool/mk_call_iseq_optimized.rb */
|
|
RB_DEBUG_COUNTER(ccf_iseq_opt) /* has_opt == TRUE (has optional parameters), but other flags are FALSE */
|
|
RB_DEBUG_COUNTER(ccf_iseq_kw1) /* vm_call_iseq_setup_kwparm_kwarg() */
|
|
RB_DEBUG_COUNTER(ccf_iseq_kw2) /* vm_call_iseq_setup_kwparm_nokwarg() */
|
|
RB_DEBUG_COUNTER(ccf_cfunc)
|
|
RB_DEBUG_COUNTER(ccf_cfunc_with_frame)
|
|
RB_DEBUG_COUNTER(ccf_ivar) /* attr_reader */
|
|
RB_DEBUG_COUNTER(ccf_attrset) /* attr_writer */
|
|
RB_DEBUG_COUNTER(ccf_method_missing)
|
|
RB_DEBUG_COUNTER(ccf_zsuper)
|
|
RB_DEBUG_COUNTER(ccf_bmethod)
|
|
RB_DEBUG_COUNTER(ccf_opt_send)
|
|
RB_DEBUG_COUNTER(ccf_opt_call)
|
|
RB_DEBUG_COUNTER(ccf_opt_block_call)
|
|
RB_DEBUG_COUNTER(ccf_super_method)
|
|
|
|
/*
|
|
* control frame push counts.
|
|
*
|
|
* * frame_push: frame push counts.
|
|
* * frame_push_*: frame push counts per each type.
|
|
* * frame_R2R: Ruby frame to Ruby frame
|
|
* * frame_R2C: Ruby frame to C frame
|
|
* * frame_C2C: C frame to C frame
|
|
* * frame_C2R: C frame to Ruby frame
|
|
*/
|
|
RB_DEBUG_COUNTER(frame_push)
|
|
RB_DEBUG_COUNTER(frame_push_method)
|
|
RB_DEBUG_COUNTER(frame_push_block)
|
|
RB_DEBUG_COUNTER(frame_push_class)
|
|
RB_DEBUG_COUNTER(frame_push_top)
|
|
RB_DEBUG_COUNTER(frame_push_cfunc)
|
|
RB_DEBUG_COUNTER(frame_push_ifunc)
|
|
RB_DEBUG_COUNTER(frame_push_eval)
|
|
RB_DEBUG_COUNTER(frame_push_rescue)
|
|
RB_DEBUG_COUNTER(frame_push_dummy)
|
|
|
|
RB_DEBUG_COUNTER(frame_R2R)
|
|
RB_DEBUG_COUNTER(frame_R2C)
|
|
RB_DEBUG_COUNTER(frame_C2C)
|
|
RB_DEBUG_COUNTER(frame_C2R)
|
|
|
|
/* instance variable counts
|
|
*
|
|
* * ivar_get_ic_hit/miss: ivar_get inline cache (ic) hit/miss counts (VM insn)
|
|
* * ivar_get_ic_miss_serial: ivar_get ic miss reason by serial (VM insn)
|
|
* * ivar_get_ic_miss_unset: ... by unset (VM insn)
|
|
* * ivar_get_ic_miss_noobject: ... by "not T_OBJECT" (VM insn)
|
|
* * ivar_set_...: same counts with ivar_set (VM insn)
|
|
* * ivar_get/set_base: call counts of "rb_ivar_get/set()".
|
|
* because of (1) ic miss.
|
|
* (2) direct call by C extensions.
|
|
*/
|
|
RB_DEBUG_COUNTER(ivar_get_ic_hit)
|
|
RB_DEBUG_COUNTER(ivar_get_ic_miss)
|
|
RB_DEBUG_COUNTER(ivar_get_ic_miss_serial)
|
|
RB_DEBUG_COUNTER(ivar_get_ic_miss_unset)
|
|
RB_DEBUG_COUNTER(ivar_get_ic_miss_noobject)
|
|
RB_DEBUG_COUNTER(ivar_set_ic_hit)
|
|
RB_DEBUG_COUNTER(ivar_set_ic_miss)
|
|
RB_DEBUG_COUNTER(ivar_set_ic_miss_serial)
|
|
RB_DEBUG_COUNTER(ivar_set_ic_miss_unset)
|
|
RB_DEBUG_COUNTER(ivar_set_ic_miss_iv_hit)
|
|
RB_DEBUG_COUNTER(ivar_set_ic_miss_noobject)
|
|
RB_DEBUG_COUNTER(ivar_get_base)
|
|
RB_DEBUG_COUNTER(ivar_set_base)
|
|
|
|
/* local variable counts
|
|
*
|
|
* * lvar_get: total lvar get counts (VM insn)
|
|
* * lvar_get_dynamic: lvar get counts if accessing upper env (VM insn)
|
|
* * lvar_set*: same as "get"
|
|
* * lvar_set_slowpath: counts using vm_env_write_slowpath()
|
|
*/
|
|
RB_DEBUG_COUNTER(lvar_get)
|
|
RB_DEBUG_COUNTER(lvar_get_dynamic)
|
|
RB_DEBUG_COUNTER(lvar_set)
|
|
RB_DEBUG_COUNTER(lvar_set_dynamic)
|
|
RB_DEBUG_COUNTER(lvar_set_slowpath)
|
|
|
|
/* GC counts:
|
|
*
|
|
* * count: simple count
|
|
* * _minor: minor gc
|
|
* * _major: major gc
|
|
* * other suffix is corresponding to last_gc_info or
|
|
* gc_profile_record_flag in gc.c.
|
|
*/
|
|
RB_DEBUG_COUNTER(gc_count)
|
|
RB_DEBUG_COUNTER(gc_minor_newobj)
|
|
RB_DEBUG_COUNTER(gc_minor_malloc)
|
|
RB_DEBUG_COUNTER(gc_minor_method)
|
|
RB_DEBUG_COUNTER(gc_minor_capi)
|
|
RB_DEBUG_COUNTER(gc_minor_stress)
|
|
RB_DEBUG_COUNTER(gc_major_nofree)
|
|
RB_DEBUG_COUNTER(gc_major_oldgen)
|
|
RB_DEBUG_COUNTER(gc_major_shady)
|
|
RB_DEBUG_COUNTER(gc_major_force)
|
|
RB_DEBUG_COUNTER(gc_major_oldmalloc)
|
|
|
|
RB_DEBUG_COUNTER(gc_enter_start)
|
|
RB_DEBUG_COUNTER(gc_enter_mark_continue)
|
|
RB_DEBUG_COUNTER(gc_enter_sweep_continue)
|
|
RB_DEBUG_COUNTER(gc_enter_rest)
|
|
RB_DEBUG_COUNTER(gc_enter_finalizer)
|
|
|
|
RB_DEBUG_COUNTER(gc_isptr_trial)
|
|
RB_DEBUG_COUNTER(gc_isptr_range)
|
|
RB_DEBUG_COUNTER(gc_isptr_align)
|
|
RB_DEBUG_COUNTER(gc_isptr_maybe)
|
|
|
|
/* object allocation counts:
|
|
*
|
|
* * obj_newobj: newobj counts
|
|
* * obj_newobj_slowpath: newobj with slowpath counts
|
|
* * obj_newobj_wb_unprotected: newobj for wb_unprotected.
|
|
* * obj_free: obj_free() counts
|
|
* * obj_promote: promoted counts (oldgen)
|
|
* * obj_wb_unprotect: wb unprotect counts
|
|
*
|
|
* * obj_[type]_[attr]: *free'ed counts* for each type.
|
|
* Note that it is not a allocated counts.
|
|
* * [type]
|
|
* * _obj: T_OBJECT
|
|
* * _str: T_STRING
|
|
* * _ary: T_ARRAY
|
|
* * _xxx: T_XXX (hash, struct, ...)
|
|
*
|
|
* * [attr]
|
|
* * _ptr: R?? is not embed.
|
|
* * _embed: R?? is embed.
|
|
* * _transient: R?? uses transient heap.
|
|
* * type specific attr.
|
|
* * str_shared: str is shared.
|
|
* * str_nofree: nofree
|
|
* * str_fstr: fstr
|
|
* * hash_empty: hash is empty
|
|
* * hash_1_4: has 1 to 4 entries
|
|
* * hash_5_8: has 5 to 8 entries
|
|
* * hash_g8: has n entries (n>8)
|
|
* * match_under4: has under 4 oniguruma regions allocated
|
|
* * match_ge4: has n regions allocated (4<=n<8)
|
|
* * match_ge8: has n regions allocated (8<=n)
|
|
* * data_empty: T_DATA but no memory free.
|
|
* * data_xfree: free'ed by xfree().
|
|
* * data_imm_free: free'ed immediately.
|
|
* * data_zombie: free'ed with zombie.
|
|
* * imemo_*: T_IMEMO with each type.
|
|
*/
|
|
RB_DEBUG_COUNTER(obj_newobj)
|
|
RB_DEBUG_COUNTER(obj_newobj_slowpath)
|
|
RB_DEBUG_COUNTER(obj_newobj_wb_unprotected)
|
|
RB_DEBUG_COUNTER(obj_free)
|
|
RB_DEBUG_COUNTER(obj_promote)
|
|
RB_DEBUG_COUNTER(obj_wb_unprotect)
|
|
|
|
RB_DEBUG_COUNTER(obj_obj_embed)
|
|
RB_DEBUG_COUNTER(obj_obj_transient)
|
|
RB_DEBUG_COUNTER(obj_obj_ptr)
|
|
|
|
RB_DEBUG_COUNTER(obj_str_ptr)
|
|
RB_DEBUG_COUNTER(obj_str_embed)
|
|
RB_DEBUG_COUNTER(obj_str_shared)
|
|
RB_DEBUG_COUNTER(obj_str_nofree)
|
|
RB_DEBUG_COUNTER(obj_str_fstr)
|
|
|
|
RB_DEBUG_COUNTER(obj_ary_embed)
|
|
RB_DEBUG_COUNTER(obj_ary_transient)
|
|
RB_DEBUG_COUNTER(obj_ary_ptr)
|
|
RB_DEBUG_COUNTER(obj_ary_extracapa)
|
|
/*
|
|
ary_shared_create: shared ary by Array#dup and so on.
|
|
ary_shared: finished in shard.
|
|
ary_shared_root_occupied: shared_root but has only 1 refcnt.
|
|
The number (ary_shared - ary_shared_root_occupied) is meaningful.
|
|
*/
|
|
RB_DEBUG_COUNTER(obj_ary_shared_create)
|
|
RB_DEBUG_COUNTER(obj_ary_shared)
|
|
RB_DEBUG_COUNTER(obj_ary_shared_root_occupied)
|
|
|
|
RB_DEBUG_COUNTER(obj_hash_empty)
|
|
RB_DEBUG_COUNTER(obj_hash_1)
|
|
RB_DEBUG_COUNTER(obj_hash_2)
|
|
RB_DEBUG_COUNTER(obj_hash_3)
|
|
RB_DEBUG_COUNTER(obj_hash_4)
|
|
RB_DEBUG_COUNTER(obj_hash_5_8)
|
|
RB_DEBUG_COUNTER(obj_hash_g8)
|
|
|
|
RB_DEBUG_COUNTER(obj_hash_null)
|
|
RB_DEBUG_COUNTER(obj_hash_ar)
|
|
RB_DEBUG_COUNTER(obj_hash_st)
|
|
RB_DEBUG_COUNTER(obj_hash_transient)
|
|
RB_DEBUG_COUNTER(obj_hash_force_convert)
|
|
|
|
RB_DEBUG_COUNTER(obj_struct_embed)
|
|
RB_DEBUG_COUNTER(obj_struct_transient)
|
|
RB_DEBUG_COUNTER(obj_struct_ptr)
|
|
|
|
RB_DEBUG_COUNTER(obj_data_empty)
|
|
RB_DEBUG_COUNTER(obj_data_xfree)
|
|
RB_DEBUG_COUNTER(obj_data_imm_free)
|
|
RB_DEBUG_COUNTER(obj_data_zombie)
|
|
|
|
RB_DEBUG_COUNTER(obj_match_under4)
|
|
RB_DEBUG_COUNTER(obj_match_ge4)
|
|
RB_DEBUG_COUNTER(obj_match_ge8)
|
|
RB_DEBUG_COUNTER(obj_match_ptr)
|
|
|
|
RB_DEBUG_COUNTER(obj_iclass_ptr)
|
|
RB_DEBUG_COUNTER(obj_class_ptr)
|
|
RB_DEBUG_COUNTER(obj_module_ptr)
|
|
|
|
RB_DEBUG_COUNTER(obj_bignum_ptr)
|
|
RB_DEBUG_COUNTER(obj_bignum_embed)
|
|
RB_DEBUG_COUNTER(obj_float)
|
|
RB_DEBUG_COUNTER(obj_complex)
|
|
RB_DEBUG_COUNTER(obj_rational)
|
|
|
|
RB_DEBUG_COUNTER(obj_regexp_ptr)
|
|
RB_DEBUG_COUNTER(obj_file_ptr)
|
|
RB_DEBUG_COUNTER(obj_symbol)
|
|
|
|
RB_DEBUG_COUNTER(obj_imemo_ment)
|
|
RB_DEBUG_COUNTER(obj_imemo_iseq)
|
|
RB_DEBUG_COUNTER(obj_imemo_env)
|
|
RB_DEBUG_COUNTER(obj_imemo_tmpbuf)
|
|
RB_DEBUG_COUNTER(obj_imemo_ast)
|
|
RB_DEBUG_COUNTER(obj_imemo_cref)
|
|
RB_DEBUG_COUNTER(obj_imemo_svar)
|
|
RB_DEBUG_COUNTER(obj_imemo_throw_data)
|
|
RB_DEBUG_COUNTER(obj_imemo_ifunc)
|
|
RB_DEBUG_COUNTER(obj_imemo_memo)
|
|
RB_DEBUG_COUNTER(obj_imemo_parser_strterm)
|
|
RB_DEBUG_COUNTER(obj_imemo_callinfo)
|
|
RB_DEBUG_COUNTER(obj_imemo_callcache)
|
|
RB_DEBUG_COUNTER(obj_imemo_constcache)
|
|
|
|
/* ar_table */
|
|
RB_DEBUG_COUNTER(artable_hint_hit)
|
|
RB_DEBUG_COUNTER(artable_hint_miss)
|
|
RB_DEBUG_COUNTER(artable_hint_notfound)
|
|
|
|
/* heap function counts
|
|
*
|
|
* * heap_xmalloc/realloc/xfree: call counts
|
|
*/
|
|
RB_DEBUG_COUNTER(heap_xmalloc)
|
|
RB_DEBUG_COUNTER(heap_xrealloc)
|
|
RB_DEBUG_COUNTER(heap_xfree)
|
|
|
|
/* transient_heap */
|
|
RB_DEBUG_COUNTER(theap_alloc)
|
|
RB_DEBUG_COUNTER(theap_alloc_fail)
|
|
RB_DEBUG_COUNTER(theap_evacuate)
|
|
|
|
// VM sync
|
|
RB_DEBUG_COUNTER(vm_sync_lock)
|
|
RB_DEBUG_COUNTER(vm_sync_lock_enter)
|
|
RB_DEBUG_COUNTER(vm_sync_lock_enter_nb)
|
|
RB_DEBUG_COUNTER(vm_sync_lock_enter_cr)
|
|
RB_DEBUG_COUNTER(vm_sync_barrier)
|
|
|
|
/* mjit_exec() counts */
|
|
RB_DEBUG_COUNTER(mjit_exec)
|
|
RB_DEBUG_COUNTER(mjit_exec_not_added)
|
|
RB_DEBUG_COUNTER(mjit_exec_not_ready)
|
|
RB_DEBUG_COUNTER(mjit_exec_not_compiled)
|
|
RB_DEBUG_COUNTER(mjit_exec_call_func)
|
|
|
|
/* MJIT enqueue / unload */
|
|
RB_DEBUG_COUNTER(mjit_add_iseq_to_process)
|
|
RB_DEBUG_COUNTER(mjit_unload_units)
|
|
|
|
/* MJIT <-> VM frame push counts */
|
|
RB_DEBUG_COUNTER(mjit_frame_VM2VM)
|
|
RB_DEBUG_COUNTER(mjit_frame_VM2JT)
|
|
RB_DEBUG_COUNTER(mjit_frame_JT2JT)
|
|
RB_DEBUG_COUNTER(mjit_frame_JT2VM)
|
|
|
|
/* MJIT cancel counters */
|
|
RB_DEBUG_COUNTER(mjit_cancel)
|
|
RB_DEBUG_COUNTER(mjit_cancel_ivar_inline)
|
|
RB_DEBUG_COUNTER(mjit_cancel_exivar_inline)
|
|
RB_DEBUG_COUNTER(mjit_cancel_send_inline)
|
|
RB_DEBUG_COUNTER(mjit_cancel_opt_insn) /* CALL_SIMPLE_METHOD */
|
|
RB_DEBUG_COUNTER(mjit_cancel_invalidate_all)
|
|
RB_DEBUG_COUNTER(mjit_cancel_leave)
|
|
|
|
/* rb_mjit_unit_list length */
|
|
RB_DEBUG_COUNTER(mjit_length_unit_queue)
|
|
RB_DEBUG_COUNTER(mjit_length_active_units)
|
|
RB_DEBUG_COUNTER(mjit_length_compact_units)
|
|
RB_DEBUG_COUNTER(mjit_length_stale_units)
|
|
|
|
/* Other MJIT counters */
|
|
RB_DEBUG_COUNTER(mjit_compile_failures)
|
|
|
|
/* load (not implemented yet) */
|
|
/*
|
|
RB_DEBUG_COUNTER(load_files)
|
|
RB_DEBUG_COUNTER(load_path_is_not_realpath)
|
|
*/
|
|
#endif
|
|
|
|
#ifndef RUBY_DEBUG_COUNTER_H
|
|
#define RUBY_DEBUG_COUNTER_H 1
|
|
|
|
#include "ruby/internal/config.h"
|
|
#include <stddef.h> /* for size_t */
|
|
#include "ruby/ruby.h" /* for VALUE */
|
|
|
|
#if !defined(__GNUC__) && USE_DEBUG_COUNTER
|
|
#error "USE_DEBUG_COUNTER is not supported by other than __GNUC__"
|
|
#endif
|
|
|
|
enum rb_debug_counter_type {
|
|
#define RB_DEBUG_COUNTER(name) RB_DEBUG_COUNTER_##name,
|
|
#include __FILE__
|
|
RB_DEBUG_COUNTER_MAX
|
|
#undef RB_DEBUG_COUNTER
|
|
};
|
|
|
|
#if USE_DEBUG_COUNTER
|
|
extern size_t rb_debug_counter[];
|
|
RUBY_EXTERN struct rb_ractor_struct *ruby_single_main_ractor;
|
|
RUBY_EXTERN void rb_debug_counter_add_atomic(enum rb_debug_counter_type type, int add);
|
|
|
|
inline static int
|
|
rb_debug_counter_add(enum rb_debug_counter_type type, int add, int cond)
|
|
{
|
|
if (cond) {
|
|
if (ruby_single_main_ractor != NULL) {
|
|
rb_debug_counter[(int)type] += add;
|
|
}
|
|
else {
|
|
rb_debug_counter_add_atomic(type, add);
|
|
}
|
|
}
|
|
return cond;
|
|
}
|
|
|
|
inline static int
|
|
rb_debug_counter_max(enum rb_debug_counter_type type, unsigned int num)
|
|
{
|
|
// TODO: sync
|
|
if (rb_debug_counter[(int)type] < num) {
|
|
rb_debug_counter[(int)type] = num;
|
|
return 1;
|
|
}
|
|
else {
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
VALUE rb_debug_counter_reset(VALUE klass);
|
|
VALUE rb_debug_counter_show(VALUE klass);
|
|
|
|
#define RB_DEBUG_COUNTER_INC(type) rb_debug_counter_add(RB_DEBUG_COUNTER_##type, 1, 1)
|
|
#define RB_DEBUG_COUNTER_INC_UNLESS(type, cond) (!rb_debug_counter_add(RB_DEBUG_COUNTER_##type, 1, !(cond)))
|
|
#define RB_DEBUG_COUNTER_INC_IF(type, cond) rb_debug_counter_add(RB_DEBUG_COUNTER_##type, 1, !!(cond))
|
|
#define RB_DEBUG_COUNTER_ADD(type, num) rb_debug_counter_add(RB_DEBUG_COUNTER_##type, (num), 1)
|
|
#define RB_DEBUG_COUNTER_SETMAX(type, num) rb_debug_counter_max(RB_DEBUG_COUNTER_##type, (unsigned int)(num))
|
|
|
|
#else
|
|
#define RB_DEBUG_COUNTER_INC(type) ((void)0)
|
|
#define RB_DEBUG_COUNTER_INC_UNLESS(type, cond) (!!(cond))
|
|
#define RB_DEBUG_COUNTER_INC_IF(type, cond) (!!(cond))
|
|
#define RB_DEBUG_COUNTER_ADD(type, num) ((void)0)
|
|
#define RB_DEBUG_COUNTER_SETMAX(type, num) 0
|
|
#endif
|
|
|
|
void rb_debug_counter_show_results(const char *msg);
|
|
|
|
RUBY_SYMBOL_EXPORT_BEGIN
|
|
|
|
size_t ruby_debug_counter_get(const char **names_ptr, size_t *counters_ptr);
|
|
void ruby_debug_counter_reset(void);
|
|
void ruby_debug_counter_show_at_exit(int enable);
|
|
|
|
RUBY_SYMBOL_EXPORT_END
|
|
|
|
#endif /* RUBY_DEBUG_COUNTER_H */
|