Skip to content

Commit 0e0fad1

Browse files
authored
ZJIT: Specialize OPTIMIZED_METHOD_TYPE_CALL (ruby#15859)
Closes: Shopify#865 ## Benchmark ### lobsters - wall clock time - before patch: Average of last 10, non-warmup iters: 809ms - after patch: Average of last 10, non-warmup iters: 754ms - zjit stats below <details> <summary>before patch</summary> ``` ***ZJIT: Printing ZJIT statistics on exit*** Top-20 not inlined C methods (54.9% of total 18,003,698): Hash#fetch: 3,184,106 (17.7%) Regexp#match?: 707,148 ( 3.9%) Hash#key?: 689,879 ( 3.8%) String#sub!: 489,841 ( 2.7%) Array#include?: 470,648 ( 2.6%) Set#include?: 397,520 ( 2.2%) String#<<: 396,279 ( 2.2%) String#start_with?: 373,666 ( 2.1%) Kernel#dup: 352,617 ( 2.0%) Array#any?: 350,454 ( 1.9%) Hash#delete: 331,784 ( 1.8%) String.new: 307,248 ( 1.7%) Integer#===: 262,336 ( 1.5%) Symbol#end_with?: 255,538 ( 1.4%) Kernel#is_a?: 247,292 ( 1.4%) Process.clock_gettime: 221,588 ( 1.2%) Integer#>: 219,718 ( 1.2%) String#match?: 216,903 ( 1.2%) String#downcase: 213,108 ( 1.2%) Integer#<=: 202,617 ( 1.1%) Top-20 calls to C functions from JIT code (80.3% of total 130,255,689): rb_vm_opt_send_without_block: 28,329,698 (21.7%) rb_hash_aref: 8,992,191 ( 6.9%) rb_vm_env_write: 8,526,087 ( 6.5%) rb_vm_send: 8,337,448 ( 6.4%) rb_zjit_writebarrier_check_immediate: 7,809,310 ( 6.0%) rb_obj_is_kind_of: 6,098,929 ( 4.7%) rb_vm_getinstancevariable: 5,783,055 ( 4.4%) rb_vm_invokesuper: 5,038,443 ( 3.9%) rb_ivar_get_at_no_ractor_check: 4,762,093 ( 3.7%) rb_ary_entry: 4,283,966 ( 3.3%) rb_hash_aset: 2,429,862 ( 1.9%) rb_vm_setinstancevariable: 2,343,571 ( 1.8%) rb_vm_opt_getconstant_path: 2,284,810 ( 1.8%) Hash#fetch: 1,778,515 ( 1.4%) fetch: 1,405,591 ( 1.1%) rb_vm_invokeblock: 1,381,332 ( 1.1%) rb_str_buf_append: 1,362,272 ( 1.0%) rb_ec_ary_new_from_values: 1,324,997 ( 1.0%) rb_class_allocate_instance: 1,288,936 ( 1.0%) rb_hash_new_with_size: 998,628 ( 0.8%) Top-2 not optimized method types for send (100.0% of total 4,896,274): iseq: 4,893,452 (99.9%) null: 2,822 ( 0.1%) Top-4 not optimized method types for send_without_block (100.0% of 
total 782,296): optimized_send: 479,562 (61.3%) optimized_call: 256,609 (32.8%) null: 41,967 ( 5.4%) optimized_block_call: 4,158 ( 0.5%) Top-4 instructions with uncategorized fallback reason (100.0% of total 7,250,555): invokesuper: 5,038,443 (69.5%) invokeblock: 1,381,332 (19.1%) sendforward: 798,924 (11.0%) opt_send_without_block: 31,856 ( 0.4%) Top-18 send fallback reasons (100.0% of total 43,885,845): send_without_block_polymorphic: 18,533,639 (42.2%) uncategorized: 7,250,555 (16.5%) send_not_optimized_method_type: 4,896,274 (11.2%) send_without_block_no_profiles: 4,741,871 (10.8%) send_no_profiles: 2,865,577 ( 6.5%) one_or_more_complex_arg_pass: 2,825,240 ( 6.4%) send_without_block_not_optimized_method_type_optimized: 740,329 ( 1.7%) send_without_block_megamorphic: 709,818 ( 1.6%) send_polymorphic: 541,186 ( 1.2%) send_without_block_not_optimized_need_permission: 382,622 ( 0.9%) too_many_args_for_lir: 173,244 ( 0.4%) argc_param_mismatch: 50,382 ( 0.1%) send_without_block_not_optimized_method_type: 41,967 ( 0.1%) send_without_block_cfunc_array_variadic: 36,302 ( 0.1%) obj_to_string_not_string: 34,169 ( 0.1%) send_without_block_direct_keyword_mismatch: 32,436 ( 0.1%) send_megamorphic: 28,613 ( 0.1%) ccall_with_frame_too_many_args: 1,621 ( 0.0%) Top-4 setivar fallback reasons (100.0% of total 2,343,571): not_monomorphic: 2,120,856 (90.5%) not_t_object: 125,163 ( 5.3%) too_complex: 97,531 ( 4.2%) new_shape_needs_extension: 21 ( 0.0%) Top-2 getivar fallback reasons (100.0% of total 5,908,168): not_monomorphic: 5,658,909 (95.8%) too_complex: 249,259 ( 4.2%) Top-3 definedivar fallback reasons (100.0% of total 405,079): not_monomorphic: 397,150 (98.0%) too_complex: 5,122 ( 1.3%) not_t_object: 2,807 ( 0.7%) Top-6 invokeblock handler (100.0% of total 1,381,332): monomorphic_iseq: 685,359 (49.6%) polymorphic: 521,992 (37.8%) monomorphic_other: 104,640 ( 7.6%) monomorphic_ifunc: 55,505 ( 4.0%) no_profiles: 9,164 ( 0.7%) megamorphic: 4,672 ( 0.3%) Top-9 popular complex 
argument-parameter features not optimized (100.0% of total 3,097,538): param_kw_opt: 1,333,367 (43.0%) param_block: 632,885 (20.4%) param_forwardable: 600,601 (19.4%) param_rest: 329,020 (10.6%) param_kwrest: 119,971 ( 3.9%) caller_kw_splat: 39,001 ( 1.3%) caller_splat: 36,785 ( 1.2%) caller_blockarg: 5,798 ( 0.2%) caller_kwarg: 110 ( 0.0%) Top-1 compile error reasons (100.0% of total 186,900): exception_handler: 186,900 (100.0%) Top-7 unhandled YARV insns (100.0% of total 186,598): getblockparam: 99,414 (53.3%) invokesuperforward: 81,667 (43.8%) setblockparam: 2,837 ( 1.5%) getconstant: 1,537 ( 0.8%) checkmatch: 616 ( 0.3%) expandarray: 360 ( 0.2%) once: 167 ( 0.1%) Top-3 unhandled HIR insns (100.0% of total 236,962): throw: 198,474 (83.8%) invokebuiltin: 35,767 (15.1%) array_max: 2,721 ( 1.1%) Top-19 side exit reasons (100.0% of total 15,427,184): guard_type_failure: 6,865,696 (44.5%) guard_shape_failure: 6,779,586 (43.9%) block_param_proxy_not_iseq_or_ifunc: 1,030,319 ( 6.7%) unhandled_hir_insn: 236,962 ( 1.5%) compile_error: 186,900 ( 1.2%) unhandled_yarv_insn: 186,598 ( 1.2%) fixnum_mult_overflow: 50,739 ( 0.3%) block_param_proxy_modified: 28,119 ( 0.2%) patchpoint_no_singleton_class: 14,903 ( 0.1%) unhandled_newarray_send_pack: 14,481 ( 0.1%) fixnum_lshift_overflow: 10,085 ( 0.1%) patchpoint_stable_constant_names: 9,198 ( 0.1%) patchpoint_no_ep_escape: 7,815 ( 0.1%) expandarray_failure: 4,533 ( 0.0%) patchpoint_method_redefined: 662 ( 0.0%) obj_to_string_fallback: 277 ( 0.0%) guard_less_failure: 163 ( 0.0%) interrupt: 128 ( 0.0%) guard_greater_eq_failure: 20 ( 0.0%) send_count: 151,233,937 dynamic_send_count: 43,885,845 (29.0%) optimized_send_count: 107,348,092 (71.0%) dynamic_setivar_count: 2,343,571 ( 1.5%) dynamic_getivar_count: 5,908,168 ( 3.9%) dynamic_definedivar_count: 405,079 ( 0.3%) iseq_optimized_send_count: 37,324,023 (24.7%) inline_cfunc_optimized_send_count: 46,056,028 (30.5%) inline_iseq_optimized_send_count: 3,756,875 ( 2.5%) 
non_variadic_cfunc_optimized_send_count: 11,618,909 ( 7.7%) variadic_cfunc_optimized_send_count: 8,592,257 ( 5.7%) compiled_iseq_count: 5,289 failed_iseq_count: 0 compile_time: 1,664ms profile_time: 13ms gc_time: 20ms invalidation_time: 479ms vm_write_pc_count: 127,571,422 vm_write_sp_count: 127,571,422 vm_write_locals_count: 122,781,971 vm_write_stack_count: 122,781,971 vm_write_to_parent_iseq_local_count: 689,945 vm_read_from_parent_iseq_local_count: 14,721,820 guard_type_count: 167,633,896 guard_type_exit_ratio: 4.1% guard_shape_count: 0 code_region_bytes: 38,912,000 zjit_alloc_bytes: 40,542,102 total_mem_bytes: 79,454,102 side_exit_count: 15,427,184 total_insn_count: 927,373,567 vm_insn_count: 156,976,359 zjit_insn_count: 770,397,208 ratio_in_zjit: 83.1% ``` </details> <details> <summary>after patch</summary> ``` ***ZJIT: Printing ZJIT statistics on exit*** Top-20 not inlined C methods (55.0% of total 18,012,630): Hash#fetch: 3,184,101 (17.7%) Regexp#match?: 707,150 ( 3.9%) Hash#key?: 689,871 ( 3.8%) String#sub!: 489,841 ( 2.7%) Array#include?: 470,648 ( 2.6%) Set#include?: 397,520 ( 2.2%) String#<<: 396,279 ( 2.2%) String#start_with?: 382,538 ( 2.1%) Kernel#dup: 352,617 ( 2.0%) Array#any?: 350,454 ( 1.9%) Hash#delete: 331,802 ( 1.8%) String.new: 307,248 ( 1.7%) Integer#===: 262,336 ( 1.5%) Symbol#end_with?: 255,540 ( 1.4%) Kernel#is_a?: 247,292 ( 1.4%) Process.clock_gettime: 221,588 ( 1.2%) Integer#>: 219,718 ( 1.2%) String#match?: 216,905 ( 1.2%) String#downcase: 213,107 ( 1.2%) Integer#<=: 202,617 ( 1.1%) Top-20 calls to C functions from JIT code (80.1% of total 130,218,934): rb_vm_opt_send_without_block: 28,073,153 (21.6%) rb_hash_aref: 8,992,167 ( 6.9%) rb_vm_env_write: 8,526,089 ( 6.5%) rb_vm_send: 8,337,453 ( 6.4%) rb_zjit_writebarrier_check_immediate: 7,786,426 ( 6.0%) rb_obj_is_kind_of: 6,098,927 ( 4.7%) rb_vm_getinstancevariable: 5,783,053 ( 4.4%) rb_vm_invokesuper: 5,038,444 ( 3.9%) rb_ivar_get_at_no_ractor_check: 4,762,093 ( 3.7%) rb_ary_entry: 
4,283,965 ( 3.3%) rb_hash_aset: 2,429,864 ( 1.9%) rb_vm_setinstancevariable: 2,343,573 ( 1.8%) rb_vm_opt_getconstant_path: 2,284,809 ( 1.8%) Hash#fetch: 1,778,510 ( 1.4%) fetch: 1,405,591 ( 1.1%) rb_vm_invokeblock: 1,381,329 ( 1.1%) rb_str_buf_append: 1,362,272 ( 1.0%) rb_ec_ary_new_from_values: 1,325,005 ( 1.0%) rb_class_allocate_instance: 1,288,944 ( 1.0%) rb_hash_new_with_size: 998,629 ( 0.8%) Top-2 not optimized method types for send (100.0% of total 4,896,276): iseq: 4,893,454 (99.9%) null: 2,822 ( 0.1%) Top-3 not optimized method types for send_without_block (100.0% of total 525,687): optimized_send: 479,562 (91.2%) null: 41,967 ( 8.0%) optimized_block_call: 4,158 ( 0.8%) Top-4 instructions with uncategorized fallback reason (100.0% of total 7,250,556): invokesuper: 5,038,444 (69.5%) invokeblock: 1,381,329 (19.1%) sendforward: 798,924 (11.0%) opt_send_without_block: 31,859 ( 0.4%) Top-18 send fallback reasons (100.0% of total 43,629,303): send_without_block_polymorphic: 18,533,669 (42.5%) uncategorized: 7,250,556 (16.6%) send_not_optimized_method_type: 4,896,276 (11.2%) send_without_block_no_profiles: 4,741,899 (10.9%) send_no_profiles: 2,865,579 ( 6.6%) one_or_more_complex_arg_pass: 2,825,242 ( 6.5%) send_without_block_megamorphic: 709,818 ( 1.6%) send_polymorphic: 541,187 ( 1.2%) send_without_block_not_optimized_method_type_optimized: 483,720 ( 1.1%) send_without_block_not_optimized_need_permission: 382,623 ( 0.9%) too_many_args_for_lir: 173,244 ( 0.4%) argc_param_mismatch: 50,382 ( 0.1%) send_without_block_not_optimized_method_type: 41,967 ( 0.1%) send_without_block_cfunc_array_variadic: 36,302 ( 0.1%) obj_to_string_not_string: 34,169 ( 0.1%) send_without_block_direct_keyword_mismatch: 32,436 ( 0.1%) send_megamorphic: 28,613 ( 0.1%) ccall_with_frame_too_many_args: 1,621 ( 0.0%) Top-4 setivar fallback reasons (100.0% of total 2,343,573): not_monomorphic: 2,120,858 (90.5%) not_t_object: 125,163 ( 5.3%) too_complex: 97,531 ( 4.2%) new_shape_needs_extension: 
21 ( 0.0%) Top-2 getivar fallback reasons (100.0% of total 5,908,165): not_monomorphic: 5,658,912 (95.8%) too_complex: 249,253 ( 4.2%) Top-3 definedivar fallback reasons (100.0% of total 405,079): not_monomorphic: 397,150 (98.0%) too_complex: 5,122 ( 1.3%) not_t_object: 2,807 ( 0.7%) Top-6 invokeblock handler (100.0% of total 1,381,329): monomorphic_iseq: 685,363 (49.6%) polymorphic: 521,984 (37.8%) monomorphic_other: 104,640 ( 7.6%) monomorphic_ifunc: 55,505 ( 4.0%) no_profiles: 9,164 ( 0.7%) megamorphic: 4,673 ( 0.3%) Top-9 popular complex argument-parameter features not optimized (100.0% of total 3,094,719): param_kw_opt: 1,333,367 (43.1%) param_block: 632,886 (20.5%) param_forwardable: 600,605 (19.4%) param_rest: 329,019 (10.6%) param_kwrest: 119,971 ( 3.9%) caller_kw_splat: 39,001 ( 1.3%) caller_splat: 33,962 ( 1.1%) caller_blockarg: 5,798 ( 0.2%) caller_kwarg: 110 ( 0.0%) Top-1 compile error reasons (100.0% of total 186,917): exception_handler: 186,917 (100.0%) Top-7 unhandled YARV insns (100.0% of total 186,598): getblockparam: 99,414 (53.3%) invokesuperforward: 81,667 (43.8%) setblockparam: 2,837 ( 1.5%) getconstant: 1,537 ( 0.8%) checkmatch: 616 ( 0.3%) expandarray: 360 ( 0.2%) once: 167 ( 0.1%) Top-3 unhandled HIR insns (100.0% of total 236,969): throw: 198,475 (83.8%) invokebuiltin: 35,773 (15.1%) array_max: 2,721 ( 1.1%) Top-19 side exit reasons (100.0% of total 15,450,102): guard_type_failure: 6,888,596 (44.6%) guard_shape_failure: 6,779,586 (43.9%) block_param_proxy_not_iseq_or_ifunc: 1,030,319 ( 6.7%) unhandled_hir_insn: 236,969 ( 1.5%) compile_error: 186,917 ( 1.2%) unhandled_yarv_insn: 186,598 ( 1.2%) fixnum_mult_overflow: 50,739 ( 0.3%) block_param_proxy_modified: 28,119 ( 0.2%) patchpoint_no_singleton_class: 14,903 ( 0.1%) unhandled_newarray_send_pack: 14,481 ( 0.1%) fixnum_lshift_overflow: 10,085 ( 0.1%) patchpoint_stable_constant_names: 9,198 ( 0.1%) patchpoint_no_ep_escape: 7,815 ( 0.1%) expandarray_failure: 4,533 ( 0.0%) 
patchpoint_method_redefined: 662 ( 0.0%) obj_to_string_fallback: 277 ( 0.0%) guard_less_failure: 163 ( 0.0%) interrupt: 122 ( 0.0%) guard_greater_eq_failure: 20 ( 0.0%) send_count: 150,986,368 dynamic_send_count: 43,629,303 (28.9%) optimized_send_count: 107,357,065 (71.1%) dynamic_setivar_count: 2,343,573 ( 1.6%) dynamic_getivar_count: 5,908,165 ( 3.9%) dynamic_definedivar_count: 405,079 ( 0.3%) iseq_optimized_send_count: 37,324,039 (24.7%) inline_cfunc_optimized_send_count: 46,056,046 (30.5%) inline_iseq_optimized_send_count: 3,756,881 ( 2.5%) non_variadic_cfunc_optimized_send_count: 11,618,958 ( 7.7%) variadic_cfunc_optimized_send_count: 8,601,141 ( 5.7%) compiled_iseq_count: 5,289 failed_iseq_count: 0 compile_time: 1,700ms profile_time: 13ms gc_time: 21ms invalidation_time: 519ms vm_write_pc_count: 127,557,549 vm_write_sp_count: 127,557,549 vm_write_locals_count: 122,768,084 vm_write_stack_count: 122,768,084 vm_write_to_parent_iseq_local_count: 689,953 vm_read_from_parent_iseq_local_count: 14,730,705 guard_type_count: 167,853,730 guard_type_exit_ratio: 4.1% guard_shape_count: 0 code_region_bytes: 38,928,384 zjit_alloc_bytes: 41,103,415 total_mem_bytes: 80,031,799 side_exit_count: 15,450,102 total_insn_count: 927,432,364 vm_insn_count: 157,182,251 zjit_insn_count: 770,250,113 ratio_in_zjit: 83.1% ``` </details>
1 parent 8a586af commit 0e0fad1

File tree

8 files changed

+361
-24
lines changed

8 files changed

+361
-24
lines changed

jit.c

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -191,6 +191,14 @@ rb_jit_get_proc_ptr(VALUE procv)
191191
return proc;
192192
}
193193

194+
VALUE
195+
rb_optimized_call(VALUE *recv, rb_execution_context_t *ec, int argc, VALUE *argv, int kw_splat, VALUE block_handler)
196+
{
197+
rb_proc_t *proc;
198+
GetProcPtr(recv, proc);
199+
return rb_vm_invoke_proc(ec, proc, argc, argv, kw_splat, block_handler);
200+
}
201+
194202
unsigned int
195203
rb_jit_iseq_builtin_attrs(const rb_iseq_t *iseq)
196204
{

test/ruby/test_zjit.rb

Lines changed: 68 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -470,6 +470,74 @@ def test(&block)
470470
}, insns: [:getblockparamproxy]
471471
end
472472

473+
def test_optimized_method_call_proc_call
474+
assert_compiles '2', %q{
475+
p = proc { |x| x * 2 }
476+
def test(p)
477+
p.call(1)
478+
end
479+
test(p)
480+
test(p)
481+
}, call_threshold: 2, insns: [:opt_send_without_block]
482+
end
483+
484+
def test_optimized_method_call_proc_aref
485+
assert_compiles '4', %q{
486+
p = proc { |x| x * 2 }
487+
def test(p)
488+
p[2]
489+
end
490+
test(p)
491+
test(p)
492+
}, call_threshold: 2, insns: [:opt_aref]
493+
end
494+
495+
def test_optimized_method_call_proc_yield
496+
assert_compiles '6', %q{
497+
p = proc { |x| x * 2 }
498+
def test(p)
499+
p.yield(3)
500+
end
501+
test(p)
502+
test(p)
503+
}, call_threshold: 2, insns: [:opt_send_without_block]
504+
end
505+
506+
def test_optimized_method_call_proc_kw_splat
507+
assert_compiles '3', %q{
508+
p = proc { |**kw| kw[:a] + kw[:b] }
509+
def test(p, h)
510+
p.call(**h)
511+
end
512+
h = { a: 1, b: 2 }
513+
test(p, h)
514+
test(p, h)
515+
}, call_threshold: 2, insns: [:opt_send_without_block]
516+
end
517+
518+
def test_optimized_method_call_proc_call_splat
519+
assert_compiles '43', %q{
520+
p = proc { |x| x + 1 }
521+
def test(p)
522+
ary = [42]
523+
p.call(*ary)
524+
end
525+
test(p)
526+
test(p)
527+
}, call_threshold: 2
528+
end
529+
530+
def test_optimized_method_call_proc_call_kwarg
531+
assert_compiles '1', %q{
532+
p = proc { |a:| a }
533+
def test(p)
534+
p.call(a: 1)
535+
end
536+
test(p)
537+
test(p)
538+
}, call_threshold: 2
539+
end
540+
473541
def test_call_a_forwardable_method
474542
assert_runs '[]', %q{
475543
def test_root = forwardable

yjit.c

Lines changed: 0 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -223,14 +223,6 @@ typedef struct rb_iseq_param_keyword rb_seq_param_keyword_struct;
223223

224224
ID rb_get_symbol_id(VALUE namep);
225225

226-
VALUE
227-
rb_optimized_call(VALUE *recv, rb_execution_context_t *ec, int argc, VALUE *argv, int kw_splat, VALUE block_handler)
228-
{
229-
rb_proc_t *proc;
230-
GetProcPtr(recv, proc);
231-
return rb_vm_invoke_proc(ec, proc, argc, argv, kw_splat, block_handler);
232-
}
233-
234226
// If true, the iseq has only opt_invokebuiltin_delegate(_leave) and leave insns.
235227
static bool
236228
invokebuiltin_delegate_leave_p(const rb_iseq_t *iseq)

yjit/src/cruby_bindings.inc.rs

Lines changed: 8 additions & 8 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

zjit/src/codegen.rs

Lines changed: 30 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -404,6 +404,7 @@ fn gen_insn(cb: &mut CodeBlock, jit: &mut JITState, asm: &mut Assembler, functio
404404
Insn::SendWithoutBlockDirect { cme, iseq, recv, args, state, .. } => gen_send_iseq_direct(cb, jit, asm, *cme, *iseq, opnd!(recv), opnds!(args), &function.frame_state(*state), None),
405405
&Insn::InvokeSuper { cd, blockiseq, state, reason, .. } => gen_invokesuper(jit, asm, cd, blockiseq, &function.frame_state(state), reason),
406406
&Insn::InvokeBlock { cd, state, reason, .. } => gen_invokeblock(jit, asm, cd, &function.frame_state(state), reason),
407+
Insn::InvokeProc { recv, args, state, kw_splat } => gen_invokeproc(jit, asm, opnd!(recv), opnds!(args), *kw_splat, &function.frame_state(*state)),
407408
// Ensure we have enough room to fit ec, self, and arguments
408409
// TODO remove this check when we have stack args (we can use Time.new to test it)
409410
Insn::InvokeBuiltin { bf, state, .. } if bf.argc + 2 > (C_ARG_OPNDS.len() as i32) => return Err(*state),
@@ -1497,6 +1498,35 @@ fn gen_invokeblock(
14971498
)
14981499
}
14991500

1501+
fn gen_invokeproc(
1502+
jit: &mut JITState,
1503+
asm: &mut Assembler,
1504+
recv: Opnd,
1505+
args: Vec<Opnd>,
1506+
kw_splat: bool,
1507+
state: &FrameState,
1508+
) -> lir::Opnd {
1509+
gen_prepare_non_leaf_call(jit, asm, state);
1510+
1511+
asm_comment!(asm, "call invokeproc");
1512+
1513+
let argv_ptr = gen_push_opnds(asm, &args);
1514+
let kw_splat_opnd = Opnd::Imm(i64::from(kw_splat));
1515+
let result = asm_ccall!(
1516+
asm,
1517+
rb_optimized_call,
1518+
recv,
1519+
EC,
1520+
args.len().into(),
1521+
argv_ptr,
1522+
kw_splat_opnd,
1523+
VM_BLOCK_HANDLER_NONE.into()
1524+
);
1525+
gen_pop_opnds(asm, &args);
1526+
1527+
result
1528+
}
1529+
15001530
/// Compile a dynamic dispatch for `super`
15011531
fn gen_invokesuper(
15021532
jit: &mut JITState,

zjit/src/cruby_bindings.inc.rs

Lines changed: 8 additions & 0 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

zjit/src/hir.rs

Lines changed: 59 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -932,6 +932,13 @@ pub enum Insn {
932932
state: InsnId,
933933
reason: SendFallbackReason,
934934
},
935+
/// Invoke a Proc through the optimized `Proc#call` method type.
936+
InvokeProc {
937+
recv: InsnId,
938+
args: Vec<InsnId>,
939+
state: InsnId,
940+
kw_splat: bool,
941+
},
935942

936943
/// Optimized ISEQ call
937944
SendWithoutBlockDirect {
@@ -1452,6 +1459,16 @@ impl<'a> std::fmt::Display for InsnPrinter<'a> {
14521459
write!(f, " # SendFallbackReason: {reason}")?;
14531460
Ok(())
14541461
}
1462+
Insn::InvokeProc { recv, args, kw_splat, .. } => {
1463+
write!(f, "InvokeProc {recv}")?;
1464+
for arg in args {
1465+
write!(f, ", {arg}")?;
1466+
}
1467+
if *kw_splat {
1468+
write!(f, ", kw_splat")?;
1469+
}
1470+
Ok(())
1471+
}
14551472
Insn::InvokeBuiltin { bf, args, leaf, .. } => {
14561473
let bf_name = unsafe { CStr::from_ptr(bf.name) }.to_str().unwrap();
14571474
write!(f, "InvokeBuiltin{} {}",
@@ -2228,6 +2245,12 @@ impl Function {
22282245
state,
22292246
reason,
22302247
},
2248+
&InvokeProc { recv, ref args, state, kw_splat } => InvokeProc {
2249+
recv: find!(recv),
2250+
args: find_vec!(args),
2251+
state: find!(state),
2252+
kw_splat,
2253+
},
22312254
&InvokeBuiltin { bf, recv, ref args, state, leaf, return_type } => InvokeBuiltin { bf, recv: find!(recv), args: find_vec!(args), state, leaf, return_type },
22322255
&ArrayDup { val, state } => ArrayDup { val: find!(val), state },
22332256
&HashDup { val, state } => HashDup { val: find!(val), state },
@@ -2416,6 +2439,7 @@ impl Function {
24162439
Insn::SendForward { .. } => types::BasicObject,
24172440
Insn::InvokeSuper { .. } => types::BasicObject,
24182441
Insn::InvokeBlock { .. } => types::BasicObject,
2442+
Insn::InvokeProc { .. } => types::BasicObject,
24192443
Insn::InvokeBuiltin { return_type, .. } => return_type.unwrap_or(types::BasicObject),
24202444
Insn::Defined { pushval, .. } => Type::from_value(*pushval).union(types::NilClass),
24212445
Insn::DefinedIvar { pushval, .. } => Type::from_value(*pushval).union(types::NilClass),
@@ -2828,14 +2852,7 @@ impl Function {
28282852
};
28292853
let ci = unsafe { get_call_data_ci(cd) }; // info about the call site
28302854

2831-
// If the call site info indicates that the `Function` has overly complex arguments, then
2832-
// do not optimize into a `SendWithoutBlockDirect`.
28332855
let flags = unsafe { rb_vm_ci_flag(ci) };
2834-
if unspecializable_call_type(flags) {
2835-
self.count_complex_call_features(block, flags);
2836-
self.set_dynamic_send_reason(insn_id, ComplexArgPass);
2837-
self.push_insn_id(block, insn_id); continue;
2838-
}
28392856

28402857
let mid = unsafe { vm_ci_mid(ci) };
28412858
// Do method lookup
@@ -2863,6 +2880,14 @@ impl Function {
28632880
def_type = unsafe { get_cme_def_type(cme) };
28642881
}
28652882

2883+
// If the call site info indicates that the `Function` has overly complex arguments, then do not optimize into a `SendWithoutBlockDirect`.
2884+
// Optimized methods (`VM_METHOD_TYPE_OPTIMIZED`) handle their own argument constraints (e.g., kw_splat for Proc call).
2885+
if def_type != VM_METHOD_TYPE_OPTIMIZED && unspecializable_call_type(flags) {
2886+
self.count_complex_call_features(block, flags);
2887+
self.set_dynamic_send_reason(insn_id, ComplexArgPass);
2888+
self.push_insn_id(block, insn_id); continue;
2889+
}
2890+
28662891
if def_type == VM_METHOD_TYPE_ISEQ {
28672892
// TODO(max): Allow non-iseq; cache cme
28682893
// Only specialize positional-positional calls
@@ -2993,7 +3018,31 @@ impl Function {
29933018
} else if def_type == VM_METHOD_TYPE_OPTIMIZED {
29943019
let opt_type: OptimizedMethodType = unsafe { get_cme_def_body_optimized_type(cme) }.into();
29953020
match (opt_type, args.as_slice()) {
3021+
(OptimizedMethodType::Call, _) => {
3022+
if flags & (VM_CALL_ARGS_SPLAT | VM_CALL_KWARG) != 0 {
3023+
self.count_complex_call_features(block, flags);
3024+
self.set_dynamic_send_reason(insn_id, ComplexArgPass);
3025+
self.push_insn_id(block, insn_id); continue;
3026+
}
3027+
// Check singleton class assumption first, before emitting other patchpoints
3028+
if !self.assume_no_singleton_classes(block, klass, state) {
3029+
self.set_dynamic_send_reason(insn_id, SingletonClassSeen);
3030+
self.push_insn_id(block, insn_id); continue;
3031+
}
3032+
self.push_insn(block, Insn::PatchPoint { invariant: Invariant::MethodRedefined { klass, method: mid, cme }, state });
3033+
if let Some(profiled_type) = profiled_type {
3034+
recv = self.push_insn(block, Insn::GuardType { val: recv, guard_type: Type::from_profiled_type(profiled_type), state });
3035+
}
3036+
let kw_splat = flags & VM_CALL_KW_SPLAT != 0;
3037+
let invoke_proc = self.push_insn(block, Insn::InvokeProc { recv, args: args.clone(), state, kw_splat });
3038+
self.make_equal_to(insn_id, invoke_proc);
3039+
}
29963040
(OptimizedMethodType::StructAref, &[]) | (OptimizedMethodType::StructAset, &[_]) => {
3041+
if unspecializable_call_type(flags) {
3042+
self.count_complex_call_features(block, flags);
3043+
self.set_dynamic_send_reason(insn_id, ComplexArgPass);
3044+
self.push_insn_id(block, insn_id); continue;
3045+
}
29973046
let index: i32 = unsafe { get_cme_def_body_optimized_index(cme) }
29983047
.try_into()
29993048
.unwrap();
@@ -4416,7 +4465,8 @@ impl Function {
44164465
| &Insn::CCallWithFrame { recv, ref args, state, .. }
44174466
| &Insn::SendWithoutBlockDirect { recv, ref args, state, .. }
44184467
| &Insn::InvokeBuiltin { recv, ref args, state, .. }
4419-
| &Insn::InvokeSuper { recv, ref args, state, .. } => {
4468+
| &Insn::InvokeSuper { recv, ref args, state, .. }
4469+
| &Insn::InvokeProc { recv, ref args, state, .. } => {
44204470
worklist.push_back(recv);
44214471
worklist.extend(args);
44224472
worklist.push_back(state);
@@ -5041,6 +5091,7 @@ impl Function {
50415091
| Insn::CCallWithFrame { recv, ref args, .. }
50425092
| Insn::CCallVariadic { recv, ref args, .. }
50435093
| Insn::InvokeBuiltin { recv, ref args, .. }
5094+
| Insn::InvokeProc { recv, ref args, .. }
50445095
| Insn::ArrayInclude { target: recv, elements: ref args, .. } => {
50455096
self.assert_subtype(insn_id, recv, types::BasicObject)?;
50465097
for &arg in args {

0 commit comments

Comments
 (0)