Skip to content

Commit 840ec0e

Browse files
tenderlove and XrXr
authored and committed
Improve set instance variable
This commit improves the set ivar implementation.
1 parent 0285e8d commit 840ec0e

File tree

3 files changed

+212
-56
lines changed

3 files changed

+212
-56
lines changed

bootstraptest/test_yjit.rb

Lines changed: 85 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -239,6 +239,91 @@ def itself
239239
end
240240
}
241241

242+
# test setinstancevariable on extended objects
243+
assert_equal '1', %q{
244+
class Extended
245+
attr_reader :one
246+
247+
def write_many
248+
@a = 1
249+
@b = 2
250+
@c = 3
251+
@d = 4
252+
@one = 1
253+
end
254+
end
255+
256+
foo = Extended.new
257+
foo.write_many
258+
foo.write_many
259+
foo.write_many
260+
}
261+
262+
# test setinstancevariable on embedded objects
263+
assert_equal '1', %q{
264+
class Embedded
265+
attr_reader :one
266+
267+
def write_one
268+
@one = 1
269+
end
270+
end
271+
272+
foo = Embedded.new
273+
foo.write_one
274+
foo.write_one
275+
foo.write_one
276+
}
277+
278+
# test setinstancevariable after extension
279+
assert_equal '[10, 11, 12, 13, 1]', %q{
280+
class WillExtend
281+
attr_reader :one
282+
283+
def make_extended
284+
@foo1 = 10
285+
@foo2 = 11
286+
@foo3 = 12
287+
@foo4 = 13
288+
end
289+
290+
def write_one
291+
@one = 1
292+
end
293+
294+
def read_all
295+
[@foo1, @foo2, @foo3, @foo4, @one]
296+
end
297+
end
298+
299+
foo = WillExtend.new
300+
foo.write_one
301+
foo.write_one
302+
foo.make_extended
303+
foo.write_one
304+
foo.read_all
305+
}
306+
307+
# test setinstancevariable on frozen object
308+
assert_equal 'object was not modified', %q{
309+
class WillFreeze
310+
def write
311+
@ivar = 1
312+
end
313+
end
314+
315+
wf = WillFreeze.new
316+
wf.write
317+
wf.write
318+
wf.freeze
319+
320+
begin
321+
wf.write
322+
rescue FrozenError
323+
"object was not modified"
324+
end
325+
}
326+
242327
# Test getinstancevariable and inline caches
243328
assert_equal '6', %q{
244329
class Foo

yjit_codegen.c

Lines changed: 120 additions & 56 deletions
Original file line numberDiff line numberDiff line change
@@ -745,6 +745,112 @@ enum {
745745
OSWB_MAX_DEPTH = 5, // up to 5 different classes
746746
};
747747

748+
// Codegen for setting an instance variable.
749+
// Preconditions:
750+
// - receiver is in REG0
751+
// - receiver has the same class as CLASS_OF(comptime_receiver)
752+
// - no stack push or pops to ctx since the entry to the codegen of the instruction being compiled
753+
static codegen_status_t
754+
gen_set_ivar(jitstate_t *jit, ctx_t *ctx, const int max_chain_depth, VALUE comptime_receiver, ID ivar_name, insn_opnd_t reg0_opnd, uint8_t *side_exit)
755+
{
756+
VALUE comptime_val_klass = CLASS_OF(comptime_receiver);
757+
const ctx_t starting_context = *ctx; // make a copy for use with jit_chain_guard
758+
759+
// If the class uses the default allocator, instances should all be T_OBJECT
760+
// NOTE: This assumes nobody changes the allocator of the class after allocation.
761+
// Eventually, we can encode whether an object is T_OBJECT or not
762+
// inside object shapes.
763+
if (rb_get_alloc_func(comptime_val_klass) != rb_class_allocate_instance) {
764+
GEN_COUNTER_INC(cb, setivar_not_object);
765+
return YJIT_CANT_COMPILE;
766+
}
767+
RUBY_ASSERT(BUILTIN_TYPE(comptime_receiver) == T_OBJECT); // because we checked the allocator
768+
769+
// ID for the name of the ivar
770+
ID id = ivar_name;
771+
struct rb_iv_index_tbl_entry *ent;
772+
struct st_table *iv_index_tbl = ROBJECT_IV_INDEX_TBL(comptime_receiver);
773+
774+
// Bail if this is a heap object, because this needs a write barrier
775+
ADD_COMMENT(cb, "guard value is immediate");
776+
test(cb, REG1, imm_opnd(RUBY_IMMEDIATE_MASK));
777+
jz_ptr(cb, COUNTED_EXIT(side_exit, setivar_val_heapobject));
778+
779+
// Lookup index for the ivar the instruction loads
780+
if (iv_index_tbl && rb_iv_index_tbl_lookup(iv_index_tbl, id, &ent)) {
781+
uint32_t ivar_index = ent->index;
782+
783+
x86opnd_t val_to_write = ctx_stack_pop(ctx, 1);
784+
mov(cb, REG1, val_to_write);
785+
786+
x86opnd_t flags_opnd = member_opnd(REG0, struct RBasic, flags);
787+
788+
// Bail if this object is frozen
789+
ADD_COMMENT(cb, "guard self is not frozen");
790+
test(cb, flags_opnd, imm_opnd(RUBY_FL_FREEZE));
791+
jz_ptr(cb, COUNTED_EXIT(side_exit, setivar_frozen));
792+
793+
// Pop receiver if it's on the temp stack
794+
if (!reg0_opnd.is_self) {
795+
(void)ctx_stack_pop(ctx, 1);
796+
}
797+
798+
// Compile time self is embedded and the ivar index lands within the object
799+
if (RB_FL_TEST_RAW(comptime_receiver, ROBJECT_EMBED) && ivar_index < ROBJECT_EMBED_LEN_MAX) {
800+
// See ROBJECT_IVPTR() from include/ruby/internal/core/robject.h
801+
802+
// Guard that self is embedded
803+
// TODO: BT and JC is shorter
804+
ADD_COMMENT(cb, "guard embedded setivar");
805+
test(cb, flags_opnd, imm_opnd(ROBJECT_EMBED));
806+
jit_chain_guard(JCC_JZ, jit, &starting_context, max_chain_depth, side_exit);
807+
808+
// Load the variable
809+
x86opnd_t ivar_opnd = mem_opnd(64, REG0, offsetof(struct RObject, as.ary) + ivar_index * SIZEOF_VALUE);
810+
811+
mov(cb, ivar_opnd, REG1);
812+
813+
// Push the ivar on the stack
814+
// For attr_writer we'll need to push the value on the stack
815+
//x86opnd_t out_opnd = ctx_stack_push(ctx, TYPE_UNKNOWN);
816+
}
817+
else {
818+
// Compile time value is *not* embeded.
819+
820+
// Guard that value is *not* embedded
821+
// See ROBJECT_IVPTR() from include/ruby/internal/core/robject.h
822+
ADD_COMMENT(cb, "guard extended setivar");
823+
x86opnd_t flags_opnd = member_opnd(REG0, struct RBasic, flags);
824+
test(cb, flags_opnd, imm_opnd(ROBJECT_EMBED));
825+
jit_chain_guard(JCC_JNZ, jit, &starting_context, max_chain_depth, side_exit);
826+
827+
// check that the extended table is big enough
828+
if (ivar_index >= ROBJECT_EMBED_LEN_MAX + 1) {
829+
// Check that the slot is inside the extended table (num_slots > index)
830+
x86opnd_t num_slots = mem_opnd(32, REG0, offsetof(struct RObject, as.heap.numiv));
831+
cmp(cb, num_slots, imm_opnd(ivar_index));
832+
jle_ptr(cb, COUNTED_EXIT(side_exit, setivar_idx_out_of_range));
833+
}
834+
835+
// Get a pointer to the extended table
836+
x86opnd_t tbl_opnd = mem_opnd(64, REG0, offsetof(struct RObject, as.heap.ivptr));
837+
mov(cb, REG0, tbl_opnd);
838+
839+
// Write the ivar to the extended table
840+
x86opnd_t ivar_opnd = mem_opnd(64, REG0, sizeof(VALUE) * ivar_index);
841+
mov(cb, REG1, val_to_write);
842+
mov(cb, ivar_opnd, REG1);
843+
}
844+
845+
// Jump to next instruction. This allows guard chains to share the same successor.
846+
jit_jump_to_next_insn(jit, ctx);
847+
return YJIT_END_BLOCK;
848+
}
849+
850+
GEN_COUNTER_INC(cb, setivar_name_not_mapped);
851+
return YJIT_CANT_COMPILE;
852+
}
853+
748854
// Codegen for getting an instance variable.
749855
// Preconditions:
750856
// - receiver is in REG0
@@ -867,7 +973,7 @@ gen_getinstancevariable(jitstate_t *jit, ctx_t *ctx)
867973

868974
// Guard that the receiver has the same class as the one from compile time.
869975
mov(cb, REG0, member_opnd(REG_CFP, rb_control_frame_t, self));
870-
guard_self_is_heap(cb, REG0, side_exit, ctx);
976+
guard_self_is_heap(cb, REG0, COUNTED_EXIT(side_exit, getivar_se_self_not_heap), ctx);
871977

872978
jit_guard_known_klass(jit, ctx, comptime_val_klass, OPND_SELF, GETIVAR_MAX_DEPTH, side_exit);
873979

@@ -877,69 +983,27 @@ gen_getinstancevariable(jitstate_t *jit, ctx_t *ctx)
877983
static codegen_status_t
878984
gen_setinstancevariable(jitstate_t* jit, ctx_t* ctx)
879985
{
880-
IVC ic = (IVC)jit_get_arg(jit, 1);
881-
882-
// Check that the inline cache has been set, slot index is known
883-
if (!ic->entry) {
884-
return YJIT_CANT_COMPILE;
986+
// Defer compilation so we can specialize on a runtime `self`
987+
if (!jit_at_current_insn(jit)) {
988+
defer_compilation(jit->block, jit->insn_idx, ctx);
989+
return YJIT_END_BLOCK;
885990
}
886991

887-
// If the class uses the default allocator, instances should all be T_OBJECT
888-
// NOTE: This assumes nobody changes the allocator of the class after allocation.
889-
// Eventually, we can encode whether an object is T_OBJECT or not
890-
// inside object shapes.
891-
if (rb_get_alloc_func(ic->entry->class_value) != rb_class_allocate_instance) {
892-
return YJIT_CANT_COMPILE;
893-
}
992+
ID ivar_name = (ID)jit_get_arg(jit, 0);
894993

895-
uint32_t ivar_index = ic->entry->index;
994+
VALUE comptime_val = jit_peek_at_self(jit, ctx);
995+
VALUE comptime_val_klass = CLASS_OF(comptime_val);
896996

897-
// Create a size-exit to fall back to the interpreter
898-
uint8_t* side_exit = yjit_side_exit(jit, ctx);
997+
// Generate a side exit
998+
uint8_t *side_exit = yjit_side_exit(jit, ctx);
899999

900-
// Load self from CFP
1000+
// Guard that the receiver has the same class as the one from compile time.
9011001
mov(cb, REG0, member_opnd(REG_CFP, rb_control_frame_t, self));
1002+
guard_self_is_heap(cb, REG0, COUNTED_EXIT(side_exit, setivar_se_self_not_heap), ctx);
9021003

903-
guard_self_is_heap(cb, REG0, side_exit, ctx);
904-
905-
// Bail if receiver class is different from compiled time call cache class
906-
x86opnd_t klass_opnd = mem_opnd(64, REG0, offsetof(struct RBasic, klass));
907-
mov(cb, REG1, klass_opnd);
908-
x86opnd_t serial_opnd = mem_opnd(64, REG1, offsetof(struct RClass, class_serial));
909-
cmp(cb, serial_opnd, imm_opnd(ic->entry->class_serial));
910-
jne_ptr(cb, side_exit);
911-
912-
// Bail if the ivars are not on the extended table
913-
// See ROBJECT_IVPTR() from include/ruby/internal/core/robject.h
914-
x86opnd_t flags_opnd = member_opnd(REG0, struct RBasic, flags);
915-
test(cb, flags_opnd, imm_opnd(ROBJECT_EMBED));
916-
jnz_ptr(cb, side_exit);
917-
918-
// If we can't guarantee that the extended table is big enoughg
919-
if (ivar_index >= ROBJECT_EMBED_LEN_MAX + 1) {
920-
// Check that the slot is inside the extended table (num_slots > index)
921-
x86opnd_t num_slots = mem_opnd(32, REG0, offsetof(struct RObject, as.heap.numiv));
922-
cmp(cb, num_slots, imm_opnd(ivar_index));
923-
jle_ptr(cb, side_exit);
924-
}
925-
926-
// Get a pointer to the extended table
927-
x86opnd_t tbl_opnd = mem_opnd(64, REG0, offsetof(struct RObject, as.heap.ivptr));
928-
mov(cb, REG0, tbl_opnd);
929-
930-
// Pop the value to write from the stack
931-
x86opnd_t stack_top = ctx_stack_pop(ctx, 1);
932-
mov(cb, REG1, stack_top);
933-
934-
// Bail if this is a heap object, because this needs a write barrier
935-
test(cb, REG1, imm_opnd(RUBY_IMMEDIATE_MASK));
936-
jz_ptr(cb, side_exit);
937-
938-
// Write the ivar to the extended table
939-
x86opnd_t ivar_opnd = mem_opnd(64, REG0, sizeof(VALUE) * ivar_index);
940-
mov(cb, ivar_opnd, REG1);
1004+
jit_guard_known_klass(jit, ctx, comptime_val_klass, OPND_SELF, GETIVAR_MAX_DEPTH, side_exit);
9411005

942-
return YJIT_KEEP_COMPILING;
1006+
return gen_set_ivar(jit, ctx, GETIVAR_MAX_DEPTH, comptime_val, ivar_name, OPND_SELF, side_exit);
9431007
}
9441008

9451009
static void

yjit_iface.h

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -57,6 +57,13 @@ YJIT_DECLARE_COUNTERS(
5757
getivar_name_not_mapped,
5858
getivar_not_object,
5959

60+
setivar_se_self_not_heap,
61+
setivar_idx_out_of_range,
62+
setivar_val_heapobject,
63+
setivar_name_not_mapped,
64+
setivar_not_object,
65+
setivar_frozen,
66+
6067
oaref_argc_not_one,
6168
oaref_arg_not_fixnum,
6269

0 commit comments

Comments
 (0)