Skip to content

Commit

Permalink
YJIT: handle expandarray_rhs_too_small case
Browse files Browse the repository at this point in the history
YJIT: fix csel bug in x86 backend, add test

Remove commented out lines

Refactor expandarray to use chain guards
  • Loading branch information
maximecb committed Aug 2, 2023
1 parent 32e828b commit 10f619d
Show file tree
Hide file tree
Showing 4 changed files with 132 additions and 39 deletions.
11 changes: 11 additions & 0 deletions bootstraptest/test_yjit.rb
Original file line number Diff line number Diff line change
Expand Up @@ -2276,6 +2276,17 @@ def expandarray_rhs_too_small
expandarray_rhs_too_small
}

# Destructuring into three targets from arrays of length 2, 3, then 2 again:
# the missing third slot must come back as nil, and the result must stay
# correct when the array length changes between calls to the same method.
assert_equal '[nil, 2, nil]', %q{
def foo(arr)
a, b, c = arr
end
a, b, c1 = foo([0, 1])
a, b, c2 = foo([0, 1, 2])
a, b, c3 = foo([0, 1])
[c1, c2, c3]
}

assert_equal '[1, [2]]', %q{
def expandarray_splat
a, *b = [1, 2]
Expand Down
66 changes: 54 additions & 12 deletions yjit/src/backend/x86_64/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -428,11 +428,31 @@ impl Assembler
}
}

fn emit_csel(cb: &mut CodeBlock, truthy: Opnd, falsy: Opnd, out: Opnd, cmov_fn: fn(&mut CodeBlock, X86Opnd, X86Opnd)) {
if out != truthy {
mov(cb, out.into(), truthy.into());
/// Emit a conditional select: leave either `truthy` or `falsy` in `out`.
///
/// One value is first moved into `out` unconditionally, then a conditional
/// move overwrites it with the other value.
///
/// * `cmov_fn`  - conditional move used with `truthy` as its source, i.e. it
///   must fire when the select condition holds.
/// * `cmov_neg` - conditional move used with `falsy` as its source, i.e. it
///   must fire when the select condition does NOT hold.
///
/// Callers pass the matching pair, e.g. `cmovz, cmovnz` for `CSelZ`.
fn emit_csel(
cb: &mut CodeBlock,
truthy: Opnd,
falsy: Opnd,
out: Opnd,
cmov_fn: fn(&mut CodeBlock, X86Opnd, X86Opnd),
cmov_neg: fn(&mut CodeBlock, X86Opnd, X86Opnd)){

// Assert that output is a register
out.unwrap_reg();

// If the truthy value is a memory operand
// Start from `falsy` and conditionally overwrite with the memory operand, so
// the memory operand is only ever used as the cmov source.
// NOTE(review): presumably this also keeps an immediate `falsy` (e.g. Qnil in
// test_cmov_mem) out of the cmov source position - confirm against the
// operand-splitting pass.
if let Opnd::Mem(_) = truthy {
// Skip the move when `out` already holds `falsy`
if out != falsy {
mov(cb, out.into(), falsy.into());
}

cmov_fn(cb, out.into(), truthy.into());
} else {
// Otherwise start from `truthy` and overwrite with `falsy` under the
// negated condition.
if out != truthy {
mov(cb, out.into(), truthy.into());
}

cmov_neg(cb, out.into(), falsy.into());
}
// NOTE(review): in this diff rendering the next line looks like the removed
// tail of the previous single-cmov implementation - confirm it is not part of
// the new function body.
cmov_fn(cb, out.into(), falsy.into());
}

//dbg!(&self.insns);
Expand Down Expand Up @@ -724,28 +744,28 @@ impl Assembler
Insn::Breakpoint => int3(cb),

Insn::CSelZ { truthy, falsy, out } => {
emit_csel(cb, *truthy, *falsy, *out, cmovnz);
emit_csel(cb, *truthy, *falsy, *out, cmovz, cmovnz);
},
Insn::CSelNZ { truthy, falsy, out } => {
emit_csel(cb, *truthy, *falsy, *out, cmovz);
emit_csel(cb, *truthy, *falsy, *out, cmovnz, cmovz);
},
Insn::CSelE { truthy, falsy, out } => {
emit_csel(cb, *truthy, *falsy, *out, cmovne);
emit_csel(cb, *truthy, *falsy, *out, cmove, cmovne);
},
Insn::CSelNE { truthy, falsy, out } => {
emit_csel(cb, *truthy, *falsy, *out, cmove);
emit_csel(cb, *truthy, *falsy, *out, cmovne, cmove);
},
Insn::CSelL { truthy, falsy, out } => {
emit_csel(cb, *truthy, *falsy, *out, cmovge);
emit_csel(cb, *truthy, *falsy, *out, cmovl, cmovge);
},
Insn::CSelLE { truthy, falsy, out } => {
emit_csel(cb, *truthy, *falsy, *out, cmovg);
emit_csel(cb, *truthy, *falsy, *out, cmovle, cmovg);
},
Insn::CSelG { truthy, falsy, out } => {
emit_csel(cb, *truthy, *falsy, *out, cmovle);
emit_csel(cb, *truthy, *falsy, *out, cmovg, cmovle);
},
Insn::CSelGE { truthy, falsy, out } => {
emit_csel(cb, *truthy, *falsy, *out, cmovl);
emit_csel(cb, *truthy, *falsy, *out, cmovge, cmovl);
}
Insn::LiveReg { .. } => (), // just a reg alloc signal, no code
Insn::PadInvalPatch => {
Expand Down Expand Up @@ -1177,4 +1197,26 @@ mod tests {
0x23: call rax
"});
}

// Checks the code generated for a conditional select whose truthy operand is
// a memory location and whose falsy operand is the Qnil constant.
#[test]
fn test_cmov_mem() {
let (mut asm, mut cb) = setup_asm();

// `top` is the store destination; `array_len_opnd` is the value compared against 1
let top = Opnd::mem(64, SP, 0);
let ary_opnd = SP;
let array_len_opnd = Opnd::mem(64, SP, 16);

// Select the memory operand when len > 1, otherwise Qnil
asm.cmp(array_len_opnd, 1.into());
let elem_opnd = asm.csel_g(Opnd::mem(64, ary_opnd, 0), Qnil.into());
asm.mov(top, elem_opnd);

// NOTE(review): presumably restricts allocation to a single register, which
// matches only rax being used in the expected output below - confirm.
asm.compile_with_num_regs(&mut cb, 1);

// Expected: Qnil (4) is loaded into the output first, then cmovg overwrites it
// from memory, and the result is stored back.
assert_disasm!(cb, "48837b1001b804000000480f4f03488903", {"
0x0: cmp qword ptr [rbx + 0x10], 1
0x5: mov eax, 4
0xa: cmovg rax, qword ptr [rbx]
0xe: mov qword ptr [rbx], rax
"});
}
}
92 changes: 66 additions & 26 deletions yjit/src/codegen.rs
Original file line number Diff line number Diff line change
Expand Up @@ -1467,7 +1467,7 @@ fn guard_object_is_not_ruby2_keyword_hash(
fn gen_expandarray(
jit: &mut JITState,
asm: &mut Assembler,
_ocb: &mut OutlinedCb,
ocb: &mut OutlinedCb,
) -> Option<CodegenStatus> {
// Both arguments are rb_num_t which is unsigned
let num = jit.get_arg(0).as_usize();
Expand Down Expand Up @@ -1500,49 +1500,89 @@ fn gen_expandarray(
return Some(KeepCompiling);
}

// Defer compilation so we can specialize on the runtime array on top of the stack
if !jit.at_current_insn() {
defer_compilation(jit, asm, ocb);
return Some(EndBlock);
}

let comptime_recv = jit.peek_at_stack(&asm.ctx, 0);

// If the comptime receiver is not an array, bail
if comptime_recv.class_of() != unsafe { rb_cArray } {
return None;
}

// Get the compile-time array length
let comptime_len = unsafe { rb_yjit_array_len(comptime_recv) as u32 };
//println!("comptime_len={}", comptime_len);

// Move the array from the stack and check that it's an array.
guard_object_is_array(
asm,
array_opnd,
array_opnd.into(),
Counter::expandarray_not_array,
);
let array_opnd = asm.stack_pop(1); // pop after using the type info

// If we don't actually want any values, then just return.
if num == 0 {
asm.stack_pop(1); // pop the array
return Some(KeepCompiling);
}

let array_opnd = asm.stack_opnd(0);
let array_reg = asm.load(array_opnd);
let array_len_opnd = get_array_len(asm, array_reg);

// Only handle the case where the number of values in the array is greater
// than or equal to the number of values requested.
asm.cmp(array_len_opnd, num.into());
asm.jl(Target::side_exit(Counter::expandarray_rhs_too_small));
// Guard on the comptime/expected array length
asm.comment(&format!("guard array length == {}", comptime_len));
asm.cmp(array_len_opnd, comptime_len.into());
jit_chain_guard(
JCC_JNE,
jit,
asm,
ocb,
OPT_AREF_MAX_CHAIN_DEPTH,
Counter::expandarray_chain_max_depth,
);

// Load the address of the embedded array into REG1.
// (struct RArray *)(obj)->as.ary
let array_reg = asm.load(array_opnd);
let ary_opnd = asm.lea(Opnd::mem(VALUE_BITS, array_reg, RUBY_OFFSET_RARRAY_AS_ARY));
let array_opnd = asm.stack_pop(1); // pop after using the type info

// Conditionally load the address of the heap array into REG1.
// (struct RArray *)(obj)->as.heap.ptr
let flags_opnd = Opnd::mem(VALUE_BITS, array_reg, RUBY_OFFSET_RBASIC_FLAGS);
asm.test(flags_opnd, Opnd::UImm(RARRAY_EMBED_FLAG as u64));
let heap_ptr_opnd = Opnd::mem(
usize::BITS as u8,
asm.load(array_opnd),
RUBY_OFFSET_RARRAY_AS_HEAP_PTR,
);
let ary_opnd = asm.csel_nz(ary_opnd, heap_ptr_opnd);
//println!("generating loads");

// Loop backward through the array and push each element onto the stack.
for i in (0..num).rev() {
let top = asm.stack_push(Type::Unknown);
let offset = i32::try_from(i * SIZEOF_VALUE).unwrap();
asm.mov(top, Opnd::mem(64, ary_opnd, offset));
// If the array has length 0, then we don't even need the array pointer
if comptime_len == 0 {
// No array access is needed: push one Qnil for each of the `num` requested values.
for _ in 0..num {
let top = asm.stack_push(Type::Nil);
asm.mov(top, Qnil.into());
}
} else {
let array_reg = asm.load(array_opnd);
let ary_opnd = asm.lea(Opnd::mem(VALUE_BITS, array_reg, RUBY_OFFSET_RARRAY_AS_ARY));

// Conditionally load the address of the heap array
// (struct RArray *)(obj)->as.heap.ptr
let flags_opnd = Opnd::mem(VALUE_BITS, array_reg, RUBY_OFFSET_RBASIC_FLAGS);
asm.test(flags_opnd, Opnd::UImm(RARRAY_EMBED_FLAG as u64));
let heap_ptr_opnd = Opnd::mem(
usize::BITS as u8,
asm.load(array_opnd),
RUBY_OFFSET_RARRAY_AS_HEAP_PTR,
);
let ary_opnd = asm.csel_nz(ary_opnd, heap_ptr_opnd);

// Loop backward through the array and push each element onto the stack.
for i in (0..num).rev() {
let top = asm.stack_push(Type::Unknown);
let offset = i32::try_from(i * SIZEOF_VALUE).unwrap();

// Missing elements are Qnil
asm.comment(&format!("load array[{}]", i));
let elem_opnd = if (i as u32) < comptime_len { Opnd::mem(64, ary_opnd, offset) } else { Qnil.into() };
asm.mov(top, elem_opnd);
}
}

Some(KeepCompiling)
Expand Down Expand Up @@ -7394,7 +7434,7 @@ fn gen_leave(
ocb: &mut OutlinedCb,
) -> Option<CodegenStatus> {
// Only the return value should be on the stack
assert_eq!(1, asm.ctx.get_stack_size());
assert_eq!(1, asm.ctx.get_stack_size(), "leave instruction expects stack size 1");

let ocb_asm = Assembler::new();

Expand Down
2 changes: 1 addition & 1 deletion yjit/src/stats.rs
Original file line number Diff line number Diff line change
Expand Up @@ -358,7 +358,7 @@ make_counters! {
expandarray_splat,
expandarray_postarg,
expandarray_not_array,
expandarray_rhs_too_small,
expandarray_chain_max_depth,

// getblockparam
gbp_wb_required,
Expand Down

0 comments on commit 10f619d

Please sign in to comment.