author     Maxime Chevalier-Boisvert <maxime.chevalierboisvert@shopify.com>  2021-04-07 15:36:02 -0400
committer  Alan Wu <XrXr@users.noreply.github.com>  2021-10-20 18:19:33 -0400
commit     42af04efee38de4435a04ea0487fce483db10dee (patch)
tree       f8759b06af2d47d0f0274d211a5a2da352cbac15 /yjit_core.c
parent     54312d777cc22a52cfafcce0a0a20ed48375b82e (diff)
Add flag bits to avoid compiling stubs multiple times.
Fixes bug involving ractors and branch stubs.
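
For context, here is a minimal sketch of the flag-bit pattern this commit introduces, assuming a simplified two-target branch struct. Only the dst_addrs and dst_patched fields and the bit operations mirror the diff below; branch_t's layout and the stub_hit/invalidate_target helpers are hypothetical stand-ins for illustration.

#include <stdint.h>

// Simplified stand-in for the real branch struct; only dst_addrs and
// dst_patched mirror the diff below.
typedef struct {
    uint8_t *dst_addrs[2]; // jump targets; may initially point at stubs
    uint8_t dst_patched;   // bit i set => target i has already been patched
} branch_t;

// On a stub hit: if another ractor already patched this target, reuse
// the recorded address instead of compiling the block a second time.
static uint8_t *stub_hit(branch_t *branch, uint32_t target_idx, uint8_t *compiled)
{
    if (branch->dst_patched & (1 << target_idx)) {
        return branch->dst_addrs[target_idx];
    }
    branch->dst_addrs[target_idx] = compiled;
    branch->dst_patched |= (1 << target_idx); // no longer a stub
    return branch->dst_addrs[target_idx];
}

// On block invalidation: clear the bit so the target counts as a stub again.
static void invalidate_target(branch_t *branch, uint32_t target_idx)
{
    branch->dst_patched &= ~(1 << target_idx);
}
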
Diffstat (limited to 'yjit_core.c')
-rw-r--r--  yjit_core.c  131
1 file changed, 73 insertions, 58 deletions
diff --git a/yjit_core.c b/yjit_core.c
index 0a7e2c6442..2055d0a663 100644
--- a/yjit_core.c
+++ b/yjit_core.c
@@ -499,73 +499,85 @@ branch_stub_hit(const uint32_t branch_idx, const uint32_t target_idx, rb_executi
blockid_t target = branch->targets[target_idx];
const ctx_t* target_ctx = &branch->target_ctxs[target_idx];
- // :stub-sp-flush:
- // Generated code does stack operations without modifying cfp->sp, while the
- // cfp->sp tells the GC what values on the stack to root. Generated code
- // generally takes care of updating cfp->sp when it calls runtime routines that
- // could trigger GC, but for the case of branch stubs, it's inconvenient. So
- // we do it here.
- VALUE *const original_interp_sp = ec->cfp->sp;
- ec->cfp->sp += target_ctx->sp_offset;
-
- //fprintf(stderr, "\nstub hit, branch idx: %d, target idx: %d\n", branch_idx, target_idx);
- //fprintf(stderr, "blockid.iseq=%p, blockid.idx=%d\n", target.iseq, target.idx);
- //fprintf(stderr, "chain_depth=%d\n", target_ctx->chain_depth);
-
- // Update the PC in the current CFP, because it
- // may be out of sync in JITted code
- ec->cfp->pc = iseq_pc_at_idx(target.iseq, target.idx);
-
- // Try to find an existing compiled version of this block
- block_t* p_block = find_block_version(target, target_ctx);
-
- // If this block hasn't yet been compiled
- if (!p_block) {
- // Limit the number of block versions
- ctx_t generic_ctx = DEFAULT_CTX;
- generic_ctx.stack_size = target_ctx->stack_size;
- generic_ctx.sp_offset = target_ctx->sp_offset;
- if (target_ctx->chain_depth == 0) { // guard chains implement limits individually
- if (get_num_versions(target) >= MAX_VERSIONS - 1) {
- //fprintf(stderr, "version limit hit in branch_stub_hit\n");
- target_ctx = &generic_ctx;
+ // If this branch has already been patched, return the dst address
+ // Note: ractors can cause the same stub to be hit multiple times
+ if (branch->dst_patched & (1 << target_idx)) {
+ dst_addr = branch->dst_addrs[target_idx];
+ }
+ else
+ {
+ //fprintf(stderr, "\nstub hit, branch idx: %d, target idx: %d\n", branch_idx, target_idx);
+ //fprintf(stderr, "blockid.iseq=%p, blockid.idx=%d\n", target.iseq, target.idx);
+ //fprintf(stderr, "chain_depth=%d\n", target_ctx->chain_depth);
+
+ // :stub-sp-flush:
+ // Generated code does stack operations without modifying cfp->sp, while the
+ // cfp->sp tells the GC what values on the stack to root. Generated code
+ // generally takes care of updating cfp->sp when it calls runtime routines that
+ // could trigger GC, but for the case of branch stubs, it's inconvenient. So
+ // we do it here.
+ VALUE *const original_interp_sp = ec->cfp->sp;
+ ec->cfp->sp += target_ctx->sp_offset;
+
+ // Update the PC in the current CFP, because it
+ // may be out of sync in JITted code
+ ec->cfp->pc = iseq_pc_at_idx(target.iseq, target.idx);
+
+ // Try to find an existing compiled version of this block
+ block_t* p_block = find_block_version(target, target_ctx);
+
+ // If this block hasn't yet been compiled
+ if (!p_block) {
+ // Limit the number of block versions
+ ctx_t generic_ctx = DEFAULT_CTX;
+ generic_ctx.stack_size = target_ctx->stack_size;
+ generic_ctx.sp_offset = target_ctx->sp_offset;
+ if (target_ctx->chain_depth == 0) { // guard chains implement limits individually
+ if (get_num_versions(target) >= MAX_VERSIONS - 1) {
+ //fprintf(stderr, "version limit hit in branch_stub_hit\n");
+ target_ctx = &generic_ctx;
+ }
}
- }
- // If the new block can be generated right after the branch (at cb->write_pos)
- if (cb->write_pos == branch->end_pos) {
- // Change the branch shape to indicate the target block will be placed next
- branch->shape = (uint8_t)target_idx;
+ // If the new block can be generated right after the branch (at cb->write_pos)
+ if (cb->write_pos == branch->end_pos) {
+ // Change the branch shape to indicate the target block will be placed next
+ branch->shape = (uint8_t)target_idx;
+
+ // Rewrite the branch with the new, potentially more compact shape
+ cb_set_pos(cb, branch->start_pos);
+ branch->gen_fn(cb, branch->dst_addrs[0], branch->dst_addrs[1], branch->shape);
+ RUBY_ASSERT(cb->write_pos <= branch->end_pos && "can't enlarge branches");
+ branch->end_pos = cb->write_pos;
+ }
- // Rewrite the branch with the new, potentially more compact shape
- cb_set_pos(cb, branch->start_pos);
- branch->gen_fn(cb, branch->dst_addrs[0], branch->dst_addrs[1], branch->shape);
- RUBY_ASSERT(cb->write_pos <= branch->end_pos && "can't enlarge branches");
- branch->end_pos = cb->write_pos;
+ p_block = gen_block_version(target, target_ctx, ec);
+ RUBY_ASSERT(p_block);
+ RUBY_ASSERT(!(branch->shape == (uint8_t)target_idx && p_block->start_pos != branch->end_pos));
}
- p_block = gen_block_version(target, target_ctx, ec);
- RUBY_ASSERT(p_block);
- RUBY_ASSERT(branch->shape != (uint8_t)target_idx || p_block->start_pos == branch->end_pos);
- }
+ // Add this branch to the list of incoming branches for the target
+ rb_darray_append(&p_block->incoming, branch_idx);
- // Add this branch to the list of incoming branches for the target
- rb_darray_append(&p_block->incoming, branch_idx);
+ // Update the branch target address
+ dst_addr = cb_get_ptr(cb, p_block->start_pos);
+ branch->dst_addrs[target_idx] = dst_addr;
- // Update the branch target address
- dst_addr = cb_get_ptr(cb, p_block->start_pos);
- branch->dst_addrs[target_idx] = dst_addr;
+ // Rewrite the branch with the new jump target address
+ RUBY_ASSERT(branch->dst_addrs[0] != NULL);
+ uint32_t cur_pos = cb->write_pos;
+ cb_set_pos(cb, branch->start_pos);
+ branch->gen_fn(cb, branch->dst_addrs[0], branch->dst_addrs[1], branch->shape);
+ RUBY_ASSERT(cb->write_pos == branch->end_pos && "branch can't change size");
+ cb_set_pos(cb, cur_pos);
+
+ // Mark this branch target as patched (no longer a stub)
+ branch->dst_patched |= (1 << target_idx);
- // Rewrite the branch with the new jump target address
- RUBY_ASSERT(branch->dst_addrs[0] != NULL);
- uint32_t cur_pos = cb->write_pos;
- cb_set_pos(cb, branch->start_pos);
- branch->gen_fn(cb, branch->dst_addrs[0], branch->dst_addrs[1], branch->shape);
- RUBY_ASSERT(cb->write_pos == branch->end_pos && "branch can't change size");
- cb_set_pos(cb, cur_pos);
+ // Restore interpreter sp, since the code hitting the stub expects the original.
+ ec->cfp->sp = original_interp_sp;
+ }
- // Restore interpreter sp, since the code hitting the stub expects the original.
- ec->cfp->sp = original_interp_sp;
RB_VM_LOCK_LEAVE();
// Return a pointer to the compiled block version
@@ -867,6 +879,9 @@ invalidate_block_version(block_t* block)
target_idx
);
+ // Mark this target as being a stub
+ branch->dst_patched &= ~(1 << target_idx);
+
// Check if the invalidated block immediately follows
bool target_next = block->start_pos == branch->end_pos;
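
The :stub-sp-flush: comment in the first hunk describes a save/flush/restore discipline around cfp->sp. Below is a minimal sketch of that pattern under simplified assumptions: VALUE, cfp_t and gc_capable_work are stand-ins for illustration, not the real Ruby internals.

#include <stdint.h>

typedef uintptr_t VALUE; // stand-in for Ruby's VALUE

// Stripped-down control frame; only the sp field matters for this sketch.
typedef struct {
    VALUE *sp;
} cfp_t;

// Hypothetical work that may allocate and therefore trigger GC,
// e.g. compiling a block version.
static void gc_capable_work(void) { /* ... */ }

static void with_flushed_sp(cfp_t *cfp, int32_t sp_offset)
{
    // Flush: advance cfp->sp over the values JITted code has pushed,
    // so the GC roots them while we run code that may allocate.
    VALUE *const original_interp_sp = cfp->sp;
    cfp->sp += sp_offset;

    gc_capable_work();

    // Restore: the code that hit the stub expects the original sp.
    cfp->sp = original_interp_sp;
}
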