Skip to content

Commit 095c956

Browse files
authored
Merge pull request #24171 from mlugg/atomic-order-derp
compiler: fix races in link queue
2 parents 180e844 + 55b7187 commit 095c956

File tree

3 files changed

+30
-34
lines changed

3 files changed

+30
-34
lines changed

src/Zcu/PerThread.zig

Lines changed: 18 additions & 23 deletions
Original file line number | Diff line number | Diff line change
@@ -4373,34 +4373,29 @@ pub fn addDependency(pt: Zcu.PerThread, unit: AnalUnit, dependee: InternPool.Dep
43734373
/// codegen thread, depending on whether the backend supports `Zcu.Feature.separate_thread`.
43744374
pub fn runCodegen(pt: Zcu.PerThread, func_index: InternPool.Index, air: *Air, out: *@import("../link.zig").ZcuTask.LinkFunc.SharedMir) void {
43754375
const zcu = pt.zcu;
4376-
if (runCodegenInner(pt, func_index, air)) |mir| {
4376+
const success: bool = if (runCodegenInner(pt, func_index, air)) |mir| success: {
43774377
out.value = mir;
4378-
out.status.store(.ready, .release);
4379-
} else |err| switch (err) {
4380-
error.OutOfMemory => {
4381-
zcu.comp.setAllocFailure();
4382-
out.status.store(.failed, .monotonic);
4383-
},
4384-
error.CodegenFail => {
4385-
zcu.assertCodegenFailed(zcu.funcInfo(func_index).owner_nav);
4386-
out.status.store(.failed, .monotonic);
4387-
},
4388-
error.NoLinkFile => {
4389-
assert(zcu.comp.bin_file == null);
4390-
out.status.store(.failed, .monotonic);
4391-
},
4392-
error.BackendDoesNotProduceMir => {
4393-
const backend = target_util.zigBackend(zcu.root_mod.resolved_target.result, zcu.comp.config.use_llvm);
4394-
switch (backend) {
4378+
break :success true;
4379+
} else |err| success: {
4380+
switch (err) {
4381+
error.OutOfMemory => zcu.comp.setAllocFailure(),
4382+
error.CodegenFail => zcu.assertCodegenFailed(zcu.funcInfo(func_index).owner_nav),
4383+
error.NoLinkFile => assert(zcu.comp.bin_file == null),
4384+
error.BackendDoesNotProduceMir => switch (target_util.zigBackend(
4385+
zcu.root_mod.resolved_target.result,
4386+
zcu.comp.config.use_llvm,
4387+
)) {
43954388
else => unreachable, // assertion failure
43964389
.stage2_spirv64,
43974390
.stage2_llvm,
43984391
=> {},
4399-
}
4400-
out.status.store(.failed, .monotonic);
4401-
},
4402-
}
4403-
zcu.comp.link_task_queue.mirReady(zcu.comp, out);
4392+
},
4393+
}
4394+
break :success false;
4395+
};
4396+
// release `out.value` with this store; synchronizes with acquire loads in `link`
4397+
out.status.store(if (success) .ready else .failed, .release);
4398+
zcu.comp.link_task_queue.mirReady(zcu.comp, func_index, out);
44044399
if (zcu.pending_codegen_jobs.rmw(.Sub, 1, .monotonic) == 1) {
44054400
// Decremented to 0, so all done.
44064401
zcu.codegen_prog_node.end();

src/link.zig

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1249,7 +1249,7 @@ pub const ZcuTask = union(enum) {
12491249
.update_line_number,
12501250
=> {},
12511251
.link_func => |link_func| {
1252-
switch (link_func.mir.status.load(.monotonic)) {
1252+
switch (link_func.mir.status.load(.acquire)) {
12531253
.pending => unreachable, // cannot deinit until MIR done
12541254
.failed => {}, // MIR not populated so doesn't need freeing
12551255
.ready => link_func.mir.value.deinit(zcu),
@@ -1453,7 +1453,7 @@ pub fn doZcuTask(comp: *Compilation, tid: usize, task: ZcuTask) void {
14531453
const fqn_slice = ip.getNav(nav).fqn.toSlice(ip);
14541454
const nav_prog_node = comp.link_prog_node.start(fqn_slice, 0);
14551455
defer nav_prog_node.end();
1456-
switch (func.mir.status.load(.monotonic)) {
1456+
switch (func.mir.status.load(.acquire)) {
14571457
.pending => unreachable,
14581458
.ready => {},
14591459
.failed => return,

src/link/Queue.zig

Lines changed: 10 additions & 9 deletions
Original file line number | Diff line number | Diff line change
@@ -64,7 +64,7 @@ state: union(enum) {
6464
finished,
6565
/// The link thread is not running or queued, because it is waiting for this MIR to be populated.
6666
/// Once codegen completes, it must call `mirReady` which will restart the link thread.
67-
wait_for_mir: *ZcuTask.LinkFunc.SharedMir,
67+
wait_for_mir: InternPool.Index,
6868
},
6969

7070
/// In the worst observed case, MIR is around 50 times as large as AIR. More typically, the ratio is
@@ -113,20 +113,20 @@ pub fn start(q: *Queue, comp: *Compilation) void {
113113

114114
/// Called by codegen workers after they have populated a `ZcuTask.LinkFunc.SharedMir`. If the link
115115
/// thread was waiting for this MIR, it can resume.
116-
pub fn mirReady(q: *Queue, comp: *Compilation, mir: *ZcuTask.LinkFunc.SharedMir) void {
116+
pub fn mirReady(q: *Queue, comp: *Compilation, func_index: InternPool.Index, mir: *ZcuTask.LinkFunc.SharedMir) void {
117117
// We would like to assert that `mir` is not pending, but that would race with a worker thread
118118
// potentially freeing it.
119119
{
120120
q.mutex.lock();
121121
defer q.mutex.unlock();
122122
switch (q.state) {
123123
.finished, .running => return,
124-
.wait_for_mir => |wait_for| if (wait_for != mir) return,
124+
.wait_for_mir => |wait_for| if (wait_for != func_index) return,
125125
}
126126
// We were waiting for `mir`, so we will restart the linker thread.
127127
q.state = .running;
128128
}
129-
assert(mir.status.load(.monotonic) != .pending);
129+
assert(mir.status.load(.acquire) != .pending);
130130
comp.thread_pool.spawnWgId(&comp.link_task_wait_group, flushTaskQueue, .{ q, comp });
131131
}
132132

@@ -170,8 +170,8 @@ pub fn enqueueZcu(q: *Queue, comp: *Compilation, task: ZcuTask) Allocator.Error!
170170
.finished => if (q.pending_prelink_tasks != 0) return,
171171
}
172172
// Restart the linker thread, unless it would immediately be blocked
173-
if (task == .link_func and task.link_func.mir.status.load(.monotonic) == .pending) {
174-
q.state = .{ .wait_for_mir = task.link_func.mir };
173+
if (task == .link_func and task.link_func.mir.status.load(.acquire) == .pending) {
174+
q.state = .{ .wait_for_mir = task.link_func.func };
175175
return;
176176
}
177177
q.state = .running;
@@ -243,12 +243,12 @@ fn flushTaskQueue(tid: usize, q: *Queue, comp: *Compilation) void {
243243
if (task != .link_func) break :pending;
244244
const status_ptr = &task.link_func.mir.status;
245245
// First check without the mutex to optimize for the common case where MIR is ready.
246-
if (status_ptr.load(.monotonic) != .pending) break :pending;
246+
if (status_ptr.load(.acquire) != .pending) break :pending;
247247
q.mutex.lock();
248248
defer q.mutex.unlock();
249-
if (status_ptr.load(.monotonic) != .pending) break :pending;
249+
if (status_ptr.load(.acquire) != .pending) break :pending;
250250
// We will stop for now, and get restarted once this MIR is ready.
251-
q.state = .{ .wait_for_mir = task.link_func.mir };
251+
q.state = .{ .wait_for_mir = task.link_func.func };
252252
q.flush_safety.unlock();
253253
return;
254254
}
@@ -273,6 +273,7 @@ const std = @import("std");
273273
const assert = std.debug.assert;
274274
const Allocator = std.mem.Allocator;
275275
const Compilation = @import("../Compilation.zig");
276+
const InternPool = @import("../InternPool.zig");
276277
const link = @import("../link.zig");
277278
const PrelinkTask = link.PrelinkTask;
278279
const ZcuTask = link.ZcuTask;

0 commit comments

Comments
 (0)