Skip to content

Commit ee9d86c

Browse files
authored
Ps/fix/log durations (#641)
* disable fake db
* fix log durations
* enable fake db again
* bump version
* up
1 parent a03ef06 commit ee9d86c

File tree

5 files changed

+55
-48
lines changed

5 files changed

+55
-48
lines changed

deploy/prod/common-values-iris-mpc.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
image: "ghcr.io/worldcoin/iris-mpc:v0.8.41"
1+
image: "ghcr.io/worldcoin/iris-mpc:v0.8.42"
22

33
environment: prod
44
replicaCount: 1

deploy/prod/smpcv2-0-prod/values-iris-mpc.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -90,7 +90,7 @@ env:
9090
value: "10000000"
9191

9292
- name: SMPC__FAKE_DB_SIZE
93-
value: "0"
93+
value: "6400000"
9494

9595
- name: SMPC__MAX_BATCH_SIZE
9696
value: "64"

deploy/prod/smpcv2-1-prod/values-iris-mpc.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -90,7 +90,7 @@ env:
9090
value: "10000000"
9191

9292
- name: SMPC__FAKE_DB_SIZE
93-
value: "0"
93+
value: "6400000"
9494

9595
- name: SMPC__MAX_BATCH_SIZE
9696
value: "64"

deploy/prod/smpcv2-2-prod/values-iris-mpc.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -90,7 +90,7 @@ env:
9090
value: "10000000"
9191

9292
- name: SMPC__FAKE_DB_SIZE
93-
value: "0"
93+
value: "6400000"
9494

9595
- name: SMPC__MAX_BATCH_SIZE
9696
value: "64"

iris-mpc-gpu/src/server/actor.rs

Lines changed: 51 additions & 44 deletions
Original file line number | Diff line number | Diff line change
@@ -1130,27 +1130,39 @@ impl ServerActor {
11301130
self.device_manager
11311131
.await_event(request_streams, &current_exchange_event);
11321132

1133-
record_stream_time!(&self.device_manager, batch_streams, events, "db_reduce", {
1134-
compact_device_sums.compute_dot_reducer_against_db(
1135-
&mut self.codes_engine,
1136-
&mut self.masks_engine,
1137-
code_db_slices,
1138-
mask_db_slices,
1139-
&dot_chunk_size,
1140-
offset,
1141-
request_streams,
1142-
);
1143-
});
1133+
record_stream_time!(
1134+
&self.device_manager,
1135+
request_streams,
1136+
events,
1137+
"db_reduce",
1138+
{
1139+
compact_device_sums.compute_dot_reducer_against_db(
1140+
&mut self.codes_engine,
1141+
&mut self.masks_engine,
1142+
code_db_slices,
1143+
mask_db_slices,
1144+
&dot_chunk_size,
1145+
offset,
1146+
request_streams,
1147+
);
1148+
}
1149+
);
11441150

11451151
self.device_manager
11461152
.record_event(request_streams, &next_dot_event);
11471153

1148-
record_stream_time!(&self.device_manager, batch_streams, events, "db_reshare", {
1149-
self.codes_engine
1150-
.reshare_results(&dot_chunk_size, request_streams);
1151-
self.masks_engine
1152-
.reshare_results(&dot_chunk_size, request_streams);
1153-
});
1154+
record_stream_time!(
1155+
&self.device_manager,
1156+
request_streams,
1157+
events,
1158+
"db_reshare",
1159+
{
1160+
self.codes_engine
1161+
.reshare_results(&dot_chunk_size, request_streams);
1162+
self.masks_engine
1163+
.reshare_results(&dot_chunk_size, request_streams);
1164+
}
1165+
);
11541166

11551167
// ---- END PHASE 1 ----
11561168

@@ -1170,9 +1182,10 @@ impl ServerActor {
11701182
);
11711183
self.phase2
11721184
.set_chunk_size(max_chunk_size * self.max_batch_size * ROTATIONS / 64);
1185+
11731186
record_stream_time!(
11741187
&self.device_manager,
1175-
batch_streams,
1188+
request_streams,
11761189
events,
11771190
"db_threshold",
11781191
{
@@ -1190,20 +1203,22 @@ impl ServerActor {
11901203
.record_event(request_streams, &next_exchange_event);
11911204

11921205
let res = self.phase2.take_result_buffer();
1193-
open(
1194-
&mut self.phase2,
1195-
&res,
1196-
&self.distance_comparator,
1197-
db_match_bitmap,
1198-
max_chunk_size * self.max_batch_size * ROTATIONS / 64,
1199-
&dot_chunk_size,
1200-
&chunk_size,
1201-
offset,
1202-
&self.current_db_sizes,
1203-
&ignore_device_results,
1204-
request_streams,
1205-
);
1206-
self.phase2.return_result_buffer(res);
1206+
record_stream_time!(&self.device_manager, request_streams, events, "db_open", {
1207+
open(
1208+
&mut self.phase2,
1209+
&res,
1210+
&self.distance_comparator,
1211+
db_match_bitmap,
1212+
max_chunk_size * self.max_batch_size * ROTATIONS / 64,
1213+
&dot_chunk_size,
1214+
&chunk_size,
1215+
offset,
1216+
&self.current_db_sizes,
1217+
&ignore_device_results,
1218+
request_streams,
1219+
);
1220+
self.phase2.return_result_buffer(res);
1221+
});
12071222
}
12081223
self.device_manager
12091224
.record_event(request_streams, &next_phase2_event);
@@ -1336,19 +1351,11 @@ impl ServerActor {
13361351

13371352
/// Internal helper function to log the timers of measured cuda streams.
13381353
fn log_timers(events: HashMap<&str, Vec<Vec<CUevent>>>) {
1339-
for (name, event_vecs) in &events {
1354+
for (name, event_vecs) in events {
1355+
assert!(event_vecs.len() % 2 == 0);
13401356
let duration: f32 = event_vecs
1341-
.chunks(2)
1342-
.map(|pair| {
1343-
let (start_events, end_events) = (&pair[0], &pair[1]);
1344-
let total_duration: f32 = start_events
1345-
.iter()
1346-
.zip(end_events.iter())
1347-
.map(|(start, end)| unsafe { elapsed(*start, *end) }.unwrap())
1348-
.sum();
1349-
1350-
total_duration / start_events.len() as f32
1351-
})
1357+
.iter()
1358+
.map(|pair| unsafe { elapsed(pair[0], pair[1]) }.unwrap())
13521359
.sum();
13531360

13541361
tracing::info!("Event {}: {:?} ms", name, duration);

0 commit comments

Comments
 (0)