Skip to content

Commit

Permalink
Remove some unnecessary `__syncthreads()` calls
Browse files (browse the repository at this point in the history)
  • Loading branch information
etseidl committed Nov 15, 2023
1 parent 2004caa commit 883a236
Show file tree
Hide file tree
Showing 3 changed files with 2 additions and 4 deletions.
2 changes: 1 addition & 1 deletion cpp/src/io/parquet/page_data.cu
Original file line number Diff line number Diff line change
Expand Up @@ -491,7 +491,7 @@ __global__ void __launch_bounds__(decode_block_size)
target_pos = min(s->nz_count, src_pos + decode_block_size - out_thread0);
if (out_thread0 > 32) { target_pos = min(target_pos, s->dict_pos); }
}
__syncthreads();

if (t < 32) {
// decode repetition and definition levels.
// - update validity vectors
Expand Down
2 changes: 0 additions & 2 deletions cpp/src/io/parquet/page_delta_decode.cu
Original file line number Diff line number Diff line change
Expand Up @@ -364,7 +364,6 @@ __global__ void __launch_bounds__(96)
} else { // warp2
target_pos = min(s->nz_count, src_pos + batch_size);
}
__syncthreads();

// warp0 will decode the rep/def levels, warp1 will unpack a mini-batch of deltas.
// warp2 waits one cycle for warps 0/1 to produce a batch, and then stuffs values
Expand Down Expand Up @@ -503,7 +502,6 @@ __global__ void __launch_bounds__(decode_block_size)
} else { // warp 3
target_pos = min(s->nz_count, src_pos + batch_size);
}
__syncthreads();

// warp0 will decode the rep/def levels, warp1 will unpack a mini-batch of prefixes, warp 2 will
// unpack a mini-batch of suffixes. warp3 waits one cycle for warps 0-2 to produce a batch, and
Expand Down
2 changes: 1 addition & 1 deletion cpp/src/io/parquet/page_string_decode.cu
Original file line number Diff line number Diff line change
Expand Up @@ -833,7 +833,7 @@ __global__ void __launch_bounds__(decode_block_size)
target_pos = min(s->nz_count, src_pos + decode_block_size - out_thread0);
if (out_thread0 > 32) { target_pos = min(target_pos, s->dict_pos); }
}
__syncthreads();

if (t < 32) {
// decode repetition and definition levels.
// - update validity vectors
Expand Down

0 comments on commit 883a236

Please sign in to comment.