Skip to content

Commit

Permalink
wip signal < ok through stage 3
Browse files Browse the repository at this point in the history
  • Loading branch information
bHimes committed Jan 7, 2025
1 parent 59bacd2 commit c9d4dba
Show file tree
Hide file tree
Showing 2 changed files with 6 additions and 3 deletions.
7 changes: 5 additions & 2 deletions src/fastfft/FastFFT.cu
Original file line number Diff line number Diff line change
Expand Up @@ -1453,7 +1453,7 @@ __global__ void block_fft_kernel_C2C_INCREASE(const ComplexData_t* __restrict__
complex_compute_t twiddle;

// No need to __syncthreads as each thread only accesses its own shared mem anyway
io<FFT>::load_shared(&input_values[Return1DFFTAddress(size_of<FFT>::value)],
io<FFT>::load_shared(&input_values[Return1DFFTAddress(mem_offsets.physical_x_input)],
shared_input_complex,
thread_data,
twiddle_factor_args,
Expand All @@ -1480,7 +1480,9 @@ __global__ void block_fft_kernel_C2C_INCREASE(const ComplexData_t* __restrict__
// Now that the memory output can be coalesced, send it to global
// FIXME: is this actually coalesced?
for ( int sub_fft = 0; sub_fft < Q; sub_fft++ ) {
io<FFT>::store_coalesced(shared_output, &output_values[Return1DFFTAddress(size_of<FFT>::value * Q)], sub_fft * mem_offsets.shared_input);
io<FFT>::store_coalesced(shared_output,
&output_values[Return1DFFTAddress(mem_offsets.physical_x_output)],
sub_fft * mem_offsets.shared_input); // FIXME: if we shrink shared_input == SignalLength then this should be size_of<FFT>::value
}
}

Expand Down Expand Up @@ -3080,6 +3082,7 @@ LaunchParams FourierTransformer<ComputeBaseType, PositionSpaceType, OtherImageTy
L.mem_offsets.physical_x_output = fwd_dims_out.w;
}
}

else if ( IsC2RType(kernel_type) ) {
// This is always the last op, so if there is a size change, it will have happened once on C2C, reducing the number of blocks
if constexpr ( Rank == 2 ) {
Expand Down
2 changes: 1 addition & 1 deletion src/tests/debug_with_index_values.cu
Original file line number Diff line number Diff line change
Expand Up @@ -189,7 +189,7 @@ int main(int argc, char** argv) {
std::cout << "This doesn't make sense as the synchronizations are invalidating.\n";
// exit(1);
#endif
std::vector<int> size = {64, 128};
std::vector<int> size = {60, 128};

SCT size_change_type;
// Set the SCT to no_change, increase, or decrease
Expand Down

0 comments on commit c9d4dba

Please sign in to comment.