Skip to content

Commit

Permalink
Merge pull request #3542 from anagainaru/warpx-bug-null-blocks
Browse files Browse the repository at this point in the history
Fix bug when writing null blocks
  • Loading branch information
anagainaru authored and vicentebolea committed Mar 20, 2023
2 parents 68bb627 + cc5dce6 commit e29b99d
Show file tree
Hide file tree
Showing 3 changed files with 110 additions and 2 deletions.
2 changes: 1 addition & 1 deletion source/adios2/engine/bp5/BP5Writer.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -1803,7 +1803,7 @@ void BP5Writer::PutCommon(VariableBase &variable, const void *values, bool sync)
variable.m_MemoryCount, sourceRowMajor, false, (char *)ptr,
variable.m_MemoryStart, variable.m_Count, sourceRowMajor, false,
ObjSize, helper::CoreDims(), helper::CoreDims(), helper::CoreDims(),
helper::CoreDims(), false /* safemode */, MemorySpace::Host);
helper::CoreDims(), false /* safemode */, variable.m_MemSpace);
}
else
{
Expand Down
8 changes: 7 additions & 1 deletion source/adios2/toolkit/format/bp/bp4/BP4Serializer.tcc
Original file line number Diff line number Diff line change
Expand Up @@ -118,7 +118,13 @@ inline void BP4Serializer::PutVariablePayload(
}
else
{
PutOperationPayloadInBuffer(variable, blockInfo);
const bool isZeroCount =
std::all_of(blockInfo.Count.begin(), blockInfo.Count.end(),
[](const size_t i) { return i == 0; });
if (!isZeroCount)
{
PutOperationPayloadInBuffer(variable, blockInfo);
}
}

/* Now we can update the varLength including payload size including the
Expand Down
102 changes: 102 additions & 0 deletions testing/adios2/engine/bp/TestBPWriteReadCuda.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -199,6 +199,107 @@ void CUDADetectMemSpace(const std::string mode)
}
}

void CUDAWriteReadMemorySelection()
{
const std::string fname("BPWRCUSel1D.bp");
const size_t Nx = 10;
const size_t NSteps = 2;
const size_t ghostCells = 1;
std::vector<float> r32s(Nx + 2 * ghostCells);
std::iota(r32s.begin(), r32s.end(), .0f);

adios2::ADIOS adios;
{
// cuda simulation buffer
float *gpuSimData = nullptr;
cudaMalloc(&gpuSimData, (Nx + 2 * ghostCells) * sizeof(float));
cudaMemcpy(gpuSimData, r32s.data(),
(Nx + 2 * ghostCells) * sizeof(float),
cudaMemcpyHostToDevice);

adios2::IO io = adios.DeclareIO("TestIO");
io.SetEngine("BP5");
if (!engineName.empty())
{
io.SetEngine(engineName);
}

const adios2::Dims shape{static_cast<size_t>(Nx)};
const adios2::Dims start{static_cast<size_t>(0)};
const adios2::Dims count{Nx};
auto var_r32 = io.DefineVariable<float>("r32", shape, start, count);

const adios2::Dims memoryStart = {ghostCells};
const adios2::Dims memoryCount = {Nx + 2 * ghostCells};
var_r32.SetMemorySelection({memoryStart, memoryCount});

adios2::Engine bpWriter = io.Open(fname, adios2::Mode::Write);

for (size_t step = 0; step < NSteps; ++step)
{
cuda_increment(Nx + 2 * ghostCells, 1, 0, gpuSimData, INCREMENT);

bpWriter.BeginStep();
var_r32.SetMemorySpace(adios2::MemorySpace::GPU);
bpWriter.Put(var_r32, gpuSimData);
bpWriter.EndStep();
}

bpWriter.Close();
}
{
// remove ghost cells from the input vector when checking correctness
r32s.erase(r32s.begin(), r32s.begin() + ghostCells);
r32s.erase(r32s.end() - ghostCells, r32s.end());

adios2::IO io = adios.DeclareIO("ReadIO");
io.SetEngine("BP5");
if (!engineName.empty())
{
io.SetEngine(engineName);
}

adios2::Engine bpReader = io.Open(fname, adios2::Mode::Read);

unsigned int t = 0;
for (; bpReader.BeginStep() == adios2::StepStatus::OK; ++t)
{
auto var_r32 = io.InquireVariable<float>("r32");
EXPECT_TRUE(var_r32);
ASSERT_EQ(var_r32.ShapeID(), adios2::ShapeID::GlobalArray);
ASSERT_EQ(var_r32.Shape()[0], Nx);

auto mmR32 = std::minmax_element(r32s.begin(), r32s.end());
EXPECT_EQ(var_r32.Min() - (t + 1) * INCREMENT, *mmR32.first);
EXPECT_EQ(var_r32.Max() - (t + 1) * INCREMENT, *mmR32.second);

std::vector<float> r32o(Nx);
float *gpuSimData;
cudaMalloc(&gpuSimData, Nx * sizeof(float));
var_r32.SetMemorySpace(adios2::MemorySpace::GPU);
bpReader.Get(var_r32, gpuSimData);
bpReader.EndStep();
cudaMemcpy(r32o.data(), gpuSimData, Nx * sizeof(float),
cudaMemcpyDeviceToHost);

// Remove INCREMENT from each element
std::transform(r32o.begin(), r32o.end(), r32o.begin(),
std::bind(std::minus<float>(), std::placeholders::_1,
(t + 1) * INCREMENT));
for (size_t i = 0; i < Nx; i++)
{
char msg[1 << 8] = {0};
snprintf(msg, sizeof(msg), "t=%d i=%zu r32o=%f r32s=%f", t, i,
r32o[i], r32s[i]);
ASSERT_LT(std::abs(r32o[i] - r32s[i]), EPSILON) << msg;
}
}
EXPECT_EQ(t, NSteps);

bpReader.Close();
}
}

void CUDAWriteReadMPI1D(const std::string mode)
{
const std::string fname("BPWRCU1D_" + mode + ".bp");
Expand Down Expand Up @@ -343,6 +444,7 @@ class BPWRCUDA : public ::testing::TestWithParam<std::string>
TEST_P(BPWRCUDA, ADIOS2BPWRCUDA1D) { CUDAWriteReadMPI1D(GetParam()); }
TEST_P(BPWRCUDA, ADIOS2BPCUDADetect) { CUDADetectMemSpace(GetParam()); }
TEST_P(BPWRCUDA, ADIOS2BPCUDAWrong) { CUDAWrongMemSpace(); }
TEST_P(BPWRCUDA, ADIOS2BPCUDAMemSel) { CUDAWriteReadMemorySelection(); }

INSTANTIATE_TEST_SUITE_P(CudaRW, BPWRCUDA,
::testing::Values("deferred", "sync"));
Expand Down

0 comments on commit e29b99d

Please sign in to comment.