Skip to content

Commit

Permalink
NBS-179: support using multiple devices from the same rdma endpoint
Browse files Browse the repository at this point in the history
This commit fixes the problem with connecting to multiple devices on the same
host using rdma compound storage. Before the fix same storage was reused to
access all devices which resulted in data corruption
  • Loading branch information
budevg committed Jan 23, 2024
1 parent 3712104 commit 2b8e476
Show file tree
Hide file tree
Showing 3 changed files with 127 additions and 1 deletion.
5 changes: 4 additions & 1 deletion cloud/blockstore/libs/service_local/storage_rdma.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -471,12 +471,14 @@ class TRdmaStorageProvider final
private:
struct TEndpoint
{
TString Uuid;
TString Host;
ui32 Port;

bool operator<(const TEndpoint& other) const
{
return std::tie(Host, Port) < std::tie(other.Host, other.Port);
return std::tie(Uuid, Host, Port) <
std::tie(other.Uuid, other.Host, other.Port);
}
};

Expand Down Expand Up @@ -526,6 +528,7 @@ class TRdmaStorageProvider final

for (const auto& device: volume.GetDevices()) {
auto ep = TEndpoint{
device.GetDeviceUUID(),
device.GetRdmaEndpoint().GetHost(),
device.GetRdmaEndpoint().GetPort()};

Expand Down
121 changes: 121 additions & 0 deletions cloud/blockstore/libs/service_local/storage_rdma_ut.cpp
Original file line number Diff line number Diff line change
@@ -0,0 +1,121 @@
#include "storage_rdma.h"

#include <cloud/blockstore/libs/diagnostics/server_stats.h>
#include <cloud/blockstore/libs/rdma/iface/client.h>
#include <cloud/blockstore/libs/service/storage_provider.h>

#include <library/cpp/testing/common/env.h>
#include <library/cpp/testing/unittest/registar.h>

namespace NCloud::NBlockStore::NStorage {

using namespace NThreading;

namespace {

////////////////////////////////////////////////////////////////////////////////

#define UNIT_ASSERT_SUCCEEDED(e) \
UNIT_ASSERT_C(SUCCEEDED(e.GetCode()), e.GetMessage())

class TDummyClientEndpoint: public NRdma::IClientEndpoint
{
TResultOrError<NRdma::TClientRequestPtr> AllocateRequest(
NRdma::IClientHandlerPtr handler,
std::unique_ptr<NRdma::TNullContext> context,
size_t requestBytes,
size_t responseBytes) override
{
Y_UNUSED(handler);
Y_UNUSED(context);
Y_UNUSED(requestBytes);
Y_UNUSED(responseBytes);

return MakeError(E_NOT_IMPLEMENTED);
}

void SendRequest(NRdma::TClientRequestPtr req, TCallContextPtr callContext)
override
{
Y_UNUSED(req);
Y_UNUSED(callContext);
}
};

class TRdmaClientHelper: public NRdma::IClient
{
public:
TVector<std::tuple<TString, ui32>> StartedEndpoints;

public:
TFuture<NRdma::IClientEndpointPtr> StartEndpoint(
TString host,
ui32 port) noexcept override
{
StartedEndpoints.emplace_back(host, port);

return MakeFuture<NRdma::IClientEndpointPtr>(
std::make_shared<TDummyClientEndpoint>());
}

void Start() override
{}

void Stop() override
{}
};

} // namespace

////////////////////////////////////////////////////////////////////////////////

Y_UNIT_TEST_SUITE(TRdmaStorageTest)
{
Y_UNIT_TEST(ShouldCreateEndpointForEachDeviceOnSameHost)
{
auto client = std::make_shared<TRdmaClientHelper>();
auto provider = CreateRdmaStorageProvider(
NCloud::NBlockStore::CreateServerStatsStub(),
client,
ERdmaTaskQueueOpt::DontUse);

NProto::TVolume volume;
volume.SetDiskId("disk0");
volume.SetBlockSize(4096);
volume.SetBlocksCount(1000000);
volume.SetStorageMediaKind(NProto::STORAGE_MEDIA_SSD_NONREPLICATED);

TString hostName = "host1";
ui32 hostPort = 1111;
for (auto i = 0; i < 2; i++) {
auto* device = volume.AddDevices();
device->SetDeviceName("dev" + std::to_string(i));
device->SetDeviceUUID("uuid" + std::to_string(i));
device->SetAgentId(hostName);
device->SetBlockCount(4'000);
device->SetPhysicalOffset(32'000);
auto* rdma = device->MutableRdmaEndpoint();
rdma->SetHost(hostName);
rdma->SetPort(hostPort);
}

auto future = provider->CreateStorage(
volume,
"",
NProto::VOLUME_ACCESS_READ_WRITE);
auto storage = future.GetValue();

UNIT_ASSERT_VALUES_EQUAL(2, client->StartedEndpoints.size());

for (auto i = 0; i < 2; i++) {
UNIT_ASSERT_VALUES_EQUAL(
hostName,
std::get<0>(client->StartedEndpoints[i]));
UNIT_ASSERT_VALUES_EQUAL(
hostPort,
std::get<1>(client->StartedEndpoints[i]));
}
}
}

} // namespace NCloud::NBlockStore::NStorage
2 changes: 2 additions & 0 deletions cloud/blockstore/libs/service_local/ut/ya.make
Original file line number Diff line number Diff line change
Expand Up @@ -7,12 +7,14 @@ TIMEOUT(180)
SRCS(
compound_storage_ut.cpp
storage_aio_ut.cpp
storage_rdma_ut.cpp
storage_null_ut.cpp
storage_spdk_ut.cpp
)

PEERDIR(
cloud/blockstore/libs/server
cloud/blockstore/libs/rdma/iface

cloud/storage/core/libs/aio
)
Expand Down

0 comments on commit 2b8e476

Please sign in to comment.