Skip to content

Commit

Permalink
DAOS-16838 control: Fix dmg storage query usage with emulated NVMe (#…
Browse files Browse the repository at this point in the history
…15545)

Fix a regression which prevents dmg storage query usage from
enumerating devices backed with emulated (AIO file or kdev) NVMe.

Signed-off-by: Tom Nabarro <[email protected]>
  • Loading branch information
tanabarr committed Jan 8, 2025
1 parent f4e4613 commit 0a2df2a
Show file tree
Hide file tree
Showing 3 changed files with 101 additions and 7 deletions.
19 changes: 16 additions & 3 deletions src/control/server/instance_storage_rpc.go
Original file line number Diff line number Diff line change
@@ -1,5 +1,6 @@
//
// (C) Copyright 2020-2024 Intel Corporation.
// (C) Copyright 2025 Hewlett Packard Enterprise Development LP
//
// SPDX-License-Identifier: BSD-2-Clause-Patent
//
Expand Down Expand Up @@ -332,6 +333,7 @@ func scanEngineBdevsOverDrpc(ctx context.Context, engine Engine, pbReq *ctlpb.Sc
if scanSmdResp == nil {
return nil, errors.New("nil smd scan resp")
}
engine.Tracef("smd scan devices: %+v", scanSmdResp.Devices)

// Re-link SMD devices inside NVMe controller structures and populate scan response.

Expand All @@ -340,12 +342,20 @@ func scanEngineBdevsOverDrpc(ctx context.Context, engine Engine, pbReq *ctlpb.Sc
}
seenCtrlrs := make(map[string]*ctlpb.NvmeController)

for _, sd := range scanSmdResp.Devices {
for i, sd := range scanSmdResp.Devices {
if sd.Ctrlr == nil {
return nil, errors.Errorf("smd %q has no ctrlr ref", sd.Uuid)
}

addr := sd.Ctrlr.PciAddr
if addr == "" {
// Mock identifier for emulated NVMe mode where devices have no PCI-address.
// Allows for 256 unique identifiers per-host and formatted string template
// ensures no collisions with real device addresses. Note that this mock
// identifier address is not used outside of this loop and is only used for
// the purpose of mapping SMD records to NVMe (emulated) device details.
addr = fmt.Sprintf("FFFF:00:%X.F", i)
}

if _, exists := seenCtrlrs[addr]; !exists {
c := new(ctlpb.NvmeController)
Expand Down Expand Up @@ -460,6 +470,7 @@ func bdevScanEngineAssigned(ctx context.Context, engine Engine, req *ctlpb.ScanN
return scanEngineBdevsOverDrpc(ctx, engine, req)
}

// Accommodate for VMD backing devices and emulated NVMe (AIO).
func getEffCtrlrCount(ctrlrs []*ctlpb.NvmeController) (int, error) {
pas := hardware.MustNewPCIAddressSet()
for _, c := range ctrlrs {
Expand All @@ -471,11 +482,13 @@ func getEffCtrlrCount(ctrlrs []*ctlpb.NvmeController) (int, error) {
if npas, err := pas.BackingToVMDAddresses(); err != nil {
return 0, err
} else {
pas = npas
return npas.Len(), nil
}
}

return pas.Len(), nil
// Return inputted number of controllers rather than number of parsed addresses to cater for
// the case of emulated NVMe where there will be no valid PCI address.
return len(ctrlrs), nil
}

// bdevScanEngine calls either in to the private engine storage provider to scan bdevs if engine process
Expand Down
84 changes: 82 additions & 2 deletions src/control/server/instance_storage_rpc_test.go
Original file line number Diff line number Diff line change
@@ -1,5 +1,6 @@
//
// (C) Copyright 2023-2024 Intel Corporation.
// (C) Copyright 2025 Hewlett Packard Enterprise Development LP
//
// SPDX-License-Identifier: BSD-2-Clause-Patent
//
Expand Down Expand Up @@ -44,7 +45,7 @@ func (mp *mockPCIeLinkStatsProvider) PCIeCapsFromConfig(cfgBytes []byte, dev *ha
return nil
}

func TestIOEngineInstance_populateCtrlrHealth(t *testing.T) {
func TestServer_populateCtrlrHealth(t *testing.T) {
healthWithLinkStats := func(maxSpd, spd float32, maxWdt, wdt uint32) *ctlpb.BioHealthResp {
bhr := proto.MockNvmeHealth()
bhr.LinkMaxSpeed = maxSpd
Expand Down Expand Up @@ -459,7 +460,7 @@ func TestIOEngineInstance_populateCtrlrHealth(t *testing.T) {
}
}

func TestIOEngineInstance_bdevScanEngine(t *testing.T) {
func TestServer_bdevScanEngine(t *testing.T) {
c := storage.MockNvmeController(2)
withState := func(ctrlr *ctlpb.NvmeController, state ctlpb.NvmeDevState) *ctlpb.NvmeController {
ctrlr.DevState = state
Expand Down Expand Up @@ -793,6 +794,85 @@ func TestIOEngineInstance_bdevScanEngine(t *testing.T) {
// Prove link stat provider gets called when LinkStats flag set.
expErr: errors.New("link stats provider fail"),
},
"scan over drpc; aio file emulated nvme; no pci addresses": {
smdRes: &ctlpb.SmdDevResp{
Devices: []*ctlpb.SmdDevice{
{
Uuid: "b80b4653-af58-47b3-aa3b-8ad12965f440",
TgtIds: []int32{
1024, 1024, 0, 0, 0, 4, 4, 4, 8, 8, 8, 12,
12, 12,
},
RoleBits: 7,
Ctrlr: &ctlpb.NvmeController{
DevState: ctlpb.NvmeDevState_NORMAL,
},
},
{
Uuid: "3c7a8e22-38c0-4e6f-8776-d703d049ae6f",
TgtIds: []int32{
1024, 1024, 1, 1, 1, 5, 5, 5, 9, 9, 9, 13,
13, 13,
},
RoleBits: 7,
Ctrlr: &ctlpb.NvmeController{
DevState: ctlpb.NvmeDevState_NORMAL,
},
},
{
Uuid: "40ba7b18-3a0e-4d68-9e8f-c4fc556eb506",
TgtIds: []int32{
1024, 1024, 2, 2, 2, 6, 6, 6, 10, 10, 10,
14, 14, 14,
},
RoleBits: 7,
Ctrlr: &ctlpb.NvmeController{
DevState: ctlpb.NvmeDevState_NORMAL,
},
},
{
Uuid: "d78c849f-fd9e-4a20-9746-b0335e3618da",
TgtIds: []int32{
1024, 1024, 3, 3, 3, 7, 7, 7, 11, 11, 11,
15, 15, 15,
},
RoleBits: 7,
Ctrlr: &ctlpb.NvmeController{
DevState: ctlpb.NvmeDevState_NORMAL,
},
},
},
},
expResp: &ctlpb.ScanNvmeResp{
Ctrlrs: proto.NvmeControllers{
&ctlpb.NvmeController{
DevState: ctlpb.NvmeDevState_NORMAL,
SmdDevices: []*ctlpb.SmdDevice{
{RoleBits: 7},
},
},
&ctlpb.NvmeController{
DevState: ctlpb.NvmeDevState_NORMAL,
SmdDevices: []*ctlpb.SmdDevice{
{RoleBits: 7},
},
},
&ctlpb.NvmeController{
DevState: ctlpb.NvmeDevState_NORMAL,
SmdDevices: []*ctlpb.SmdDevice{
{RoleBits: 7},
},
},
&ctlpb.NvmeController{
DevState: ctlpb.NvmeDevState_NORMAL,
SmdDevices: []*ctlpb.SmdDevice{
{RoleBits: 7},
},
},
},
State: new(ctlpb.ResponseState),
},
},
} {
t.Run(name, func(t *testing.T) {
log, buf := logging.NewTestLogger(t.Name())
Expand Down
5 changes: 3 additions & 2 deletions src/control/server/storage/config.go
Original file line number Diff line number Diff line change
@@ -1,5 +1,6 @@
//
// (C) Copyright 2019-2024 Intel Corporation.
// (C) Copyright 2025 Hewlett Packard Enterprise Development LP
//
// SPDX-License-Identifier: BSD-2-Clause-Patent
//
Expand Down Expand Up @@ -484,8 +485,8 @@ func (tcs TierConfigs) AssignBdevTierRoles(extMetadataPath string) error {
if scs[0].Class == ClassDcpm {
return errors.New("external metadata path for md-on-ssd invalid with dcpm scm-class")
}
// Skip role assignment and validation if no real NVMe tiers exist.
if !tcs.HaveRealNVMe() {
// Skip role assignment and validation if no bdev tiers exist.
if !tcs.HaveBdevs() {
return nil
}

Expand Down

0 comments on commit 0a2df2a

Please sign in to comment.