rbd: add manager.CreateVolumeGroupSnapshot()

Implement the CreateVolumeGroupSnapshot for the rbd.Manager. A Group
Controller Server can use the rbd.Manager to create VolumeGroupSnapshots
in an easy an idempotent way.

Signed-off-by: Niels de Vos <ndevos@ibm.com>
This commit is contained in:
Niels de Vos 2024-08-28 17:46:22 +02:00 committed by mergify[bot]
parent 9bea3feff1
commit 7563f4285d
2 changed files with 163 additions and 0 deletions

View File

@ -114,6 +114,57 @@ func (mgr *rbdManager) getVolumeGroupJournal(clusterID string) (journal.VolumeGr
return vgJournal, nil return vgJournal, nil
} }
// getGroupUUID checks if a UUID in the volume group journal is already
// reserved. If none is reserved, a new reservation is made. Upon exit of
// getGroupUUID, the function returns:
// 1. the UUID that was reserved
// 2. an undo() function that reverts the reservation (if that succeeded), should be called in a defer
// 3. an error or nil.
func (mgr *rbdManager) getGroupUUID(
ctx context.Context,
clusterID, journalPool, name, prefix string,
) (string, func(), error) {
nothingToUndo := func() {
// the reservation was not done, no need to undo the reservation
}
vgJournal, err := mgr.getVolumeGroupJournal(clusterID)
if err != nil {
return "", nothingToUndo, err
}
vgsData, err := vgJournal.CheckReservation(ctx, journalPool, name, prefix)
if err != nil {
return "", nothingToUndo, fmt.Errorf("failed to check reservation for group %q: %w", name, err)
}
var uuid string
if vgsData != nil && vgsData.GroupUUID != "" {
uuid = vgsData.GroupUUID
} else {
log.DebugLog(ctx, "the journal does not contain a reservation for group %q yet", name)
uuid, _ /*vgsName*/, err = vgJournal.ReserveName(ctx, journalPool, name, prefix)
if err != nil {
return "", nothingToUndo, fmt.Errorf("failed to reserve a UUID for group %q: %w", name, err)
}
}
log.DebugLog(ctx, "got UUID %q for group %q", uuid, name)
// undo contains the cleanup that should be done by the caller when the
// reservation was made, and further actions fulfilling the final
// request failed
undo := func() {
err = vgJournal.UndoReservation(ctx, journalPool, uuid, name)
if err != nil {
log.ErrorLog(ctx, "failed to undo the reservation for group %q: %w", name, err)
}
}
return uuid, undo, nil
}
func (mgr *rbdManager) GetVolumeByID(ctx context.Context, id string) (types.Volume, error) { func (mgr *rbdManager) GetVolumeByID(ctx context.Context, id string) (types.Volume, error) {
creds, err := mgr.getCredentials() creds, err := mgr.getCredentials()
if err != nil { if err != nil {
@ -268,3 +319,108 @@ func (mgr *rbdManager) CreateVolumeGroup(ctx context.Context, name string) (type
return vg, nil return vg, nil
} }
func (mgr *rbdManager) CreateVolumeGroupSnapshot(
ctx context.Context,
vg types.VolumeGroup,
name string,
) (types.VolumeGroupSnapshot, error) {
pool, err := vg.GetPool(ctx)
if err != nil {
return nil, err
}
// groupNamePrefix is an optional parameter, can be an empty string
prefix := mgr.parameters["groupNamePrefix"]
clusterID, err := vg.GetClusterID(ctx)
if err != nil {
return nil, fmt.Errorf("failed to get cluster id for volume group snapshot %q: %w", vg, err)
}
uuid, freeUUID, err := mgr.getGroupUUID(ctx, clusterID, pool, name, prefix)
if err != nil {
return nil, fmt.Errorf("failed to get a UUID for volume group snapshot %q: %w", vg, err)
}
defer func() {
// no error, no need to undo the reservation
if err == nil {
return
}
freeUUID()
}()
monitors, err := util.Mons(util.CsiConfigFile, clusterID)
if err != nil {
return nil, fmt.Errorf("failed to find MONs for cluster %q: %w", clusterID, err)
}
_ /*journalPoolID*/, poolID, err := util.GetPoolIDs(ctx, monitors, pool, pool, mgr.creds)
if err != nil {
return nil, fmt.Errorf("failed to get PoolID for %q: %w", pool, err)
}
groupID, err := util.GenerateVolID(ctx, monitors, mgr.creds, poolID, pool, clusterID, uuid)
if err != nil {
return nil, fmt.Errorf("failed to generate a unique CSI volume group with uuid for %q: %w", uuid, err)
}
vgs, err := rbd_group.GetVolumeGroupSnapshot(ctx, groupID, mgr.csiID, mgr.creds, mgr)
if vgs != nil {
log.DebugLog(ctx, "found existing volume group snapshot %q for id %q", vgs, groupID)
// validate the contents of the vgs
snapshots, vgsErr := vgs.ListSnapshots(ctx)
if vgsErr != nil {
return nil, fmt.Errorf("failed to list snapshots of existing volume group snapshot %q: %w", vgs, vgsErr)
}
volumes, vgErr := vg.ListVolumes(ctx)
if vgErr != nil {
return nil, fmt.Errorf("failed to list volumes of volume group %q: %w", vg, vgErr)
}
// return the existing vgs if the contents matches
// TODO: improve contents verification, length is a very minimal check
if len(snapshots) == len(volumes) {
log.DebugLog(ctx, "existing volume group snapshot %q contains %d snapshots", vgs, len(snapshots))
return vgs, nil
}
} else if err != nil && !errors.Is(ErrImageNotFound, err) {
// ErrImageNotFound can be returned if the VolumeGroupSnapshot
// could not be found. It is expected that it does not exist
// yet, in which case it will be created below.
return nil, fmt.Errorf("failed to check for existing volume group snapshot with id %q: %w", groupID, err)
}
snapshots, err := vg.CreateSnapshots(ctx, mgr.creds, groupID)
if err != nil {
return nil, fmt.Errorf("failed to create volume group snapshot %q: %w", name, err)
}
defer func() {
// cleanup created snapshots in case there was a failure
if err == nil {
return
}
for _, snap := range snapshots {
delErr := snap.Delete(ctx)
if delErr != nil {
log.ErrorLog(ctx, "failed to delete snapshot %q: %v", snap, delErr)
}
}
}()
log.DebugLog(ctx, "volume group snapshot %q contains %d snapshots: %v", name, len(snapshots), snapshots)
vgs, err = rbd_group.NewVolumeGroupSnapshot(ctx, groupID, mgr.csiID, mgr.creds, snapshots)
if err != nil {
return nil, fmt.Errorf("failed to create new volume group snapshot %q: %w", name, err)
}
log.DebugLog(ctx, "volume group snapshot %q has been created", vgs)
return vgs, nil
}

View File

@ -52,4 +52,11 @@ type Manager interface {
// CreateVolumeGroup allocates a new VolumeGroup in the backend storage // CreateVolumeGroup allocates a new VolumeGroup in the backend storage
// and records details about it in the journal. // and records details about it in the journal.
CreateVolumeGroup(ctx context.Context, name string) (VolumeGroup, error) CreateVolumeGroup(ctx context.Context, name string) (VolumeGroup, error)
// CreateVolumeGroupSnapshot instructs the Manager to create a
// VolumeGroupSnapshot from the VolumeGroup. All snapshots in the
// returned VolumeGroupSnapshot have been taken while I/O on the
// VolumeGroup was paused, the snapshots in the group are crash
// consistent.
CreateVolumeGroupSnapshot(ctx context.Context, vg VolumeGroup, name string) (VolumeGroupSnapshot, error)
} }