
Commit 308dcd7

Move utils/locks.go to /pkg
1 parent af840a4 commit 308dcd7

6 files changed: +48, -47 lines
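
The change itself is mechanical: the lock helpers move out of the catch-all utils package into a dedicated pkg/locks package, and every call site swaps the import path and the package qualifier. A minimal before/after sketch of a caller, assuming the Trident module is on the import path (doNodeOperation and volumeID are placeholder names, not symbols from this commit):

package example

// Before this commit, callers reached the lock helpers through the utils package:
//
//     import "github.com/netapp/trident/utils"
//     utils.Lock(ctx, "NodeStageVolume", volumeID)
//     defer utils.Unlock(ctx, "NodeStageVolume", volumeID)
//
// After this commit, the same helpers come from pkg/locks:

import (
	"context"

	"github.com/netapp/trident/pkg/locks"
)

func doNodeOperation(ctx context.Context, volumeID string) {
	locks.Lock(ctx, "NodeStageVolume", volumeID)
	defer locks.Unlock(ctx, "NodeStageVolume", volumeID)
	// ... work that must be serialized per volume ...
}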

frontend/csi/node_server.go

Lines changed: 19 additions & 18 deletions

@@ -28,6 +28,7 @@ import (
 	. "github.com/netapp/trident/logging"
 	"github.com/netapp/trident/pkg/collection"
 	"github.com/netapp/trident/pkg/convert"
+	"github.com/netapp/trident/pkg/locks"
 	sa "github.com/netapp/trident/storage_attribute"
 	"github.com/netapp/trident/utils"
 	"github.com/netapp/trident/utils/devices"
@@ -105,7 +106,7 @@ const (
 
 func attemptLock(ctx context.Context, lockContext, lockID string, lockTimeout time.Duration) bool {
 	startTime := time.Now()
-	utils.Lock(ctx, lockContext, lockID)
+	locks.Lock(ctx, lockContext, lockID)
 	// Fail if the gRPC call came in a long time ago to avoid kubelet 120s timeout
 	if time.Since(startTime) > lockTimeout {
 		Logc(ctx).Debugf("Request spent more than %v in the queue and timed out", csiNodeLockTimeout)
@@ -127,7 +128,7 @@ func (p *Plugin) NodeStageVolume(
 	defer Logc(ctx).WithFields(fields).Debug("<<<< NodeStageVolume")
 
 	lockContext := "NodeStageVolume"
-	defer utils.Unlock(ctx, lockContext, req.GetVolumeId())
+	defer locks.Unlock(ctx, lockContext, req.GetVolumeId())
 	if !attemptLock(ctx, lockContext, req.GetVolumeId(), csiNodeLockTimeout) {
 		return nil, status.Error(codes.Aborted, "request waited too long for the lock")
 	}
@@ -181,7 +182,7 @@ func (p *Plugin) nodeUnstageVolume(
 	defer Logc(ctx).WithFields(fields).Debug("<<<< NodeUnstageVolume")
 
 	lockContext := "NodeUnstageVolume"
-	defer utils.Unlock(ctx, lockContext, req.GetVolumeId())
+	defer locks.Unlock(ctx, lockContext, req.GetVolumeId())
 	if !attemptLock(ctx, lockContext, req.GetVolumeId(), csiNodeLockTimeout) {
 		return nil, status.Error(codes.Aborted, "request waited too long for the lock")
 	}
@@ -269,7 +270,7 @@ func (p *Plugin) NodePublishVolume(
 	defer Logc(ctx).WithFields(fields).Debug("<<<< NodePublishVolume")
 
 	lockContext := "NodePublishVolume"
-	defer utils.Unlock(ctx, lockContext, req.GetVolumeId())
+	defer locks.Unlock(ctx, lockContext, req.GetVolumeId())
 	if !attemptLock(ctx, lockContext, req.GetVolumeId(), csiNodeLockTimeout) {
 		return nil, status.Error(codes.Aborted, "request waited too long for the lock")
 	}
@@ -326,7 +327,7 @@ func (p *Plugin) NodeUnpublishVolume(
 	defer Logc(ctx).WithFields(fields).Debug("<<<< NodeUnpublishVolume")
 
 	lockContext := "NodeUnpublishVolume"
-	defer utils.Unlock(ctx, lockContext, req.GetVolumeId())
+	defer locks.Unlock(ctx, lockContext, req.GetVolumeId())
 	if !attemptLock(ctx, lockContext, req.GetVolumeId(), csiNodeLockTimeout) {
 		return nil, status.Error(codes.Aborted, "request waited too long for the lock")
 	}
@@ -1553,7 +1554,7 @@ func (p *Plugin) nodeUnstageFCPVolumeRetry(
 ) (*csi.NodeUnstageVolumeResponse, error) {
 	// Serializing all the parallel requests by relying on the constant var.
 	lockContext := "NodeUnstageFCPVolume-" + req.GetVolumeId()
-	defer utils.Unlock(ctx, lockContext, nodeLockID)
+	defer locks.Unlock(ctx, lockContext, nodeLockID)
 
 	if !attemptLock(ctx, lockContext, nodeLockID, csiNodeLockTimeout) {
 		return nil, status.Error(codes.Aborted, "request waited too long for the lock")
@@ -1588,7 +1589,7 @@ func (p *Plugin) nodePublishFCPVolume(
 ) (*csi.NodePublishVolumeResponse, error) {
 	// Serializing all the parallel requests by relying on the constant var.
 	lockContext := "NodePublishFCPVolume-" + req.GetVolumeId()
-	defer utils.Unlock(ctx, lockContext, nodeLockID)
+	defer locks.Unlock(ctx, lockContext, nodeLockID)
 
 	if !attemptLock(ctx, lockContext, nodeLockID, csiNodeLockTimeout) {
 		return nil, status.Error(codes.Aborted, "request waited too long for the lock")
@@ -2090,7 +2091,7 @@ func (p *Plugin) nodeUnstageISCSIVolumeRetry(
 ) (*csi.NodeUnstageVolumeResponse, error) {
 	// Serializing all the parallel requests by relying on the constant var.
 	lockContext := "NodeUnstageISCSIVolume-" + req.GetVolumeId()
-	defer utils.Unlock(ctx, lockContext, nodeLockID)
+	defer locks.Unlock(ctx, lockContext, nodeLockID)
 
 	if !attemptLock(ctx, lockContext, nodeLockID, csiNodeLockTimeout) {
 		return nil, status.Error(codes.Aborted, "request waited too long for the lock")
@@ -2125,7 +2126,7 @@ func (p *Plugin) nodePublishISCSIVolume(
 ) (*csi.NodePublishVolumeResponse, error) {
 	// Serializing all the parallel requests by relying on the constant var.
 	lockContext := "NodePublishISCSIVolume-" + req.GetVolumeId()
-	defer utils.Unlock(ctx, lockContext, nodeLockID)
+	defer locks.Unlock(ctx, lockContext, nodeLockID)
 
 	if !attemptLock(ctx, lockContext, nodeLockID, csiNodeLockTimeout) {
 		return nil, status.Error(codes.Aborted, "request waited too long for the lock")
@@ -2655,8 +2656,8 @@ func (p *Plugin) updateCHAPInfoForSessions(
 // performISCSISelfHealing inspects the desired state of the iSCSI sessions with the current state and accordingly
 // identifies candidate sessions that require remediation. This function is invoked periodically.
 func (p *Plugin) performISCSISelfHealing(ctx context.Context) {
-	utils.Lock(ctx, iSCSISelfHealingLockContext, nodeLockID)
-	defer utils.Unlock(ctx, iSCSISelfHealingLockContext, nodeLockID)
+	locks.Lock(ctx, iSCSISelfHealingLockContext, nodeLockID)
+	defer locks.Unlock(ctx, iSCSISelfHealingLockContext, nodeLockID)
 
 	defer func() {
 		if r := recover(); r != nil {
@@ -2742,7 +2743,7 @@ func (p *Plugin) fixISCSISessions(ctx context.Context, portals []string, portalT
 
 		// Check if there is a need to stop the loop from running
 		// NOTE: The loop should run at least once for all portal types.
-		if idx > 0 && utils.WaitQueueSize(nodeLockID) > 0 {
+		if idx > 0 && locks.WaitQueueSize(nodeLockID) > 0 {
 			// Check to see if some other operation(s) requires node lock, if not then continue to resolve
 			// non-stale iSCSI portal issues else break out of this loop.
 			if isNonStaleSessionFix {
@@ -2913,7 +2914,7 @@ func (p *Plugin) nodeUnstageNVMeVolume(
 ) (*csi.NodeUnstageVolumeResponse, error) {
 	// Serializing all the parallel requests by relying on the constant var.
 	lockContext := "NodeUnstageNVMeVolume-" + req.GetVolumeId()
-	defer utils.Unlock(ctx, lockContext, nodeLockID)
+	defer locks.Unlock(ctx, lockContext, nodeLockID)
 
 	if !attemptLock(ctx, lockContext, nodeLockID, csiNodeLockTimeout) {
 		return nil, status.Error(codes.Aborted, "request waited too long for the lock")
@@ -3057,7 +3058,7 @@ func (p *Plugin) nodePublishNVMeVolume(
 ) (*csi.NodePublishVolumeResponse, error) {
 	// Serializing all the parallel requests by relying on the constant var.
 	lockContext := "NodePublishNVMeVolume-" + req.GetVolumeId()
-	defer utils.Unlock(ctx, lockContext, nodeLockID)
+	defer locks.Unlock(ctx, lockContext, nodeLockID)
 
 	if !attemptLock(ctx, lockContext, nodeLockID, csiNodeLockTimeout) {
 		return nil, status.Error(codes.Aborted, "request waited too long for the lock")
@@ -3128,7 +3129,7 @@ func (p *Plugin) nodeStageSANVolume(
 ) (*csi.NodeStageVolumeResponse, error) {
 	// Serializing all the parallel requests by relying on the constant var.
 	lockContext := "NodeStageSanVolume-" + req.GetVolumeId()
-	defer utils.Unlock(ctx, lockContext, nodeLockID)
+	defer locks.Unlock(ctx, lockContext, nodeLockID)
 
 	if !attemptLock(ctx, lockContext, nodeLockID, csiNodeLockTimeout) {
 		return nil, status.Error(codes.Aborted, "request waited too long for the lock")
@@ -3190,8 +3191,8 @@ func (p *Plugin) nodeStageSANVolume(
 // performNVMeSelfHealing inspects the desired state of the NVMe sessions with the current state and accordingly
 // identifies candidate sessions that require remediation. This function is invoked periodically.
 func (p *Plugin) performNVMeSelfHealing(ctx context.Context) {
-	utils.Lock(ctx, nvmeSelfHealingLockContext, nodeLockID)
-	defer utils.Unlock(ctx, nvmeSelfHealingLockContext, nodeLockID)
+	locks.Lock(ctx, nvmeSelfHealingLockContext, nodeLockID)
+	defer locks.Unlock(ctx, nvmeSelfHealingLockContext, nodeLockID)
 
 	defer func() {
 		if r := recover(); r != nil {
@@ -3240,7 +3241,7 @@ func (p *Plugin) fixNVMeSessions(ctx context.Context, stopAt time.Time, subsyste
 		// 1. We should fix at least one subsystem in a single self-healing thread.
 		// 2. If there's another thread waiting for the node lock and if we have exceeded our 60 secs lock, we should
 		//    stop NVMe self-healing.
-		if index > 0 && utils.WaitQueueSize(nodeLockID) > 0 && time.Now().After(stopAt) {
+		if index > 0 && locks.WaitQueueSize(nodeLockID) > 0 && time.Now().After(stopAt) {
 			Logc(ctx).Info("Self-healing has exceeded maximum runtime; preempting NVMe session self-healing.")
 			break
 		}
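
One detail worth calling out in these hunks: attemptLock always ends up holding the lock, because locks.Lock blocks until the named lock is acquired; the boolean only reports whether the wait exceeded the timeout. That is why every handler defers locks.Unlock before calling attemptLock. A condensed sketch of the pattern, with placeholder names for anything not shown in this diff (handleNodeOp, and the 60-second timeout value):

package example

import (
	"context"
	"errors"
	"time"

	"github.com/netapp/trident/pkg/locks"
)

// Assumed value for illustration; the real csiNodeLockTimeout is defined elsewhere in node_server.go.
const csiNodeLockTimeout = 60 * time.Second

// attemptLock mirrors the helper in the diff: block until the named lock is
// held, then report whether the wait stayed within lockTimeout.
func attemptLock(ctx context.Context, lockContext, lockID string, lockTimeout time.Duration) bool {
	startTime := time.Now()
	locks.Lock(ctx, lockContext, lockID)
	return time.Since(startTime) <= lockTimeout
}

// handleNodeOp is a hypothetical gRPC handler body showing the defer-then-attempt ordering.
func handleNodeOp(ctx context.Context, volumeID string) error {
	lockContext := "NodeStageVolume"
	// Deferred first: even when attemptLock reports a timeout, the lock was acquired and must be released.
	defer locks.Unlock(ctx, lockContext, volumeID)
	if !attemptLock(ctx, lockContext, volumeID, csiNodeLockTimeout) {
		return errors.New("request waited too long for the lock")
	}
	// ... perform the node operation while holding the per-volume lock ...
	return nil
}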

frontend/csi/node_server_test.go

Lines changed: 10 additions & 10 deletions

@@ -34,8 +34,8 @@ import (
 	mock_nvme "github.com/netapp/trident/mocks/mock_utils/nvme"
 	"github.com/netapp/trident/pkg/collection"
 	"github.com/netapp/trident/pkg/convert"
+	"github.com/netapp/trident/pkg/locks"
 	sa "github.com/netapp/trident/storage_attribute"
-	"github.com/netapp/trident/utils"
 	"github.com/netapp/trident/utils/devices"
 	"github.com/netapp/trident/utils/errors"
 	"github.com/netapp/trident/utils/filesystem"
@@ -1263,9 +1263,9 @@ func TestFixISCSISessions(t *testing.T) {
 			portals := getPortals(input.PublishedPortals, input.PortalActions)
 
 			if input.AddNewNodeOps {
-				go utils.Lock(ctx, "test-lock1", nodeLockID)
+				go locks.Lock(ctx, "test-lock1", nodeLockID)
 				snooze(10)
-				go utils.Lock(ctx, "test-lock2", nodeLockID)
+				go locks.Lock(ctx, "test-lock2", nodeLockID)
 				snooze(10)
 			}
 
@@ -1290,16 +1290,16 @@ func TestFixISCSISessions(t *testing.T) {
 			}
 
 			if input.AddNewNodeOps {
-				utils.Unlock(ctx, "test-lock1", nodeLockID)
+				locks.Unlock(ctx, "test-lock1", nodeLockID)
 
 				// Wait for the lock to be released
-				for utils.WaitQueueSize(nodeLockID) > 1 {
+				for locks.WaitQueueSize(nodeLockID) > 1 {
 					snooze(10)
 				}
 
 				// Give some time for another context to acquire the lock
 				snooze(100)
-				utils.Unlock(ctx, "test-lock2", nodeLockID)
+				locks.Unlock(ctx, "test-lock2", nodeLockID)
 			}
 		})
 	}
@@ -1825,13 +1825,13 @@ func TestAttemptLock_Failure(t *testing.T) {
 		expected := attemptLock(ctx, lockContext, nodeLockID, lockTimeout)
 
 		assert.False(t, expected)
-		utils.Unlock(ctx, lockContext, nodeLockID)
+		locks.Unlock(ctx, lockContext, nodeLockID)
 	}()
 	// first request goes to sleep holding the lock
 	if expected {
 		time.Sleep(500 * time.Millisecond)
 	}
-	utils.Unlock(ctx, lockContext, nodeLockID)
+	locks.Unlock(ctx, lockContext, nodeLockID)
 	wg.Wait()
 }
 
@@ -1860,13 +1860,13 @@ func TestAttemptLock_Success(t *testing.T) {
 		expected := attemptLock(ctx, lockContext, nodeLockID, lockTimeout)
 
 		assert.True(t, expected)
-		utils.Unlock(ctx, lockContext, nodeLockID)
+		locks.Unlock(ctx, lockContext, nodeLockID)
	}()
 	// first request goes to sleep holding the lock
 	if expected {
 		time.Sleep(200 * time.Millisecond)
 	}
-	utils.Unlock(ctx, lockContext, nodeLockID)
+	locks.Unlock(ctx, lockContext, nodeLockID)
 	wg.Wait()
 }
 

frontend/csi/volume_publish_manager.go

Lines changed: 3 additions & 3 deletions

@@ -18,7 +18,7 @@ import (
 	"github.com/netapp/trident/config"
 	"github.com/netapp/trident/internal/fiji"
 	. "github.com/netapp/trident/logging"
-	"github.com/netapp/trident/utils"
+	"github.com/netapp/trident/pkg/locks"
 	"github.com/netapp/trident/utils/errors"
 	"github.com/netapp/trident/utils/filesystem"
 	"github.com/netapp/trident/utils/models"
@@ -100,7 +100,7 @@ func (v *VolumePublishManager) WriteTrackingInfo(
 
 	// we can have locks on filename itself.
 	lockContext := "WriteTrackingInfo"
-	defer utils.Unlock(ctx, lockContext, filename)
+	defer locks.Unlock(ctx, lockContext, filename)
 	if !attemptLock(ctx, lockContext, filename, csiNodeLockTimeout) {
 		return status.Error(codes.Aborted, "request waited too long for the lock")
 	}
@@ -144,7 +144,7 @@ func (v *VolumePublishManager) readTrackingInfo(
 	}
 
 	lockContext := "ReadTrackingInfo"
-	defer utils.Unlock(ctx, lockContext, filename)
+	defer locks.Unlock(ctx, lockContext, filename)
 	if !attemptLock(ctx, lockContext, filename, csiNodeLockTimeout) {
 		return nil, status.Error(codes.Aborted, "request waited too long for the lock on tracking file")
 	}
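
The tracking-file paths use the same pattern, but the lock ID is the tracking filename rather than a volume ID, so readers and writers of the same file are serialized while different files proceed independently. A hypothetical sketch of that idea (writeTrackingFileSafely and the plain os.WriteFile call are placeholders; attemptLock and csiNodeLockTimeout are the assumed helpers sketched above):

package example

import (
	"context"
	"errors"
	"os"

	"github.com/netapp/trident/pkg/locks"
)

// writeTrackingFileSafely serializes writers of the same tracking file by locking on its name.
func writeTrackingFileSafely(ctx context.Context, filename string, data []byte) error {
	lockContext := "WriteTrackingInfo"
	defer locks.Unlock(ctx, lockContext, filename)
	if !attemptLock(ctx, lockContext, filename, csiNodeLockTimeout) {
		return errors.New("request waited too long for the lock")
	}
	// Placeholder for the real tracking-file serialization and write logic.
	return os.WriteFile(filename, data, 0o600)
}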

utils/locks.go renamed to pkg/locks/locks.go

Lines changed: 2 additions & 2 deletions

@@ -1,6 +1,6 @@
-// Copyright 2022 NetApp, Inc. All Rights Reserved.
+// Copyright 2025 NetApp, Inc. All Rights Reserved.
 
-package utils
+package locks
 
 import (
 	"context"
Lines changed: 1 addition & 1 deletion

@@ -1,6 +1,6 @@
 // Copyright 2018 NetApp, Inc. All Rights Reserved.
 
-package utils
+package locks
 
 import (
 	"context"

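The renamed package's contents are not shown beyond these headers, but the call sites above pin down its public surface: Lock and Unlock take a context, a free-form lockContext used for logging, and a lockID that names the lock, and WaitQueueSize reports how many callers are queued on a given lockID. Purely as an illustration of that surface (this is not Trident's implementation), a named-lock registry with those three functions might look like this:

package locks

import (
	"context"
	"sync"
)

var (
	mu      sync.Mutex
	lockChs = map[string]chan struct{}{} // a one-slot channel acts as the mutex for each lock ID
	waiters = map[string]int{}           // callers currently queued per lock ID
)

func getLockCh(lockID string) chan struct{} {
	mu.Lock()
	defer mu.Unlock()
	ch, ok := lockChs[lockID]
	if !ok {
		ch = make(chan struct{}, 1)
		lockChs[lockID] = ch
	}
	return ch
}

// Lock blocks until the lock named lockID is acquired; lockContext identifies the caller for tracing.
func Lock(_ context.Context, lockContext, lockID string) {
	ch := getLockCh(lockID)
	mu.Lock()
	waiters[lockID]++
	mu.Unlock()
	ch <- struct{}{} // blocks while another caller holds the lock
	mu.Lock()
	waiters[lockID]--
	mu.Unlock()
}

// Unlock releases the lock named lockID.
func Unlock(_ context.Context, lockContext, lockID string) {
	<-getLockCh(lockID)
}

// WaitQueueSize reports how many callers are currently queued for the lock named lockID.
func WaitQueueSize(lockID string) int {
	mu.Lock()
	defer mu.Unlock()
	return waiters[lockID]
}
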
storage_drivers/ontap/ontap_nas_qtree.go

Lines changed: 13 additions & 13 deletions

@@ -23,12 +23,12 @@ import (
 	"github.com/netapp/trident/pkg/capacity"
 	"github.com/netapp/trident/pkg/collection"
 	"github.com/netapp/trident/pkg/convert"
+	"github.com/netapp/trident/pkg/locks"
 	"github.com/netapp/trident/storage"
 	sa "github.com/netapp/trident/storage_attribute"
 	drivers "github.com/netapp/trident/storage_drivers"
 	"github.com/netapp/trident/storage_drivers/ontap/api"
 	"github.com/netapp/trident/storage_drivers/ontap/awsapi"
-	"github.com/netapp/trident/utils"
 	"github.com/netapp/trident/utils/errors"
 	"github.com/netapp/trident/utils/models"
 )
@@ -326,8 +326,8 @@ func (d *NASQtreeStorageDriver) Create(
 	defer Logd(ctx, d.Name(), d.Config.DebugTraceFlags["method"]).WithFields(fields).Trace("<<<< Create")
 
 	// Ensure any Flexvol we create won't be pruned before we place a qtree on it
-	utils.Lock(ctx, "create", d.sharedLockID)
-	defer utils.Unlock(ctx, "create", d.sharedLockID)
+	locks.Lock(ctx, "create", d.sharedLockID)
+	defer locks.Unlock(ctx, "create", d.sharedLockID)
 
 	// Generic user-facing message
 	createError := errors.New("volume creation failed")
@@ -578,8 +578,8 @@ func (d *NASQtreeStorageDriver) Destroy(ctx context.Context, volConfig *storage.
 	defer Logd(ctx, d.Name(), d.Config.DebugTraceFlags["method"]).WithFields(fields).Trace("<<<< Destroy")
 
 	// Ensure the deleted qtree reaping job doesn't interfere with this workflow
-	utils.Lock(ctx, "destroy", d.sharedLockID)
-	defer utils.Unlock(ctx, "destroy", d.sharedLockID)
+	locks.Lock(ctx, "destroy", d.sharedLockID)
+	defer locks.Unlock(ctx, "destroy", d.sharedLockID)
 
 	// Generic user-facing message
 	deleteError := errors.New("volume deletion failed")
@@ -1603,8 +1603,8 @@ func (d *NASQtreeStorageDriver) queueAllFlexvolsForQuotaResize(ctx context.Conte
 // operation will be attempted each time this method is called until it succeeds.
 func (d *NASQtreeStorageDriver) resizeQuotas(ctx context.Context) {
 	// Ensure we don't forget any Flexvol that is involved in a qtree provisioning workflow
-	utils.Lock(ctx, "resize", d.sharedLockID)
-	defer utils.Unlock(ctx, "resize", d.sharedLockID)
+	locks.Lock(ctx, "resize", d.sharedLockID)
+	defer locks.Unlock(ctx, "resize", d.sharedLockID)
 
 	Logc(ctx).Debug("Housekeeping, resizing quotas.")
 
@@ -1649,8 +1649,8 @@ func (d *NASQtreeStorageDriver) getTotalHardDiskLimitQuota(ctx context.Context,
 // hardcoded prefix on their names) that have no qtrees are deleted.
 func (d *NASQtreeStorageDriver) pruneUnusedFlexvols(ctx context.Context) {
 	// Ensure we don't prune any Flexvol that is involved in a qtree provisioning workflow
-	utils.Lock(ctx, "prune", d.sharedLockID)
-	defer utils.Unlock(ctx, "prune", d.sharedLockID)
+	locks.Lock(ctx, "prune", d.sharedLockID)
+	defer locks.Unlock(ctx, "prune", d.sharedLockID)
 
 	Logc(ctx).Debug("Housekeeping, checking for managed Flexvols with no qtrees.")
 
@@ -1729,8 +1729,8 @@ func (d *NASQtreeStorageDriver) pruneUnusedFlexvols(ctx context.Context) {
 // destroy call failed or was never made due to a process interruption.
 func (d *NASQtreeStorageDriver) reapDeletedQtrees(ctx context.Context) {
 	// Ensure we don't reap any qtree that is involved in a qtree delete workflow
-	utils.Lock(ctx, "reap", d.sharedLockID)
-	defer utils.Unlock(ctx, "reap", d.sharedLockID)
+	locks.Lock(ctx, "reap", d.sharedLockID)
+	defer locks.Unlock(ctx, "reap", d.sharedLockID)
 
 	Logc(ctx).Debug("Housekeeping, checking for deleted qtrees.")
 
@@ -2288,8 +2288,8 @@ func (d *NASQtreeStorageDriver) Resize(ctx context.Context, volConfig *storage.V
 	}
 
 	// Ensure any Flexvol won't be pruned before resize is completed.
-	utils.Lock(ctx, "resize", d.sharedLockID)
-	defer utils.Unlock(ctx, "resize", d.sharedLockID)
+	locks.Lock(ctx, "resize", d.sharedLockID)
+	defer locks.Unlock(ctx, "resize", d.sharedLockID)
 
 	// Generic user-facing message
 	resizeError := errors.New("storage driver failed to resize the volume")
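
Across this driver, the provisioning paths (Create, Destroy, Resize) and the periodic housekeeping jobs (resizeQuotas, pruneUnusedFlexvols, reapDeletedQtrees) all serialize on the same d.sharedLockID, so a Flexvol cannot be pruned, nor a deleted qtree reaped, while a provisioning workflow that depends on it is in flight. A stripped-down sketch of that coordination (qtreeDriver and its method bodies are placeholders, not the real driver):

package example

import (
	"context"

	"github.com/netapp/trident/pkg/locks"
)

type qtreeDriver struct {
	sharedLockID string // one lock ID shared by provisioning and housekeeping
}

func (d *qtreeDriver) Create(ctx context.Context) {
	// Ensure any Flexvol we create won't be pruned before we place a qtree on it.
	locks.Lock(ctx, "create", d.sharedLockID)
	defer locks.Unlock(ctx, "create", d.sharedLockID)
	// ... provision the qtree on a Flexvol ...
}

func (d *qtreeDriver) pruneUnusedFlexvols(ctx context.Context) {
	// Housekeeping waits here while any create/destroy/resize holds the shared lock.
	locks.Lock(ctx, "prune", d.sharedLockID)
	defer locks.Unlock(ctx, "prune", d.sharedLockID)
	// ... delete managed Flexvols that no longer contain qtrees ...
}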
