Made node label key configurable (#217)

romanbaron · web-flow · commit 0450532a5590 · 2025-06-10T11:54:02.000+03:00
diff --git a/cmd/scheduler/app/options/options.go b/cmd/scheduler/app/options/options.go
@@ -27,6 +27,9 @@ const (
 	DefaultPyroscopeBlockProfilerRate  = 5
 	defaultNumOfStatusRecordingWorkers = 5
 	defaultNodePoolLabelKey            = ""
+	defaultCPUWorkerNodeLabelKey       = "node-role.kubernetes.io/cpu-worker"
+	defaultGPUWorkerNodeLabelKey       = "node-role.kubernetes.io/gpu-worker"
+	defaultMIGWorkerNodeLabelKey       = "node-role.kubernetes.io/mig-enabled"
 )
 
 // ServerOption is the main context object for the controller manager.
@@ -59,6 +62,9 @@ type ServerOption struct {
 	NumOfStatusRecordingWorkers       int
 	GlobalDefaultStalenessGracePeriod time.Duration
 	PluginServerPort                  int
+	CPUWorkerNodeLabelKey             string
+	GPUWorkerNodeLabelKey             string
+	MIGWorkerNodeLabelKey             string
 
 	QPS   int
 	Burst int
@@ -105,6 +111,9 @@ func (s *ServerOption) AddFlags(fs *pflag.FlagSet) {
 	fs.IntVar(&s.NumOfStatusRecordingWorkers, "num-of-status-recording-workers", defaultNumOfStatusRecordingWorkers, "specifies the max number of go routines spawned to update pod and podgroups conditions and events. Defaults to 5")
 	fs.DurationVar(&s.GlobalDefaultStalenessGracePeriod, "default-staleness-grace-period", defaultStalenessGracePeriod, "Global default staleness grace period duration. Negative values means infinite. Defaults to 60s")
 	fs.IntVar(&s.PluginServerPort, "plugin-server-port", 8081, "The port to bind for plugin server requests")
+	fs.StringVar(&s.CPUWorkerNodeLabelKey, "cpu-worker-node-label-key", defaultCPUWorkerNodeLabelKey, "The label key for CPU worker nodes")
+	fs.StringVar(&s.GPUWorkerNodeLabelKey, "gpu-worker-node-label-key", defaultGPUWorkerNodeLabelKey, "The label key for GPU worker nodes")
+	fs.StringVar(&s.MIGWorkerNodeLabelKey, "mig-worker-node-label-key", defaultMIGWorkerNodeLabelKey, "The label key for MIG enabled worker nodes")
 
 	utilfeature.DefaultMutableFeatureGate.AddFlag(fs)
 }
diff --git a/cmd/scheduler/app/options/options_test.go b/cmd/scheduler/app/options/options_test.go
@@ -49,6 +49,9 @@ func TestAddFlags(t *testing.T) {
 		NumOfStatusRecordingWorkers:       defaultNumOfStatusRecordingWorkers,
 		NodePoolLabelKey:                  defaultNodePoolLabelKey,
 		PluginServerPort:                  8081,
+		CPUWorkerNodeLabelKey:             defaultCPUWorkerNodeLabelKey,
+		GPUWorkerNodeLabelKey:             defaultGPUWorkerNodeLabelKey,
+		MIGWorkerNodeLabelKey:             defaultMIGWorkerNodeLabelKey,
 	}
 
 	if !reflect.DeepEqual(expected, s) {
diff --git a/cmd/scheduler/app/server.go b/cmd/scheduler/app/server.go
@@ -132,6 +132,9 @@ func setupLogging(so *options.ServerOption) error {
 func setConfig(so *options.ServerOption) {
 	config := conf.GetConfig()
 	config.ResourceReservationAppLabelValue = so.ResourceReservationAppLabel
+	config.CPUWorkerNodeLabelKey = so.CPUWorkerNodeLabelKey
+	config.GPUWorkerNodeLabelKey = so.GPUWorkerNodeLabelKey
+	config.MIGWorkerNodeLabelKey = so.MIGWorkerNodeLabelKey
 }
 
 func Run(opt *options.ServerOption, config *restclient.Config, mux *http.ServeMux) error {
diff --git a/pkg/common/constants/constants.go b/pkg/common/constants/constants.go
@@ -29,7 +29,6 @@ const (
 	// Labels
 	GPUGroup                 = "runai-gpu-group"
 	MultiGpuGroupLabelPrefix = GPUGroup + "/"
-	MigEnabledLabel          = "node-role.kubernetes.io/runai-mig-enabled"
 	MigStrategyLabel         = "nvidia.com/mig.strategy"
 	GpuCountLabel            = "nvidia.com/gpu.count"
 )
diff --git a/pkg/scheduler/api/node_info/node_info.go b/pkg/scheduler/api/node_info/node_info.go
@@ -24,15 +24,14 @@ import (
 	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/api/resource_info"
 	sc_info "github.com/NVIDIA/KAI-scheduler/pkg/scheduler/api/storagecapacity_info"
 	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/api/storageclaim_info"
+	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/conf"
 	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/log"
 )
 
 const (
 	DefaultGpuMemory = 100 // The default value is 100 because it allows all the calculation of (memory = fractional * GpuMemory) to work, if it was 0 the result will always be zero too
 	GpuMemoryLabel   = "nvidia.com/gpu.memory"
 	GpuCountLabel    = "nvidia.com/gpu.count"
-	CpuWorkerNode    = "node-role.kubernetes.io/runai-cpu-worker"
-	GpuWorkerNode    = "node-role.kubernetes.io/runai-gpu-worker"
 	MbToBRatio       = 1000000
 	BitToMib         = 1024 * 1024
 	TibInMib         = 1024 * 1024
@@ -633,7 +632,8 @@ func (ni *NodeInfo) IsCPUOnlyNode() bool {
 }
 
 func (ni *NodeInfo) IsMIGEnabled() bool {
-	enabled, found := ni.Node.Labels[commonconstants.MigEnabledLabel]
+	migWorkerLabelKey := conf.GetConfig().MIGWorkerNodeLabelKey
+	enabled, found := ni.Node.Labels[migWorkerLabelKey]
 	if found {
 		isMig, err := strconv.ParseBool(enabled)
 		return err == nil && isMig
diff --git a/pkg/scheduler/api/node_info/node_info_test.go b/pkg/scheduler/api/node_info/node_info_test.go
@@ -27,7 +27,10 @@ import (
 	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/api/storagecapacity_info"
 )
 
-const MibToMbScale = 1.048576
+const (
+	MibToMbScale       = 1.048576
+	migEnabledLabelKey = "node-role.kubernetes.io/mig-enabled"
+)
 
 func nodeInfoEqual(l, r *NodeInfo) bool {
 	l.PodAffinityInfo = nil
@@ -535,10 +538,10 @@ func TestIsTaskAllocatable(t *testing.T) {
 
 func TestIsTaskAllocatableOnReleasingOrIdle(t *testing.T) {
 	singleMigNode := common_info.BuildNode("single-mig", common_info.BuildResourceListWithGPU("2000m", "2G", "8"))
-	singleMigNode.Labels[commonconstants.MigEnabledLabel] = "true"
+	singleMigNode.Labels[migEnabledLabelKey] = "true"
 
 	mixedMigNode := common_info.BuildNode("mixed-mig", common_info.BuildResourceListWithGPU("2000m", "2G", "8"))
-	mixedMigNode.Labels[commonconstants.MigEnabledLabel] = "true"
+	mixedMigNode.Labels[migEnabledLabelKey] = "true"
 	mixedMigNode.Labels[commonconstants.GpuCountLabel] = "8"
 	mixedMigNode.Labels[GpuMemoryLabel] = "40"
 
diff --git a/pkg/scheduler/cache/cluster_info/cluster_info.go b/pkg/scheduler/cache/cluster_info/cluster_info.go
@@ -429,10 +429,12 @@ func getPodGroupPriority(
 }
 
 func filterUnmarkedNodes(nodes []*v1.Node) []*v1.Node {
+	cpuWorkerLabelKey := conf.GetConfig().CPUWorkerNodeLabelKey
+	gpuWorkerLabelKey := conf.GetConfig().GPUWorkerNodeLabelKey
 	markedNodes := []*v1.Node{}
 	for _, node := range nodes {
-		_, foundGpuNode := node.Labels[node_info.GpuWorkerNode]
-		_, foundCpuNode := node.Labels[node_info.CpuWorkerNode]
+		_, foundGpuNode := node.Labels[gpuWorkerLabelKey]
+		_, foundCpuNode := node.Labels[cpuWorkerLabelKey]
 		if foundGpuNode || foundCpuNode {
 			markedNodes = append(markedNodes, node)
 			log.InfraLogger.V(6).Infof("Node: <%v> is considered by cpu or gpu label", node.Name)
diff --git a/pkg/scheduler/conf/global_config.go b/pkg/scheduler/conf/global_config.go
@@ -15,12 +15,18 @@ var (
 type GlobalConfig struct {
 	ResourceReservationAppLabelValue string
 	ScalingPodAppLabelValue          string
+	CPUWorkerNodeLabelKey            string
+	GPUWorkerNodeLabelKey            string
+	MIGWorkerNodeLabelKey            string
 }
 
 func newGlobalConfig() *GlobalConfig {
 	return &GlobalConfig{
-		ResourceReservationAppLabelValue: "kai-resource-reservation",
+		ResourceReservationAppLabelValue: "runai-reservation",
 		ScalingPodAppLabelValue:          "scaling-pod",
+		CPUWorkerNodeLabelKey:            "node-role.kubernetes.io/cpu-worker",
+		GPUWorkerNodeLabelKey:            "node-role.kubernetes.io/gpu-worker",
+		MIGWorkerNodeLabelKey:            "node-role.kubernetes.io/mig-enabled",
 	}
 }
 
diff --git a/pkg/scheduler/plugins/predicates/predicates.go b/pkg/scheduler/plugins/predicates/predicates.go
@@ -16,6 +16,7 @@ import (
 	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/api/pod_info"
 	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/api/podgroup_info"
 	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/cache/cluster_info"
+	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/conf"
 	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/framework"
 	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/k8s_internal"
 	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/k8s_internal/predicates"
@@ -229,14 +230,16 @@ func (pp *predicatesPlugin) evaluateTaskOnPredicates(
 	}
 
 	if isRestrictNodeSchedulingEnabled() {
+		gpuWorkerLabelKey := conf.GetConfig().GPUWorkerNodeLabelKey
+		cpuWorkerLabelKey := conf.GetConfig().CPUWorkerNodeLabelKey
 		if task.IsRequireAnyKindOfGPU() {
-			if _, found := node.Node.Labels[node_info.GpuWorkerNode]; !found {
+			if _, found := node.Node.Labels[gpuWorkerLabelKey]; !found {
 				log.InfraLogger.V(6).Infof("Task <%s/%s> is a GPU job and will not be allocated to a non GPU <%s>",
 					task.Namespace, task.Name, node.Name)
 				return fmt.Errorf("gpu task: <%v/%v> can't run on non gpu nodes, node: <%v>", task.Namespace, task.Name, node.Name)
 			}
 		} else {
-			if _, found := node.Node.Labels[node_info.CpuWorkerNode]; !found {
+			if _, found := node.Node.Labels[cpuWorkerLabelKey]; !found {
 				log.InfraLogger.V(6).Infof("Task <%s/%s> is a CPU job and will not be allocated to a GPU node <%s>",
 					task.Namespace, task.Name, node.Name)
 				return fmt.Errorf("cpu task: <%v/%v> can't run on non cpu nodes, node: <%v>", task.Namespace, task.Name, node.Name)
diff --git a/pkg/scheduler/plugins/proportion/proportion.go b/pkg/scheduler/plugins/proportion/proportion.go
@@ -16,6 +16,7 @@ import (
 	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/api/podgroup_info"
 	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/api/queue_info"
 	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/api/resource_info"
+	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/conf"
 	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/framework"
 	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/log"
 	"github.com/NVIDIA/KAI-scheduler/pkg/scheduler/metrics"
@@ -193,7 +194,8 @@ func getNodeResources(ssn *framework.Session, node *node_info.NodeInfo) rs.Resou
 		return nodeResource
 	}
 
-	_, found := node.Node.Labels[node_info.GpuWorkerNode]
+	gpuWorkerLabelKey := conf.GetConfig().GPUWorkerNodeLabelKey
+	_, found := node.Node.Labels[gpuWorkerLabelKey]
 	shouldIgnoreGPUs := ssn.IsRestrictNodeSchedulingEnabled() && !found
 	if shouldIgnoreGPUs {
 		nodeResource.Add(rs.NewResourceQuantities(node.Allocatable.Cpu(), node.Allocatable.Memory(), 0))
diff --git a/pkg/scheduler/plugins/proportion/proportion_test.go b/pkg/scheduler/plugins/proportion/proportion_test.go
@@ -550,7 +550,7 @@ var _ = Describe("Set Fair Share in Proportion", func() {
 					Node: &v1.Node{
 						ObjectMeta: metav1.ObjectMeta{
 							Labels: map[string]string{
-								node_info.GpuWorkerNode: "true",
+								"node-role.kubernetes.io/gpu-worker": "true",
 							},
 						},
 					},
diff --git a/pkg/scheduler/test_utils/nodes_fake/nodes.go b/pkg/scheduler/test_utils/nodes_fake/nodes.go
@@ -28,6 +28,7 @@ const (
 	memoryOverall       = "30G"
 	cpuMilliAllocatable = "20000"
 	memoryAllocatable   = "20G"
+	migEnabledLabelKey  = "node-role.kubernetes.io/mig-enabled"
 )
 
 type TestClusterTopology struct {
@@ -116,7 +117,7 @@ func buildNodeInfo(
 	node.Labels = map[string]string{
 		commonconstants.GpuCountLabel:    nodeGpuCount,
 		node_info.GpuMemoryLabel:         strconv.Itoa(node_info.DefaultGpuMemory),
-		commonconstants.MigEnabledLabel:  migEnabledLabel,
+		migEnabledLabelKey:               migEnabledLabel,
 		commonconstants.MigStrategyLabel: string(nodeMetadata.MigStrategy),
 		tasks_fake.NodeAffinityKey:       nodeName,
 	}
diff --git a/test/e2e/suites/allocate/predicates/restrict_node_scheduling_test.go b/test/e2e/suites/allocate/predicates/restrict_node_scheduling_test.go
@@ -32,8 +32,8 @@ import (
 )
 
 const (
-	cpuWorkerLabelName = "node-role.kubernetes.io/runai-cpu-worker"
-	gpuWorkerLabelName = "node-role.kubernetes.io/runai-gpu-worker"
+	cpuWorkerLabelName = "node-role.kubernetes.io/cpu-worker"
+	gpuWorkerLabelName = "node-role.kubernetes.io/gpu-worker"
 )
 
 var _ = Describe("Restrict node scheduling", Label(labels.Operated), Ordered, func() {

Original file line number	Diff line number	Diff line change
`@@ -49,6 +49,9 @@ func TestAddFlags(t *testing.T) {`
`49`	`49`	`NumOfStatusRecordingWorkers: defaultNumOfStatusRecordingWorkers,`
`50`	`50`	`NodePoolLabelKey: defaultNodePoolLabelKey,`
`51`	`51`	`PluginServerPort: 8081,`
	`52`	`+ CPUWorkerNodeLabelKey: defaultCPUWorkerNodeLabelKey,`
	`53`	`+ GPUWorkerNodeLabelKey: defaultGPUWorkerNodeLabelKey,`
	`54`	`+ MIGWorkerNodeLabelKey: defaultMIGWorkerNodeLabelKey,`
`52`	`55`	`}`
`53`	`56`
`54`	`57`	`if !reflect.DeepEqual(expected, s) {`
Original file line number	Diff line number	Diff line change
`@@ -132,6 +132,9 @@ func setupLogging(so *options.ServerOption) error {`
`132`	`132`	`func setConfig(so *options.ServerOption) {`
`133`	`133`	`config := conf.GetConfig()`
`134`	`134`	`config.ResourceReservationAppLabelValue = so.ResourceReservationAppLabel`
	`135`	`+ config.CPUWorkerNodeLabelKey = so.CPUWorkerNodeLabelKey`
	`136`	`+ config.GPUWorkerNodeLabelKey = so.GPUWorkerNodeLabelKey`
	`137`	`+ config.MIGWorkerNodeLabelKey = so.MIGWorkerNodeLabelKey`
`135`	`138`	`}`
`136`	`139`
`137`	`140`	`func Run(opt *options.ServerOption, config *restclient.Config, mux *http.ServeMux) error {`
Original file line number	Diff line number	Diff line change
`@@ -29,7 +29,6 @@ const (`
`29`	`29`	`// Labels`
`30`	`30`	`GPUGroup = "runai-gpu-group"`
`31`	`31`	`MultiGpuGroupLabelPrefix = GPUGroup + "/"`
`32`		`- MigEnabledLabel = "node-role.kubernetes.io/runai-mig-enabled"`
`33`	`32`	`MigStrategyLabel = "nvidia.com/mig.strategy"`
`34`	`33`	`GpuCountLabel = "nvidia.com/gpu.count"`
`35`	`34`	`)`
Original file line number	Diff line number	Diff line change
`@@ -15,12 +15,18 @@ var (`
`15`	`15`	`type GlobalConfig struct {`
`16`	`16`	`ResourceReservationAppLabelValue string`
`17`	`17`	`ScalingPodAppLabelValue string`
	`18`	`+ CPUWorkerNodeLabelKey string`
	`19`	`+ GPUWorkerNodeLabelKey string`
	`20`	`+ MIGWorkerNodeLabelKey string`
`18`	`21`	`}`
`19`	`22`
`20`	`23`	`func newGlobalConfig() *GlobalConfig {`
`21`	`24`	`return &GlobalConfig{`
`22`		`- ResourceReservationAppLabelValue: "kai-resource-reservation",`
	`25`	`+ ResourceReservationAppLabelValue: "runai-reservation",`
`23`	`26`	`ScalingPodAppLabelValue: "scaling-pod",`
	`27`	`+ CPUWorkerNodeLabelKey: "node-role.kubernetes.io/cpu-worker",`
	`28`	`+ GPUWorkerNodeLabelKey: "node-role.kubernetes.io/gpu-worker",`
	`29`	`+ MIGWorkerNodeLabelKey: "node-role.kubernetes.io/mig-enabled",`
`24`	`30`	`}`
`25`	`31`	`}`
`26`	`32`