@@ -11,8 +11,6 @@ import (
1111)
1212
1313const (
14- RunaiNamespace = "runai"
15-
1614 // OnSessionOpen label
1715 OnSessionOpen = "OnSessionOpen"
1816
@@ -22,48 +20,49 @@ const (
2220
2321var (
2422 currentAction string
23+ subsystemName string
2524
2625 e2eSchedulingLatency = promauto .NewGauge (
2726 prometheus.GaugeOpts {
28- Subsystem : RunaiNamespace ,
27+ Subsystem : subsystemName ,
2928 Name : "e2e_scheduling_latency_milliseconds" ,
3029 Help : "E2e scheduling latency in milliseconds (scheduling algorithm + binding), as a gauge" ,
3130 },
3231 )
3332
3433 openSessionLatency = promauto .NewGauge (
3534 prometheus.GaugeOpts {
36- Subsystem : RunaiNamespace ,
35+ Subsystem : subsystemName ,
3736 Name : "open_session_latency_milliseconds" ,
3837 Help : "Open session latency in milliseconds, including all plugins, as a gauge" ,
3938 },
4039 )
4140
4241 closeSessionLatency = promauto .NewGauge (
4342 prometheus.GaugeOpts {
44- Subsystem : RunaiNamespace ,
43+ Subsystem : subsystemName ,
4544 Name : "close_session_latency_milliseconds" ,
4645 Help : "Close session latency in milliseconds, including all plugins, as a gauge" ,
4746 },
4847 )
4948
5049 pluginSchedulingLatency = promauto .NewGaugeVec (
5150 prometheus.GaugeOpts {
52- Subsystem : RunaiNamespace ,
51+ Subsystem : subsystemName ,
5352 Name : "plugin_scheduling_latency_milliseconds" ,
5453 Help : "Plugin scheduling latency in milliseconds, as a gauge" ,
5554 }, []string {"plugin" , "OnSession" })
5655
5756 actionSchedulingLatency = promauto .NewGaugeVec (
5857 prometheus.GaugeOpts {
59- Subsystem : RunaiNamespace ,
58+ Subsystem : subsystemName ,
6059 Name : "action_scheduling_latency_milliseconds" ,
6160 Help : "Action scheduling latency in milliseconds, as a gauge" ,
6261 }, []string {"action" })
6362
6463 taskSchedulingLatency = promauto .NewHistogram (
6564 prometheus.HistogramOpts {
66- Subsystem : RunaiNamespace ,
65+ Subsystem : subsystemName ,
6766 Name : "task_scheduling_latency_milliseconds" ,
6867 Help : "Task scheduling latency in milliseconds" ,
6968 Buckets : prometheus .ExponentialBuckets (5 , 2 , 10 ),
7271
7372 taskBindLatency = promauto .NewHistogram (
7473 prometheus.HistogramOpts {
75- Subsystem : RunaiNamespace ,
74+ Subsystem : subsystemName ,
7675 Name : "task_bind_latency_milliseconds" ,
7776 Help : "Task bind latency histogram in milliseconds" ,
7877 Buckets : prometheus .ExponentialBuckets (5 , 2 , 10 ),
@@ -81,55 +80,55 @@ var (
8180
8281 podgroupsScheduledByAction = promauto .NewCounterVec (
8382 prometheus.CounterOpts {
84- Subsystem : RunaiNamespace ,
83+ Subsystem : subsystemName ,
8584 Name : "podgroups_scheduled_by_action" ,
8685 Help : "Count of podgroups scheduled per action" ,
8786 }, []string {"action" })
8887
8988 podgroupsConsideredByAction = promauto .NewCounterVec (
9089 prometheus.CounterOpts {
91- Subsystem : RunaiNamespace ,
90+ Subsystem : subsystemName ,
9291 Name : "podgroups_acted_on_by_action" ,
9392 Help : "Count of podgroups tried per action" ,
9493 }, []string {"action" })
9594
9695 scenariosSimulatedByAction = promauto .NewCounterVec (
9796 prometheus.CounterOpts {
98- Subsystem : RunaiNamespace ,
97+ Subsystem : subsystemName ,
9998 Name : "scenarios_simulation_by_action" ,
10099 Help : "Count of scenarios simulated per action" ,
101100 }, []string {"action" })
102101
103102 scenariosFilteredByAction = promauto .NewCounterVec (
104103 prometheus.CounterOpts {
105- Subsystem : RunaiNamespace ,
104+ Subsystem : subsystemName ,
106105 Name : "scenarios_filtered_by_action" ,
107106 Help : "Count of scenarios filtered per action" ,
108107 }, []string {"action" })
109108
110109 preemptionAttempts = promauto .NewCounter (
111110 prometheus.CounterOpts {
112- Subsystem : RunaiNamespace ,
111+ Subsystem : subsystemName ,
113112 Name : "total_preemption_attempts" ,
114113 Help : "Total preemption attempts in the cluster till now" ,
115114 },
116115 )
117116
118117 queueFairShareCPU = promauto .NewGaugeVec (
119118 prometheus.GaugeOpts {
120- Subsystem : RunaiNamespace ,
119+ Subsystem : subsystemName ,
121120 Name : "queue_fair_share_cpu_cores" ,
122121 Help : "CPU Fair share of queue, as a gauge. Value is in Cores" ,
123122 }, []string {"queue_name" })
124123 queueFairShareMemory = promauto .NewGaugeVec (
125124 prometheus.GaugeOpts {
126- Subsystem : RunaiNamespace ,
125+ Subsystem : subsystemName ,
127126 Name : "queue_fair_share_memory_gb" ,
128127 Help : "Memory Fair share of queue, as a gauge. Value is in GB" ,
129128 }, []string {"queue_name" })
130129 queueFairShareGPU = promauto .NewGaugeVec (
131130 prometheus.GaugeOpts {
132- Subsystem : RunaiNamespace ,
131+ Subsystem : subsystemName ,
133132 Name : "queue_fair_share_gpu" ,
134133 Help : "GPU Fair share of queue, as a gauge. Values in GPU devices" ,
135134 }, []string {"queue_name" })
@@ -168,6 +167,10 @@ func UpdateTaskScheduleDuration(duration time.Duration) {
168167 taskSchedulingLatency .Observe (float64 (duration .Milliseconds ()))
169168}
170169
// SetSubSystemName stores name in the package-level subsystemName variable.
//
// NOTE(review): the metrics visible in this diff pass subsystemName as their
// Subsystem from inside package-level var initializers (promauto.New...).
// Go evaluates those initializers during package initialization, before any
// importing package can call this function, so subsystemName is still ""
// when the options structs are built. A later call here therefore does not
// appear to rename the already-registered metrics, and the prefix previously
// supplied by the removed RunaiNamespace constant would be lost. Confirm, and
// consider constructing the metrics from this function (or from an explicit
// initialization function that receives the name) instead.
170+ func SetSubSystemName (name string ) {
171+ subsystemName = name
172+ }
173+
// SetCurrentAction stores action in the package-level currentAction variable.
171174func SetCurrentAction (action string ) {
172175 currentAction = action
173176}
0 commit comments