1 hafta önce · 73d55a3b22
--- a/core/pkg/source/datasource.go
+++ b/core/pkg/source/datasource.go
@@ -93,6 +93,33 @@ type MetricsQuerier interface {
 
															 	QueryDCGMContainerUsageAvg(start, end time.Time) *Future[DCGMDeviceContainerUsageResult]
														
 
															 	QueryDCGMContainerUsageMax(start, end time.Time) *Future[DCGMDeviceContainerUsageResult]
														
 
															+	// GPU saturation (USE method). Sources return no results when the
														
 
															+	// underlying DCGM fields are unavailable; absence is never zero.
														
 
															+	QueryGPUThrottleViolationRatio(start, end time.Time) *Future[GPUSaturationResult]
														
 
															+	QueryGPUThrottleReasonRatio(start, end time.Time) *Future[GPUSaturationResult]
														
 
															+	QueryGPUMemoryUsedRatioAvg(start, end time.Time) *Future[GPUSaturationResult]
														
 
															+	QueryGPUMemoryUsedRatioMax(start, end time.Time) *Future[GPUSaturationResult]
														
 
															+	QueryGPUMemoryPressureRatio(start, end time.Time) *Future[GPUSaturationResult]
														
 
															+	QueryGPUXIDErrorCount(start, end time.Time) *Future[GPUSaturationResult]
														
 
															+	QueryGPUDRAMActiveAvg(start, end time.Time) *Future[GPUSaturationResult]
														
 
															+	QueryGPUDRAMActiveMax(start, end time.Time) *Future[GPUSaturationResult]
														
 
															+	QueryGPUSMActiveAvg(start, end time.Time) *Future[GPUSaturationResult]
														
 
															+	QueryGPUSMOccupancyAvg(start, end time.Time) *Future[GPUSaturationResult]
														
 
															+	QueryGPUPCIeTxBytesAvg(start, end time.Time) *Future[GPUSaturationResult]
														
 
															+	QueryGPUPCIeRxBytesAvg(start, end time.Time) *Future[GPUSaturationResult]
														
 
															+	QueryGPUNVLinkTxBytesAvg(start, end time.Time) *Future[GPUSaturationResult]
														
 
															+	QueryGPUNVLinkRxBytesAvg(start, end time.Time) *Future[GPUSaturationResult]
														
 
															+
														
 
															+	// Device-level GPU metrics (DeviceInfo / DevicePerformance support):
														
 
															+	// grouped by device identity only, all from the default dcgm-exporter
														
 
															+	// configuration
														
 
															+	QueryGPUDevicePowerAvg(start, end time.Time) *Future[GPUDeviceMetricResult]
														
 
															+	QueryGPUDeviceTempAvg(start, end time.Time) *Future[GPUDeviceMetricResult]
														
 
															+	QueryGPUDeviceUsageAvg(start, end time.Time) *Future[GPUDeviceMetricResult]
														
 
															+	QueryGPUDeviceUsageMax(start, end time.Time) *Future[GPUDeviceMetricResult]
														
 
															+	QueryGPUDeviceMemoryUsedAvg(start, end time.Time) *Future[GPUDeviceMetricResult]
														
 
															+	QueryGPUDeviceMemoryUsedMax(start, end time.Time) *Future[GPUDeviceMetricResult]
														
 
															+
														
 
															 	// PVC
														
 
															 	QueryPodPVCAllocation(start, end time.Time) *Future[PodPVCAllocationResult]
														
 
															 	QueryPVCBytesRequested(start, end time.Time) *Future[PVCBytesRequestedResult]
														
--- a/core/pkg/source/decoders.go
+++ b/core/pkg/source/decoders.go
@@ -46,6 +46,9 @@ const (
 
															 	HostNameLabel        = "Hostname"
														
 
															 	UUIDLabel            = "UUID"
														
 
															 	ResourceLabel        = "resource"
														
 
															+	ReasonLabel          = "reason"
														
 
															+	MIGProfileLabel      = "GPU_I_PROFILE"
														
 
															+	MIGInstanceLabel     = "GPU_I_ID"
														
 
															 	DeploymentLabel      = "deployment"
														
 
															 	StatefulSetLabel     = "statefulSet"
														
 
															 	DaemonSetLabel       = "daemonset"
														
@@ -1090,6 +1093,72 @@ func DecodeGPUInfoResult(result *QueryResult) *GPUInfoResult {
 
															 	}
														
 
															 }
														
 
															+// GPUSaturationResult is the shared result shape for every GPU saturation
														
 
															+// query. The signal queried (throttle ratio, memory pressure, etc.) is
														
 
															+// determined by the DataSource method that produced the result; Reason is
														
 
															+// only populated by the throttle queries, and the MIG labels only when
														
 
															+// dcgm-exporter reports MIG instances as distinct devices.
														
 
															+// GPUDeviceMetricResult is the result shape for device-level GPU metric
														
 
															+// queries (power, temperature, device-level utilization, memory used).
														
 
															+// It shares GPUSaturationResult's label decoding: device identity plus MIG
														
 
															+// instance labels; container attribution fields stay empty for
														
 
															+// device-level groupings.
														
 
															+type GPUDeviceMetricResult = GPUSaturationResult
														
 
															+
														
 
															+// DecodeGPUDeviceMetricResult decodes a device-level GPU metric result.
														
 
															+func DecodeGPUDeviceMetricResult(result *QueryResult) *GPUDeviceMetricResult {
														
 
															+	return DecodeGPUSaturationResult(result)
														
 
															+}
														
 
															+
														
 
															+type GPUSaturationResult struct {
														
 
															+	UID         string
														
 
															+	Cluster     string
														
 
															+	Namespace   string
														
 
															+	Pod         string
														
 
															+	Container   string
														
 
															+	Device      string
														
 
															+	ModelName   string
														
 
															+	UUID        string
														
 
															+	MIGProfile  string
														
 
															+	MIGInstance string
														
 
															+	Reason      string
														
 
															+	Data        []*util.Vector
														
 
															+}
														
 
															+
														
 
															+func DecodeGPUSaturationResult(result *QueryResult) *GPUSaturationResult {
														
 
															+	// DCGM series carry the pod UID as pod_uid in the kubemodel scrape
														
 
															+	// convention; fall back to the legacy uid label for older configs
														
 
															+	uid, err := result.GetString(PodUIDLabel)
														
 
															+	if err != nil {
														
 
															+		uid, _ = result.GetString(UIDLabel)
														
 
															+	}
														
 
															+	cluster, _ := result.GetCluster()
														
 
															+	namespace, _ := result.GetNamespace()
														
 
															+	pod, _ := result.GetPod()
														
 
															+	container, _ := result.GetContainer()
														
 
															+	device, _ := result.GetString(DeviceLabel)
														
 
															+	modelName, _ := result.GetString(ModelNameLabel)
														
 
															+	uuid, _ := result.GetString(UUIDLabel)
														
 
															+	migProfile, _ := result.GetString(MIGProfileLabel)
														
 
															+	migInstance, _ := result.GetString(MIGInstanceLabel)
														
 
															+	reason, _ := result.GetString(ReasonLabel)
														
 
															+
														
 
															+	return &GPUSaturationResult{
														
 
															+		UID:         uid,
														
 
															+		Cluster:     cluster,
														
 
															+		Namespace:   namespace,
														
 
															+		Pod:         pod,
														
 
															+		Container:   container,
														
 
															+		Device:      device,
														
 
															+		ModelName:   modelName,
														
 
															+		UUID:        uuid,
														
 
															+		MIGProfile:  migProfile,
														
 
															+		MIGInstance: migInstance,
														
 
															+		Reason:      reason,
														
 
															+		Data:        result.Values,
														
 
															+	}
														
 
															+}
														
 
															+
														
 
															 type IsGPUSharedResult struct {
														
 
															 	UID       string
														
 
															 	Cluster   string
														
--- a/core/pkg/source/decoders_test.go
+++ b/core/pkg/source/decoders_test.go
@@ -0,0 +1,93 @@
 
															+package source
														
 
															+
														
 
															+import (
														
 
															+	"testing"
														
 
															+
														
 
															+	"github.com/opencost/opencost/core/pkg/util"
														
 
															+)
														
 
															+
														
 
															+func TestDecodeGPUSaturationResult(t *testing.T) {
														
 
															+	values := []*util.Vector{{Timestamp: 1000, Value: 0.25}}
														
 
															+
														
 
															+	t.Run("all labels present", func(t *testing.T) {
														
 
															+		result := NewQueryResult(map[string]any{
														
 
															+			"pod_uid":       "pod-uid-1",
														
 
															+			"cluster_id":    "cluster-1",
														
 
															+			"namespace":     "gpu-ns",
														
 
															+			"pod":           "gpu-pod",
														
 
															+			"container":     "gpu-container",
														
 
															+			"device":        "nvidia0",
														
 
															+			"modelName":     "NVIDIA A100-SXM4-40GB",
														
 
															+			"UUID":          "GPU-1234",
														
 
															+			"GPU_I_PROFILE": "1g.5gb",
														
 
															+			"GPU_I_ID":      "3",
														
 
															+			"reason":        "sw_power_cap",
														
 
															+		}, values, nil)
														
 
															+
														
 
															+		decoded := DecodeGPUSaturationResult(result)
														
 
															+
														
 
															+		if decoded.UID != "pod-uid-1" {
														
 
															+			t.Errorf("UID = %q, want %q", decoded.UID, "pod-uid-1")
														
 
															+		}
														
 
															+		if decoded.Cluster != "cluster-1" {
														
 
															+			t.Errorf("Cluster = %q, want %q", decoded.Cluster, "cluster-1")
														
 
															+		}
														
 
															+		if decoded.Namespace != "gpu-ns" {
														
 
															+			t.Errorf("Namespace = %q, want %q", decoded.Namespace, "gpu-ns")
														
 
															+		}
														
 
															+		if decoded.Pod != "gpu-pod" {
														
 
															+			t.Errorf("Pod = %q, want %q", decoded.Pod, "gpu-pod")
														
 
															+		}
														
 
															+		if decoded.Container != "gpu-container" {
														
 
															+			t.Errorf("Container = %q, want %q", decoded.Container, "gpu-container")
														
 
															+		}
														
 
															+		if decoded.Device != "nvidia0" {
														
 
															+			t.Errorf("Device = %q, want %q", decoded.Device, "nvidia0")
														
 
															+		}
														
 
															+		if decoded.ModelName != "NVIDIA A100-SXM4-40GB" {
														
 
															+			t.Errorf("ModelName = %q, want %q", decoded.ModelName, "NVIDIA A100-SXM4-40GB")
														
 
															+		}
														
 
															+		if decoded.UUID != "GPU-1234" {
														
 
															+			t.Errorf("UUID = %q, want %q", decoded.UUID, "GPU-1234")
														
 
															+		}
														
 
															+		if decoded.MIGProfile != "1g.5gb" {
														
 
															+			t.Errorf("MIGProfile = %q, want %q", decoded.MIGProfile, "1g.5gb")
														
 
															+		}
														
 
															+		if decoded.MIGInstance != "3" {
														
 
															+			t.Errorf("MIGInstance = %q, want %q", decoded.MIGInstance, "3")
														
 
															+		}
														
 
															+		if decoded.Reason != "sw_power_cap" {
														
 
															+			t.Errorf("Reason = %q, want %q", decoded.Reason, "sw_power_cap")
														
 
															+		}
														
 
															+		if len(decoded.Data) != 1 || decoded.Data[0].Value != 0.25 {
														
 
															+			t.Errorf("Data not passed through: %+v", decoded.Data)
														
 
															+		}
														
 
															+	})
														
 
															+
														
 
															+	t.Run("optional labels absent", func(t *testing.T) {
														
 
															+		// non-MIG GPU without a reason-labeled query: those labels simply
														
 
															+		// do not exist on the series and must decode to empty strings
														
 
															+		// legacy scrape configs label the pod UID as "uid"; the decoder
														
 
															+		// falls back to it when pod_uid is absent
														
 
															+		result := NewQueryResult(map[string]any{
														
 
															+			"uid":        "pod-uid-1",
														
 
															+			"cluster_id": "cluster-1",
														
 
															+			"namespace":  "gpu-ns",
														
 
															+			"pod":        "gpu-pod",
														
 
															+			"container":  "gpu-container",
														
 
															+			"UUID":       "GPU-1234",
														
 
															+		}, values, nil)
														
 
															+
														
 
															+		decoded := DecodeGPUSaturationResult(result)
														
 
															+
														
 
															+		if decoded.MIGProfile != "" || decoded.MIGInstance != "" || decoded.Reason != "" {
														
 
															+			t.Errorf("expected absent labels to decode to empty strings, got %+v", decoded)
														
 
															+		}
														
 
															+		if decoded.Device != "" || decoded.ModelName != "" {
														
 
															+			t.Errorf("expected absent device labels to decode to empty strings, got %+v", decoded)
														
 
															+		}
														
 
															+		if decoded.UUID != "GPU-1234" {
														
 
															+			t.Errorf("UUID = %q, want %q", decoded.UUID, "GPU-1234")
														
 
															+		}
														
 
															+	})
														
 
															+}
														
--- a/modules/collector-source/pkg/collector/collector.go
+++ b/modules/collector-source/pkg/collector/collector.go
@@ -74,6 +74,12 @@ func NewOpenCostMetricStore() metric.MetricStore {
 
															 	memStore.Register(NewDCGMUptimeMetricCollector())
														
 
															 	memStore.Register(NewDCGMContainerUsageAvgMetricCollector())
														
 
															 	memStore.Register(NewDCGMContainerUsageMaxMetricCollector())
														
 
															+	for _, gpuSaturationCollector := range NewGPUSaturationMetricCollectors() {
														
 
															+		memStore.Register(gpuSaturationCollector)
														
 
															+	}
														
 
															+	for _, gpuDeviceCollector := range NewGPUDeviceMetricCollectors() {
														
 
															+		memStore.Register(gpuDeviceCollector)
														
 
															+	}
														
 
															 	memStore.Register(NewNodeCPUPricePerHourMetricCollector())
														
 
															 	memStore.Register(NewNodeRAMPricePerGiBHourMetricCollector())
														
 
															 	memStore.Register(NewNodeGPUPricePerHourMetricCollector())
														
--- a/modules/collector-source/pkg/collector/datasource.go
+++ b/modules/collector-source/pkg/collector/datasource.go
@@ -88,6 +88,7 @@ func NewCollectorDataSource(
 
															 		updater,
														
 
															 		synthetic.NewContainerMemoryAllocationSynthesizer(),
														
 
															 		synthetic.NewContainerCpuAllocationSynthesizer(),
														
 
															+		synthetic.NewGPUMemoryUsedRatioSynthesizer(),
														
 
															 	)
														
 
															 	updater = metricSynthesizer
														
--- a/modules/collector-source/pkg/collector/gpusaturation.go
+++ b/modules/collector-source/pkg/collector/gpusaturation.go
@@ -0,0 +1,150 @@
 
															+package collector
														
 
															+
														
 
															+import (
														
 
															+	coreenv "github.com/opencost/opencost/core/pkg/env"
														
 
															+	"github.com/opencost/opencost/core/pkg/opencost"
														
 
															+	"github.com/opencost/opencost/core/pkg/source"
														
 
															+	"github.com/opencost/opencost/modules/collector-source/pkg/metric"
														
 
															+	"github.com/opencost/opencost/modules/collector-source/pkg/metric/aggregator"
														
 
															+)
														
 
															+
														
 
															+// GPU saturation collectors
														
 
															+//
														
 
															+// These collectors aggregate USE-method GPU saturation signals from
														
 
															+// dcgm-exporter scrapes. When a DCGM field is absent from the scrape (not in
														
 
															+// the exporter config, or no DCP profiling support) the corresponding
														
 
															+// collector simply accumulates nothing and its query returns no results,
														
 
															+// which downstream treats as "signal absent" rather than zero.
														
 
															+
														
 
															+// gpuSaturationLabels is the label set shared by every GPU saturation
														
 
															+// collector: container attribution, GPU identity, and MIG instance labels.
														
 
															+// Labels absent from a scrape resolve to empty strings.
														
 
															+var gpuSaturationLabels = []string{
														
 
															+	source.NamespaceLabel,
														
 
															+	source.PodLabel,
														
 
															+	source.PodUIDLabel,
														
 
															+	source.ContainerLabel,
														
 
															+	source.DeviceLabel,
														
 
															+	source.ModelNameLabel,
														
 
															+	source.UUIDLabel,
														
 
															+	source.MIGProfileLabel,
														
 
															+	source.MIGInstanceLabel,
														
 
															+}
														
 
															+
														
 
															+func gpuSaturationFilter(labels map[string]string) bool {
														
 
															+	return labels[source.ContainerLabel] != ""
														
 
															+}
														
 
															+
														
 
															+// gpuThrottleViolationCollectorMetrics maps each violation collector ID to
														
 
															+// its DCGM source metric. The counters accumulate microseconds spent
														
 
															+// throttled; the querier converts the windowed increase into a fraction of
														
 
															+// the window and tags the reason.
														
 
															+var gpuThrottleViolationCollectors = []struct {
														
 
															+	ID     metric.MetricCollectorID
														
 
															+	Metric string
														
 
															+	Reason string
														
 
															+}{
														
 
															+	{ID: metric.GPUThrottleViolationPowerID, Metric: metric.DCGMFIDEVPOWERVIOLATION, Reason: opencost.GPUThrottleViolationPower},
														
 
															+	{ID: metric.GPUThrottleViolationThermalID, Metric: metric.DCGMFIDEVTHERMALVIOLATION, Reason: opencost.GPUThrottleViolationThermal},
														
 
															+	{ID: metric.GPUThrottleViolationSyncBoostID, Metric: metric.DCGMFIDEVSYNCBOOSTVIOLATION, Reason: opencost.GPUThrottleViolationSyncBoost},
														
 
															+	{ID: metric.GPUThrottleViolationBoardLimitID, Metric: metric.DCGMFIDEVBOARDLIMITVIOLATION, Reason: opencost.GPUThrottleViolationBoardLimit},
														
 
															+}
														
 
															+
														
 
															+// gpuThrottleBitmaskMetrics enumerates both names of the DCGM clock throttle
														
 
															+// reasons bitmask field (renamed in DCGM 3.3+); at most one is scraped per
														
 
															+// dcgm-exporter version, so only one family of collectors ever accumulates
														
 
															+// data and the querier's merge of both ID families is effectively a union
														
 
															+// with one empty side. Registering per-name collectors was chosen over
														
 
															+// renaming at scrape time because the TargetScraper is a generic
														
 
															+// name-filtered pipe with no transform hook; if scrape-time normalization
														
 
															+// is ever added, collapse this to the canonical name and halve the
														
 
															+// collectors.
														
 
															+var gpuThrottleBitmaskMetrics = []string{
														
 
															+	metric.DCGMFIDEVCLOCKTHROTTLEREASONS,
														
 
															+	metric.DCGMFIDEVCLOCKSEVENTREASONS,
														
 
															+}
														
 
															+
														
 
															+func newGPUSaturationCollector(id metric.MetricCollectorID, metricName string, factory aggregator.MetricAggregatorFactory) *metric.MetricCollector {
														
 
															+	return metric.NewMetricCollector(
														
 
															+		id,
														
 
															+		metricName,
														
 
															+		gpuSaturationLabels,
														
 
															+		factory,
														
 
															+		gpuSaturationFilter,
														
 
															+	)
														
 
															+}
														
 
															+
														
 
															+// gpuDeviceLabels groups device-level metrics by device identity (and MIG
														
 
															+// instance) without container attribution: power, temperature, and
														
 
															+// device-level utilization describe the whole device regardless of which
														
 
															+// containers share it.
														
 
															+var gpuDeviceLabels = []string{
														
 
															+	source.DeviceLabel,
														
 
															+	source.ModelNameLabel,
														
 
															+	source.UUIDLabel,
														
 
															+	source.MIGProfileLabel,
														
 
															+	source.MIGInstanceLabel,
														
 
															+}
														
 
															+
														
 
															+func newGPUDeviceCollector(id metric.MetricCollectorID, metricName string, factory aggregator.MetricAggregatorFactory) *metric.MetricCollector {
														
 
															+	return metric.NewMetricCollector(id, metricName, gpuDeviceLabels, factory, nil)
														
 
															+}
														
 
															+
														
 
															+// NewGPUDeviceMetricCollectors returns the collectors backing the
														
 
															+// DeviceInfo / DevicePerformance contracts: power, temperature,
														
 
															+// device-level compute utilization, and framebuffer used.
														
 
															+func NewGPUDeviceMetricCollectors() []*metric.MetricCollector {
														
 
															+	return []*metric.MetricCollector{
														
 
															+		newGPUDeviceCollector(metric.GPUDevicePowerAvgID, metric.DCGMFIDEVPOWERUSAGE, aggregator.AverageOverTime),
														
 
															+		newGPUDeviceCollector(metric.GPUDeviceTempAvgID, metric.DCGMFIDEVGPUTEMP, aggregator.AverageOverTime),
														
 
															+		newGPUDeviceCollector(metric.GPUDeviceUsageAvgID, metric.DCGMFIPROFGRENGINEACTIVE, aggregator.AverageOverTime),
														
 
															+		newGPUDeviceCollector(metric.GPUDeviceUsageMaxID, metric.DCGMFIPROFGRENGINEACTIVE, aggregator.MaxOverTime),
														
 
															+		newGPUDeviceCollector(metric.GPUDeviceMemoryUsedAvgID, metric.DCGMFIDEVFBUSED, aggregator.AverageOverTime),
														
 
															+		newGPUDeviceCollector(metric.GPUDeviceMemoryUsedMaxID, metric.DCGMFIDEVFBUSED, aggregator.MaxOverTime),
														
 
															+	}
														
 
															+}
														
 
															+
														
 
															+// NewGPUSaturationMetricCollectors returns every collector needed for the
														
 
															+// GPU saturation signals.
														
 
															+func NewGPUSaturationMetricCollectors() []*metric.MetricCollector {
														
 
															+	collectors := []*metric.MetricCollector{
														
 
															+		// framebuffer occupancy over the synthetic per-sample ratio metric
														
 
															+		// joined from FB_USED/FB_FREE at scrape time (see
														
 
															+		// synthetic.GPUMemoryUsedRatioSynthesizer)
														
 
															+		newGPUSaturationCollector(metric.GPUMemoryUsedAvgID, metric.OpencostGPUMemoryUsedRatio, aggregator.AverageOverTime),
														
 
															+		newGPUSaturationCollector(metric.GPUMemoryUsedMaxID, metric.OpencostGPUMemoryUsedRatio, aggregator.MaxOverTime),
														
 
															+		newGPUSaturationCollector(metric.GPUMemoryPressureRatioID, metric.OpencostGPUMemoryUsedRatio, aggregator.AboveThresholdRatio(coreenv.GetGPUMemorySaturationThreshold())),
														
 
															+		// XID error events: count value transitions of the last-error gauge
														
 
															+		newGPUSaturationCollector(metric.GPUXIDErrorCountID, metric.DCGMFIDEVXIDERRORS, aggregator.Changes),
														
 
															+		// DCP profiling gauges
														
 
															+		newGPUSaturationCollector(metric.GPUDRAMActiveAvgID, metric.DCGMFIPROFDRAMACTIVE, aggregator.AverageOverTime),
														
 
															+		newGPUSaturationCollector(metric.GPUDRAMActiveMaxID, metric.DCGMFIPROFDRAMACTIVE, aggregator.MaxOverTime),
														
 
															+		newGPUSaturationCollector(metric.GPUSMActiveAvgID, metric.DCGMFIPROFSMACTIVE, aggregator.AverageOverTime),
														
 
															+		newGPUSaturationCollector(metric.GPUSMOccupancyAvgID, metric.DCGMFIPROFSMOCCUPANCY, aggregator.AverageOverTime),
														
 
															+		// DCP byte counters as average bytes/sec
														
 
															+		newGPUSaturationCollector(metric.GPUPCIeTxBytesAvgID, metric.DCGMFIPROFPCIETXBYTES, aggregator.Rate),
														
 
															+		newGPUSaturationCollector(metric.GPUPCIeRxBytesAvgID, metric.DCGMFIPROFPCIERXBYTES, aggregator.Rate),
														
 
															+		newGPUSaturationCollector(metric.GPUNVLinkTxBytesAvgID, metric.DCGMFIPROFNVLINKTXBYTES, aggregator.Rate),
														
 
															+		newGPUSaturationCollector(metric.GPUNVLinkRxBytesAvgID, metric.DCGMFIPROFNVLINKRXBYTES, aggregator.Rate),
														
 
															+	}
														
 
															+
														
 
															+	// throttle violation counters: windowed increase, normalized by the
														
 
															+	// querier
														
 
															+	for _, violation := range gpuThrottleViolationCollectors {
														
 
															+		collectors = append(collectors, newGPUSaturationCollector(violation.ID, violation.Metric, aggregator.Increase))
														
 
															+	}
														
 
															+
														
 
															+	// throttle reasons bitmask: one bit-ratio collector per
														
 
															+	// (metric name, saturation-relevant reason)
														
 
															+	for _, metricName := range gpuThrottleBitmaskMetrics {
														
 
															+		for _, reason := range opencost.GPUThrottleReasons {
														
 
															+			collectors = append(collectors, newGPUSaturationCollector(
														
 
															+				metric.GPUThrottleReasonCollectorID(metricName, reason.Name),
														
 
															+				metricName,
														
 
															+				aggregator.BitSetRatio(reason.Bit),
														
 
															+			))
														
 
															+		}
														
 
															+	}
														
 
															+
														
 
															+	return collectors
														
 
															+}
														
--- a/modules/collector-source/pkg/collector/gpusaturationquerier.go
+++ b/modules/collector-source/pkg/collector/gpusaturationquerier.go
@@ -0,0 +1,202 @@
 
															+package collector
														
 
															+
														
 
import (
	"fmt"
	"sort"
	"time"

	"github.com/opencost/opencost/core/pkg/opencost"
	"github.com/opencost/opencost/core/pkg/source"
	"github.com/opencost/opencost/modules/collector-source/pkg/metric"
	"github.com/opencost/opencost/modules/collector-source/pkg/metric/aggregator"
)
														
 
															+
														
 
															+// GPU saturation queries over the collector store. These mirror the
														
 
															+// prometheus-source queries: same DataSource method names, same
														
 
															+// GPUSaturationResult semantics. Signals whose DCGM field was never scraped
														
 
															+// produce no results, which downstream treats as absent rather than zero.
														
 
															+
														
 
															+// gpuSaturationResultsFuture wraps a set of MetricResults into the shared
														
 
															+// GPUSaturationResult future shape.
														
 
															+func gpuSaturationResultsFuture(name string, results []*aggregator.MetricResult, err error) *source.Future[source.GPUSaturationResult] {
														
 
															+	queryResults := source.NewQueryResults(name)
														
 
															+	queryResults.Error = err
														
 
															+	for _, result := range results {
														
 
															+		queryResults.Results = append(queryResults.Results, result.ToQueryResult())
														
 
															+	}
														
 
															+	ch := make(source.QueryResultsChan, 1)
														
 
															+	ch <- queryResults
														
 
															+	return source.NewFuture(source.DecodeGPUSaturationResult, ch)
														
 
															+}
														
 
															+
														
 
															+// queryGPUReasonTagged queries one collector per reason, tags each result
														
 
															+// with the reason label, and optionally transforms every value.
														
 
															+func (c *collectorMetricsQuerier) queryGPUReasonTagged(name string, start, end time.Time, idReasons map[metric.MetricCollectorID]string, transform func(float64) float64) *source.Future[source.GPUSaturationResult] {
														
 
															+	var tagged []*aggregator.MetricResult
														
 
															+	var firstErr error
														
 
															+
														
 
															+	collector := c.collectorProvider.GetStore(start, end)
														
 
															+	if collector != nil {
														
 
															+		for id, reason := range idReasons {
														
 
															+			results, err := collector.Query(id)
														
 
															+			if err != nil {
														
 
															+				if firstErr == nil {
														
 
															+					firstErr = err
														
 
															+				}
														
 
															+				continue
														
 
															+			}
														
 
															+			for _, result := range results {
														
 
															+				if result.MetricLabels == nil {
														
 
															+					result.MetricLabels = map[string]string{}
														
 
															+				}
														
 
															+				result.MetricLabels[source.ReasonLabel] = reason
														
 
															+				if transform != nil {
														
 
															+					for i := range result.Values {
														
 
															+						result.Values[i].Value = transform(result.Values[i].Value)
														
 
															+					}
														
 
															+				}
														
 
															+				tagged = append(tagged, result)
														
 
															+			}
														
 
															+		}
														
 
															+	}
														
 
															+
														
 
															+	return gpuSaturationResultsFuture(name, tagged, firstErr)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUThrottleViolationRatio reports the fraction of the window each GPU
														
 
															+// spent throttled, per reason, from the DCGM violation microsecond counters.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUThrottleViolationRatio(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	idReasons := make(map[metric.MetricCollectorID]string, len(gpuThrottleViolationCollectors))
														
 
															+	for _, violation := range gpuThrottleViolationCollectors {
														
 
															+		idReasons[violation.ID] = violation.Reason
														
 
															+	}
														
 
															+
														
 
															+	windowMicros := float64(end.Sub(start).Microseconds())
														
 
															+	if windowMicros <= 0 {
														
 
															+		return gpuSaturationResultsFuture("GPUThrottleViolationRatio", nil, fmt.Errorf("invalid window for GPUThrottleViolationRatio: %s to %s", start, end))
														
 
															+	}
														
 
															+
														
 
															+	return c.queryGPUReasonTagged("GPUThrottleViolationRatio", start, end, idReasons, func(increaseMicros float64) float64 {
														
 
															+		return increaseMicros / windowMicros
														
 
															+	})
														
 
															+}
														
 
															+
														
 
															+// QueryGPUThrottleReasonRatio reports the fraction of scraped samples in
														
 
															+// which each saturation-relevant bit of the clock throttle reasons bitmask
														
 
															+// was set. Both DCGM field names are queried; at most one is ever scraped.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUThrottleReasonRatio(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	idReasons := make(map[metric.MetricCollectorID]string, 2*len(opencost.GPUThrottleReasons))
														
 
															+	for _, metricName := range gpuThrottleBitmaskMetrics {
														
 
															+		for _, reason := range opencost.GPUThrottleReasons {
														
 
															+			idReasons[metric.GPUThrottleReasonCollectorID(metricName, reason.Name)] = reason.Name
														
 
															+		}
														
 
															+	}
														
 
															+	return c.queryGPUReasonTagged("GPUThrottleReasonRatio", start, end, idReasons, nil)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUMemoryUsedRatioAvg reports average framebuffer occupancy over the
														
 
															+// window: FB_USED / (FB_USED + FB_FREE), aggregated from the per-sample
														
 
															+// occupancy ratio synthesized at scrape time.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUMemoryUsedRatioAvg(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUMemoryUsedAvgID, source.DecodeGPUSaturationResult)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUMemoryUsedRatioMax reports peak framebuffer occupancy over the
														
 
															+// window.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUMemoryUsedRatioMax(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUMemoryUsedMaxID, source.DecodeGPUSaturationResult)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUMemoryPressureRatio reports the fraction of scraped samples in
														
 
															+// which framebuffer occupancy was at or above the configured threshold,
														
 
															+// from the same synthesized per-sample occupancy ratio.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUMemoryPressureRatio(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUMemoryPressureRatioID, source.DecodeGPUSaturationResult)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUXIDErrorCount reports the number of XID error transitions
														
 
															+// observed in the window.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUXIDErrorCount(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUXIDErrorCountID, source.DecodeGPUSaturationResult)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUDRAMActiveAvg reports the average ratio of cycles the device
														
 
															+// memory interface was active. Requires DCP profiling.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUDRAMActiveAvg(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUDRAMActiveAvgID, source.DecodeGPUSaturationResult)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUDRAMActiveMax reports the peak ratio of cycles the device memory
														
 
															+// interface was active. Requires DCP profiling.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUDRAMActiveMax(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUDRAMActiveMaxID, source.DecodeGPUSaturationResult)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUSMActiveAvg reports the average ratio of cycles at least one warp
														
 
															+// was resident on any SM. Requires DCP profiling and explicit enablement.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUSMActiveAvg(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUSMActiveAvgID, source.DecodeGPUSaturationResult)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUSMOccupancyAvg reports the average ratio of resident warps to the
														
 
															+// SM maximum. Requires DCP profiling and explicit enablement.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUSMOccupancyAvg(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUSMOccupancyAvgID, source.DecodeGPUSaturationResult)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUPCIeTxBytesAvg reports average PCIe transmit throughput in
														
 
															+// bytes/sec. Requires DCP profiling.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUPCIeTxBytesAvg(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUPCIeTxBytesAvgID, source.DecodeGPUSaturationResult)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUPCIeRxBytesAvg reports average PCIe receive throughput in
														
 
															+// bytes/sec. Requires DCP profiling.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUPCIeRxBytesAvg(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUPCIeRxBytesAvgID, source.DecodeGPUSaturationResult)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUNVLinkTxBytesAvg reports average NVLink transmit throughput in
														
 
															+// bytes/sec. Requires DCP profiling and explicit enablement.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUNVLinkTxBytesAvg(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUNVLinkTxBytesAvgID, source.DecodeGPUSaturationResult)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUNVLinkRxBytesAvg reports average NVLink receive throughput in
														
 
															+// bytes/sec. Requires DCP profiling and explicit enablement.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUNVLinkRxBytesAvg(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUNVLinkRxBytesAvgID, source.DecodeGPUSaturationResult)
														
 
															+}
														
 
															+
														
 
															+// Device-level GPU metric queries (DeviceInfo / DevicePerformance support).
														
 
															+
														
 
															+// QueryGPUDevicePowerAvg reports average device power draw in watts.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUDevicePowerAvg(start, end time.Time) *source.Future[source.GPUDeviceMetricResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUDevicePowerAvgID, source.DecodeGPUDeviceMetricResult)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUDeviceTempAvg reports average device temperature in Celsius.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUDeviceTempAvg(start, end time.Time) *source.Future[source.GPUDeviceMetricResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUDeviceTempAvgID, source.DecodeGPUDeviceMetricResult)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUDeviceUsageAvg reports average device-level compute utilization
														
 
															+// as a 0-1 ratio.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUDeviceUsageAvg(start, end time.Time) *source.Future[source.GPUDeviceMetricResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUDeviceUsageAvgID, source.DecodeGPUDeviceMetricResult)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUDeviceUsageMax reports peak device-level compute utilization as a
														
 
															+// 0-1 ratio.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUDeviceUsageMax(start, end time.Time) *source.Future[source.GPUDeviceMetricResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUDeviceUsageMaxID, source.DecodeGPUDeviceMetricResult)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUDeviceMemoryUsedAvg reports average framebuffer used in MiB.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUDeviceMemoryUsedAvg(start, end time.Time) *source.Future[source.GPUDeviceMetricResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUDeviceMemoryUsedAvgID, source.DecodeGPUDeviceMetricResult)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUDeviceMemoryUsedMax reports peak framebuffer used in MiB.
														
 
															+func (c *collectorMetricsQuerier) QueryGPUDeviceMemoryUsedMax(start, end time.Time) *source.Future[source.GPUDeviceMetricResult] {
														
 
															+	return queryCollector(c, start, end, metric.GPUDeviceMemoryUsedMaxID, source.DecodeGPUDeviceMetricResult)
														
 
															+}
														
--- a/modules/collector-source/pkg/collector/gpusaturationquerier_test.go
+++ b/modules/collector-source/pkg/collector/gpusaturationquerier_test.go
@@ -0,0 +1,235 @@
 
															+package collector
														
 
															+
														
 
															+import (
														
 
															+	"math"
														
 
															+	"testing"
														
 
															+	"time"
														
 
															+
														
 
															+	"github.com/opencost/opencost/core/pkg/opencost"
														
 
															+	"github.com/opencost/opencost/core/pkg/source"
														
 
															+	"github.com/opencost/opencost/modules/collector-source/pkg/metric"
														
 
															+)
														
 
															+
														
 
															+// gpuSaturationMockProvider builds a store with one hour of DCGM saturation
														
 
															+// samples for a single GPU container. SM_ACTIVE, SM_OCCUPANCY, and NVLink
														
 
															+// metrics are deliberately never updated to exercise absent-signal behavior.
														
 
															+func gpuSaturationMockProvider(t *testing.T) (StoreProvider, time.Time, time.Time) {
														
 
															+	t.Helper()
														
 
															+	t.Setenv("GPU_MEMORY_SATURATION_THRESHOLD", "0.6")
														
 
															+
														
 
															+	start, _ := time.Parse(time.RFC3339, Start1Str)
														
 
															+	end, _ := time.Parse(time.RFC3339, End1Str)
														
 
															+
														
 
															+	gpuInfo := map[string]string{
														
 
															+		source.NamespaceLabel:   "namespace1",
														
 
															+		source.PodLabel:         "pod1",
														
 
															+		source.PodUIDLabel:      "pod-uuid1",
														
 
															+		source.ContainerLabel:   "container1",
														
 
															+		source.DeviceLabel:      "nvidia0",
														
 
															+		source.ModelNameLabel:   "Tesla T4",
														
 
															+		source.UUIDLabel:        "GPU-1",
														
 
															+		source.MIGProfileLabel:  "",
														
 
															+		source.MIGInstanceLabel: "",
														
 
															+	}
														
 
															+
														
 
															+	store := NewOpenCostMetricStore()
														
 
															+
														
 
															+	// power violation counter: 1.8e9us accumulated over a 3.6e9us window
														
 
															+	store.Update(metric.DCGMFIDEVPOWERVIOLATION, gpuInfo, 0, start, nil)
														
 
															+	store.Update(metric.DCGMFIDEVPOWERVIOLATION, gpuInfo, 1.8e9, end, nil)
														
 
															+
														
 
															+	// throttle bitmask (legacy field name): sw_power_cap set in 1 of 2 samples
														
 
															+	store.Update(metric.DCGMFIDEVCLOCKTHROTTLEREASONS, gpuInfo, 0x4, start, nil)
														
 
															+	store.Update(metric.DCGMFIDEVCLOCKTHROTTLEREASONS, gpuInfo, 0x0, end, nil)
														
 
															+
														
 
															+	// framebuffer occupancy ratio, as synthesized from FB_USED/FB_FREE per
														
 
															+	// scrape by GPUMemoryUsedRatioSynthesizer (see synthetic package tests
														
 
															+	// for the join itself): avg 0.625, max 0.75, half of samples >= 0.6
														
 
															+	store.Update(metric.OpencostGPUMemoryUsedRatio, gpuInfo, 0.5, start, nil)
														
 
															+	store.Update(metric.OpencostGPUMemoryUsedRatio, gpuInfo, 0.75, end, nil)
														
 
															+
														
 
															+	// one XID error transition
														
 
															+	store.Update(metric.DCGMFIDEVXIDERRORS, gpuInfo, 0, start, nil)
														
 
															+	store.Update(metric.DCGMFIDEVXIDERRORS, gpuInfo, 13, end, nil)
														
 
															+
														
 
															+	// DRAM activity gauge
														
 
															+	store.Update(metric.DCGMFIPROFDRAMACTIVE, gpuInfo, 0.5, start, nil)
														
 
															+	store.Update(metric.DCGMFIPROFDRAMACTIVE, gpuInfo, 0.7, end, nil)
														
 
															+
														
 
															+	// PCIe tx counter: 3.6e12 bytes over 3600s = 1e9 bytes/sec
														
 
															+	store.Update(metric.DCGMFIPROFPCIETXBYTES, gpuInfo, 0, start, nil)
														
 
															+	store.Update(metric.DCGMFIPROFPCIETXBYTES, gpuInfo, 3.6e12, end, nil)
														
 
															+
														
 
															+	return &MockStoreProvider{metricsCollector: store}, start, end
														
 
															+}
														
 
															+
														
 
															+func awaitGPUSaturation(t *testing.T, f *source.Future[source.GPUSaturationResult]) []*source.GPUSaturationResult {
														
 
															+	t.Helper()
														
 
															+	res, err := f.Await()
														
 
															+	if err != nil {
														
 
															+		t.Fatalf("unexpected error: %v", err)
														
 
															+	}
														
 
															+	return res
														
 
															+}
														
 
															+
														
 
															+func requireValue(t *testing.T, results []*source.GPUSaturationResult, want float64) {
														
 
															+	t.Helper()
														
 
															+	if len(results) != 1 {
														
 
															+		t.Fatalf("expected 1 result, got %d", len(results))
														
 
															+	}
														
 
															+	got := results[0].Data[0].Value
														
 
															+	if math.Abs(got-want) > 1e-9 {
														
 
															+		t.Errorf("value = %v, want %v", got, want)
														
 
															+	}
														
 
															+	if results[0].UUID != "GPU-1" || results[0].Container != "container1" {
														
 
															+		t.Errorf("result lost GPU identity labels: %+v", results[0])
														
 
															+	}
														
 
															+}
														
 
															+
														
 
															+func TestCollectorMetricsQuerier_GPUThrottleViolationRatio(t *testing.T) {
														
 
															+	provider, start, end := gpuSaturationMockProvider(t)
														
 
															+	c := collectorMetricsQuerier{collectorProvider: provider}
														
 
															+
														
 
															+	results := awaitGPUSaturation(t, c.QueryGPUThrottleViolationRatio(start, end))
														
 
															+
														
 
															+	// only the power violation counter was scraped
														
 
															+	requireValue(t, results, 0.5)
														
 
															+	if results[0].Reason != opencost.GPUThrottleViolationPower {
														
 
															+		t.Errorf("Reason = %q, want %q", results[0].Reason, opencost.GPUThrottleViolationPower)
														
 
															+	}
														
 
															+}
														
 
															+
														
 
															+func TestCollectorMetricsQuerier_GPUThrottleReasonRatio(t *testing.T) {
														
 
															+	provider, start, end := gpuSaturationMockProvider(t)
														
 
															+	c := collectorMetricsQuerier{collectorProvider: provider}
														
 
															+
														
 
															+	results := awaitGPUSaturation(t, c.QueryGPUThrottleReasonRatio(start, end))
														
 
															+
														
 
															+	// the legacy bitmask field was scraped, so every reason bit reports
														
 
															+	got := map[string]float64{}
														
 
															+	for _, res := range results {
														
 
															+		got[res.Reason] = res.Data[0].Value
														
 
															+	}
														
 
															+	if len(got) != len(opencost.GPUThrottleReasons) {
														
 
															+		t.Fatalf("expected %d reasons, got %d: %v", len(opencost.GPUThrottleReasons), len(got), got)
														
 
															+	}
														
 
															+	for _, reason := range opencost.GPUThrottleReasons {
														
 
															+		want := 0.0
														
 
															+		if reason.Name == opencost.GPUThrottleReasonSwPowerCap {
														
 
															+			want = 0.5
														
 
															+		}
														
 
															+		if math.Abs(got[reason.Name]-want) > 1e-9 {
														
 
															+			t.Errorf("reason %q ratio = %v, want %v", reason.Name, got[reason.Name], want)
														
 
															+		}
														
 
															+	}
														
 
															+}
														
 
															+
														
 
															+func TestCollectorMetricsQuerier_GPUMemoryUsedRatio(t *testing.T) {
														
 
															+	provider, start, end := gpuSaturationMockProvider(t)
														
 
															+	c := collectorMetricsQuerier{collectorProvider: provider}
														
 
															+
														
 
															+	// avg of per-sample ratios (0.5, 0.75)
														
 
															+	requireValue(t, awaitGPUSaturation(t, c.QueryGPUMemoryUsedRatioAvg(start, end)), 0.625)
														
 
															+	// max of per-sample ratios
														
 
															+	requireValue(t, awaitGPUSaturation(t, c.QueryGPUMemoryUsedRatioMax(start, end)), 0.75)
														
 
															+}
														
 
															+
														
 
															+func TestCollectorMetricsQuerier_GPUMemoryPressureRatio(t *testing.T) {
														
 
															+	provider, start, end := gpuSaturationMockProvider(t)
														
 
															+	c := collectorMetricsQuerier{collectorProvider: provider}
														
 
															+
														
 
															+	// threshold configured to 0.6: one of two samples (0.75) is at or above
														
 
															+	requireValue(t, awaitGPUSaturation(t, c.QueryGPUMemoryPressureRatio(start, end)), 0.5)
														
 
															+}
														
 
															+
														
 
															+func TestCollectorMetricsQuerier_GPUXIDErrorCount(t *testing.T) {
														
 
															+	provider, start, end := gpuSaturationMockProvider(t)
														
 
															+	c := collectorMetricsQuerier{collectorProvider: provider}
														
 
															+
														
 
															+	requireValue(t, awaitGPUSaturation(t, c.QueryGPUXIDErrorCount(start, end)), 1)
														
 
															+}
														
 
															+
														
 
															+func TestCollectorMetricsQuerier_GPUDRAMActive(t *testing.T) {
														
 
															+	provider, start, end := gpuSaturationMockProvider(t)
														
 
															+	c := collectorMetricsQuerier{collectorProvider: provider}
														
 
															+
														
 
															+	requireValue(t, awaitGPUSaturation(t, c.QueryGPUDRAMActiveAvg(start, end)), 0.6)
														
 
															+	requireValue(t, awaitGPUSaturation(t, c.QueryGPUDRAMActiveMax(start, end)), 0.7)
														
 
															+}
														
 
															+
														
 
															+func TestCollectorMetricsQuerier_GPUPCIeTxBytesAvg(t *testing.T) {
														
 
															+	provider, start, end := gpuSaturationMockProvider(t)
														
 
															+	c := collectorMetricsQuerier{collectorProvider: provider}
														
 
															+
														
 
															+	requireValue(t, awaitGPUSaturation(t, c.QueryGPUPCIeTxBytesAvg(start, end)), 1e9)
														
 
															+}
														
 
															+
														
 
															+// TestCollectorMetricsQuerier_GPUDeviceMetrics verifies the device-level
														
 
															+// queries aggregate from the device-labeled DCGM series.
														
 
															+func TestCollectorMetricsQuerier_GPUDeviceMetrics(t *testing.T) {
														
 
															+	start, _ := time.Parse(time.RFC3339, Start1Str)
														
 
															+	end, _ := time.Parse(time.RFC3339, End1Str)
														
 
															+
														
 
															+	deviceInfo := map[string]string{
														
 
															+		source.DeviceLabel:      "nvidia0",
														
 
															+		source.ModelNameLabel:   "Tesla T4",
														
 
															+		source.UUIDLabel:        "GPU-1",
														
 
															+		source.MIGProfileLabel:  "",
														
 
															+		source.MIGInstanceLabel: "",
														
 
															+	}
														
 
															+	store := NewOpenCostMetricStore()
														
 
															+	store.Update(metric.DCGMFIDEVPOWERUSAGE, deviceInfo, 120, start, nil)
														
 
															+	store.Update(metric.DCGMFIDEVPOWERUSAGE, deviceInfo, 160, end, nil)
														
 
															+	store.Update(metric.DCGMFIDEVGPUTEMP, deviceInfo, 55, start, nil)
														
 
															+	store.Update(metric.DCGMFIPROFGRENGINEACTIVE, deviceInfo, 0.4, start, nil)
														
 
															+	store.Update(metric.DCGMFIPROFGRENGINEACTIVE, deviceInfo, 0.9, end, nil)
														
 
															+	store.Update(metric.DCGMFIDEVFBUSED, deviceInfo, 1024, start, nil)
														
 
															+	store.Update(metric.DCGMFIDEVFBUSED, deviceInfo, 2048, end, nil)
														
 
															+
														
 
															+	c := collectorMetricsQuerier{collectorProvider: &MockStoreProvider{metricsCollector: store}}
														
 
															+
														
 
															+	checks := map[string]struct {
														
 
															+		future *source.Future[source.GPUDeviceMetricResult]
														
 
															+		want   float64
														
 
															+	}{
														
 
															+		"power avg":  {c.QueryGPUDevicePowerAvg(start, end), 140},
														
 
															+		"temp avg":   {c.QueryGPUDeviceTempAvg(start, end), 55},
														
 
															+		"usage avg":  {c.QueryGPUDeviceUsageAvg(start, end), 0.65},
														
 
															+		"usage max":  {c.QueryGPUDeviceUsageMax(start, end), 0.9},
														
 
															+		"memory avg": {c.QueryGPUDeviceMemoryUsedAvg(start, end), 1536},
														
 
															+		"memory max": {c.QueryGPUDeviceMemoryUsedMax(start, end), 2048},
														
 
															+	}
														
 
															+	for name, check := range checks {
														
 
															+		results := awaitGPUSaturation(t, check.future)
														
 
															+		if len(results) != 1 {
														
 
															+			t.Fatalf("%s: expected 1 result, got %d", name, len(results))
														
 
															+		}
														
 
															+		if got := results[0].Data[0].Value; math.Abs(got-check.want) > 1e-9 {
														
 
															+			t.Errorf("%s = %v, want %v", name, got, check.want)
														
 
															+		}
														
 
															+		if results[0].UUID != "GPU-1" {
														
 
															+			t.Errorf("%s: lost device identity: %+v", name, results[0])
														
 
															+		}
														
 
															+	}
														
 
															+}
														
 
															+
														
 
															+// TestCollectorMetricsQuerier_GPUSaturationAbsentSignals verifies that
														
 
															+// signals whose DCGM fields were never scraped return no results instead of
														
 
															+// zeroes.
														
 
															+func TestCollectorMetricsQuerier_GPUSaturationAbsentSignals(t *testing.T) {
														
 
															+	provider, start, end := gpuSaturationMockProvider(t)
														
 
															+	c := collectorMetricsQuerier{collectorProvider: provider}
														
 
															+
														
 
															+	absent := map[string]*source.Future[source.GPUSaturationResult]{
														
 
															+		"SMActiveAvg":      c.QueryGPUSMActiveAvg(start, end),
														
 
															+		"SMOccupancyAvg":   c.QueryGPUSMOccupancyAvg(start, end),
														
 
															+		"PCIeRxBytesAvg":   c.QueryGPUPCIeRxBytesAvg(start, end),
														
 
															+		"NVLinkTxBytesAvg": c.QueryGPUNVLinkTxBytesAvg(start, end),
														
 
															+		"NVLinkRxBytesAvg": c.QueryGPUNVLinkRxBytesAvg(start, end),
														
 
															+	}
														
 
															+	for name, future := range absent {
														
 
															+		if results := awaitGPUSaturation(t, future); len(results) != 0 {
														
 
															+			t.Errorf("%s: expected no results for unscraped metric, got %d", name, len(results))
														
 
															+		}
														
 
															+	}
														
 
															+}
														
--- a/modules/collector-source/pkg/metric/aggregator/abovethresholdratio.go
+++ b/modules/collector-source/pkg/metric/aggregator/abovethresholdratio.go
@@ -0,0 +1,68 @@
 
															+package aggregator
														
 
															+
														
 
															+import (
														
 
															+	"math"
														
 
															+	"sync"
														
 
															+	"time"
														
 
															+)
														
 
															+
														
 
															+// aboveThresholdRatioAggregator is a MetricAggregator reporting which
															+// fraction of the samples it has seen had a value at or above a fixed
															+// threshold. Consecutive updates sharing a timestamp are folded into one
															+// sample. It backs time-over-threshold pressure signals such as GPU memory
															+// pressure.
															+type aboveThresholdRatioAggregator struct {
															+	// lock is held by Update and Value while they touch the counters.
															+	lock sync.Mutex
															+
															+	// labelValues is handed back unchanged by LabelValues.
															+	labelValues []string
															+	// threshold is the inclusive lower bound a value must reach to count.
															+	threshold float64
															+
															+	// count is the number of samples seen (one per run of equal timestamps).
															+	count int
															+	// aboveCount is the number of samples with a value >= threshold.
															+	aboveCount int
															+
															+	// currentTime is the timestamp of the sample being accumulated; it is
															+	// nil until the first update arrives.
															+	currentTime *time.Time
															+	// currentHit records that the current sample is already in aboveCount.
															+	currentHit bool
															+}
														
 
															+
														
 
															+// AboveThresholdRatio builds a MetricAggregatorFactory. Each aggregator the
															+// factory creates reports the fraction of its samples whose value was
															+// >= threshold.
															+func AboveThresholdRatio(threshold float64) MetricAggregatorFactory {
															+	newAggregator := func(labelValues []string) MetricAggregator {
															+		agg := new(aboveThresholdRatioAggregator)
															+		agg.labelValues = labelValues
															+		agg.threshold = threshold
															+		return agg
															+	}
															+	return newAggregator
															+}
														
 
															+
														
 
															+// AdditionInfo always returns nil: this aggregator attaches no additional
															+// info to its value.
															+func (a *aboveThresholdRatioAggregator) AdditionInfo() map[string]string {
															+	return nil
															+}
														
 
															+
														
 
															+// LabelValues returns the label values stored on the aggregator. The slice
															+// is returned as-is, not copied.
															+func (a *aboveThresholdRatioAggregator) LabelValues() []string {
															+	return a.labelValues
															+}
														
 
															+
														
 
															+// Update records one observation. An update whose timestamp differs from
															+// the previous update's timestamp opens a new sample; further updates with
															+// the same timestamp belong to that sample. A sample counts as "above" at
															+// most once, as soon as any of its values is >= the threshold. NaN values
															+// never count as above. additionalInfo is ignored.
															+func (a *aboveThresholdRatioAggregator) Update(value float64, timestamp time.Time, additionalInfo map[string]string) {
															+	a.lock.Lock()
															+	defer a.lock.Unlock()
															+
															+	if startsNewSample := a.currentTime == nil || !timestamp.Equal(*a.currentTime); startsNewSample {
															+		a.count++
															+		a.currentHit = false
															+		a.currentTime = &timestamp
															+	}
															+
															+	atOrAbove := value >= a.threshold && !math.IsNaN(value)
															+	if !atOrAbove || a.currentHit {
															+		return
															+	}
															+	a.currentHit = true
															+	a.aboveCount++
															+}
														
 
															+
														
 
															+func (a *aboveThresholdRatioAggregator) Value() []MetricValue {
														
 
															+	a.lock.Lock()
														
 
															+	defer a.lock.Unlock()
														
 
															+	if a.count == 0 {
														
 
															+		return []MetricValue{{Value: 0}}
														
 
															+	}
														
 
															+	return []MetricValue{
														
 
															+		{Value: float64(a.aboveCount) / float64(a.count)},
														
 
															+	}
														
 
															+}
														
--- a/modules/collector-source/pkg/metric/aggregator/abovethresholdratio_test.go
+++ b/modules/collector-source/pkg/metric/aggregator/abovethresholdratio_test.go
@@ -0,0 +1,83 @@
 
															+package aggregator
														
 
															+
														
 
															+import (
														
 
															+	"math"
														
 
															+	"reflect"
														
 
															+	"testing"
														
 
															+	"time"
														
 
															+)
														
 
															+
														
 
															+// TestAboveThresholdRatioAggregator_Value feeds table-driven sample
															+// sequences into an AboveThresholdRatio aggregator and compares Value()
															+// against the expected ratio.
															+func TestAboveThresholdRatioAggregator_Value(t *testing.T) {
															+	// minute returns a fixed instant m minutes past the reference time.
															+	minute := func(m int) time.Time {
															+		return time.Date(1, 1, 1, 0, m, 0, 0, time.UTC)
															+	}
															+
															+	type sample struct {
															+		value float64
															+		at    time.Time
															+	}
															+	cases := map[string]struct {
															+		threshold float64
															+		samples   []sample
															+		want      []MetricValue
															+	}{
															+		"no update": {
															+			threshold: 0.9,
															+			samples:   []sample{},
															+			want:      []MetricValue{{Value: 0}},
															+		},
															+		"all above": {
															+			threshold: 0.9,
															+			samples: []sample{
															+				{value: 0.95, at: minute(0)},
															+				{value: 0.99, at: minute(1)},
															+			},
															+			want: []MetricValue{{Value: 1}},
															+		},
															+		"threshold is inclusive": {
															+			threshold: 0.9,
															+			samples:   []sample{{value: 0.9, at: minute(0)}},
															+			want:      []MetricValue{{Value: 1}},
															+		},
															+		"quarter above": {
															+			threshold: 0.9,
															+			samples: []sample{
															+				{value: 0.95, at: minute(0)},
															+				{value: 0.5, at: minute(1)},
															+				{value: 0.89, at: minute(2)},
															+				{value: 0.1, at: minute(3)},
															+			},
															+			want: []MetricValue{{Value: 0.25}},
															+		},
															+		"duplicate timestamp counts once": {
															+			threshold: 0.9,
															+			samples: []sample{
															+				{value: 0.95, at: minute(0)},
															+				{value: 0.1, at: minute(0)},
															+				{value: 0.1, at: minute(1)},
															+			},
															+			want: []MetricValue{{Value: 0.5}},
															+		},
															+		"NaN counts as below": {
															+			threshold: 0.9,
															+			samples: []sample{
															+				{value: math.NaN(), at: minute(0)},
															+				{value: 0.95, at: minute(1)},
															+			},
															+			want: []MetricValue{{Value: 0.5}},
															+		},
															+	}
															+
															+	for name, tc := range cases {
															+		t.Run(name, func(t *testing.T) {
															+			agg := AboveThresholdRatio(tc.threshold)([]string{})
															+			for _, s := range tc.samples {
															+				agg.Update(s.value, s.at, nil)
															+			}
															+			got := agg.Value()
															+			if reflect.DeepEqual(got, tc.want) {
															+				return
															+			}
															+			t.Errorf("Value() = %v, want %v", got, tc.want)
															+		})
															+	}
															+}
														
--- a/modules/collector-source/pkg/metric/aggregator/bitsetratio.go
+++ b/modules/collector-source/pkg/metric/aggregator/bitsetratio.go
@@ -0,0 +1,71 @@
 
															+package aggregator
														
 
															+
														
 
															+import (
														
 
															+	"math"
														
 
															+	"sync"
														
 
															+	"time"
														
 
															+)
														
 
															+
														
 
															+// bitSetRatioAggregator is a MetricAggregator that interprets each sample
															+// value as an integer bitmask and reports the fraction of samples in which
															+// a given bit was set. Consecutive updates sharing a timestamp are folded
															+// into one sample. It is used to derive the fraction of a window a GPU
															+// spent throttled for a specific reason from the DCGM clock throttle
															+// reasons bitmask.
															+type bitSetRatioAggregator struct {
															+	// lock is held by Update and Value while they touch the counters.
															+	lock sync.Mutex
															+
															+	// labelValues is handed back unchanged by LabelValues.
															+	labelValues []string
															+	// bit is the mask ANDed with each sample value.
															+	bit uint64
															+
															+	// count is the number of samples seen (one per run of equal timestamps).
															+	count int
															+	// setCount is the number of samples in which the bit was set.
															+	setCount int
															+
															+	// currentTime is the timestamp of the sample being accumulated; it is
															+	// nil until the first update arrives.
															+	currentTime *time.Time
															+	// currentSet records that the current sample is already in setCount.
															+	currentSet bool
															+}
														
 
															+
														
 
															+// BitSetRatio builds a MetricAggregatorFactory. Each aggregator the
															+// factory creates reports the fraction of its samples that had the given
															+// bit set.
															+func BitSetRatio(bit uint64) MetricAggregatorFactory {
															+	newAggregator := func(labelValues []string) MetricAggregator {
															+		agg := new(bitSetRatioAggregator)
															+		agg.labelValues = labelValues
															+		agg.bit = bit
															+		return agg
															+	}
															+	return newAggregator
															+}
														
 
															+
														
 
															+// AdditionInfo always returns nil: this aggregator attaches no additional
															+// info to its value.
															+func (a *bitSetRatioAggregator) AdditionInfo() map[string]string {
															+	return nil
															+}
														
 
															+
														
 
															+// LabelValues returns the label values stored on the aggregator. The slice
															+// is returned as-is, not copied.
															+func (a *bitSetRatioAggregator) LabelValues() []string {
															+	return a.labelValues
															+}
														
 
															+
														
 
															+func (a *bitSetRatioAggregator) Update(value float64, timestamp time.Time, additionalInfo map[string]string) {
														
 
															+	a.lock.Lock()
														
 
															+	defer a.lock.Unlock()
														
 
															+
														
 
															+	// NaN or negative values cannot be valid bitmasks; count the sample as
														
 
															+	// bit-clear rather than guessing
														
 
															+	set := !math.IsNaN(value) && value >= 0 && uint64(value)&a.bit != 0
														
 
															+
														
 
															+	if a.currentTime == nil || !timestamp.Equal(*a.currentTime) {
														
 
															+		a.currentTime = &timestamp
														
 
															+		a.currentSet = false
														
 
															+		a.count++
														
 
															+	}
														
 
															+	if set && !a.currentSet {
														
 
															+		a.currentSet = true
														
 
															+		a.setCount++
														
 
															+	}
														
 
															+}
														
 
															+
														
 
															+func (a *bitSetRatioAggregator) Value() []MetricValue {
														
 
															+	a.lock.Lock()
														
 
															+	defer a.lock.Unlock()
														
 
															+	if a.count == 0 {
														
 
															+		return []MetricValue{{Value: 0}}
														
 
															+	}
														
 
															+	return []MetricValue{
														
 
															+		{Value: float64(a.setCount) / float64(a.count)},
														
 
															+	}
														
 
															+}
														
--- a/modules/collector-source/pkg/metric/aggregator/bitsetratio_test.go
+++ b/modules/collector-source/pkg/metric/aggregator/bitsetratio_test.go
@@ -0,0 +1,88 @@
 
															+package aggregator
														
 
															+
														
 
															+import (
														
 
															+	"math"
														
 
															+	"reflect"
														
 
															+	"testing"
														
 
															+	"time"
														
 
															+)
														
 
															+
														
 
															+// TestBitSetRatioAggregator_Value feeds table-driven bitmask sequences into
															+// a BitSetRatio aggregator and compares Value() against the expected ratio.
															+func TestBitSetRatioAggregator_Value(t *testing.T) {
															+	// minute returns a fixed instant m minutes past the reference time.
															+	minute := func(m int) time.Time {
															+		return time.Date(1, 1, 1, 0, m, 0, 0, time.UTC)
															+	}
															+
															+	type sample struct {
															+		value float64
															+		at    time.Time
															+	}
															+	cases := map[string]struct {
															+		bit     uint64
															+		samples []sample
															+		want    []MetricValue
															+	}{
															+		"no update": {
															+			bit:     0x8,
															+			samples: []sample{},
															+			want:    []MetricValue{{Value: 0}},
															+		},
															+		"single sample bit set": {
															+			bit:     0x8,
															+			samples: []sample{{value: 8, at: minute(0)}},
															+			want:    []MetricValue{{Value: 1}},
															+		},
															+		"single sample bit clear": {
															+			bit:     0x8,
															+			samples: []sample{{value: 4, at: minute(0)}},
															+			want:    []MetricValue{{Value: 0}},
															+		},
															+		"half of samples set": {
															+			bit: 0x4,
															+			samples: []sample{
															+				{value: 0x4, at: minute(0)},
															+				{value: 0x0, at: minute(1)},
															+				{value: 0x4 | 0x8, at: minute(2)},
															+				{value: 0x8, at: minute(3)},
															+			},
															+			want: []MetricValue{{Value: 0.5}},
															+		},
															+		"other bits do not count": {
															+			bit: 0x40,
															+			samples: []sample{
															+				{value: 0x1 | 0x2 | 0x4 | 0x8 | 0x10 | 0x20 | 0x80, at: minute(0)},
															+			},
															+			want: []MetricValue{{Value: 0}},
															+		},
															+		"duplicate timestamp counts once": {
															+			bit: 0x4,
															+			samples: []sample{
															+				{value: 0x4, at: minute(0)},
															+				{value: 0x0, at: minute(0)},
															+				{value: 0x0, at: minute(1)},
															+			},
															+			want: []MetricValue{{Value: 0.5}},
															+		},
															+		"invalid values are treated as bit clear": {
															+			bit: 0x4,
															+			samples: []sample{
															+				{value: math.NaN(), at: minute(0)},
															+				{value: -4, at: minute(1)},
															+				{value: 0x4, at: minute(2)},
															+			},
															+			want: []MetricValue{{Value: 1.0 / 3.0}},
															+		},
															+	}
															+
															+	for name, tc := range cases {
															+		t.Run(name, func(t *testing.T) {
															+			agg := BitSetRatio(tc.bit)([]string{})
															+			for _, s := range tc.samples {
															+				agg.Update(s.value, s.at, nil)
															+			}
															+			got := agg.Value()
															+			if reflect.DeepEqual(got, tc.want) {
															+				return
															+			}
															+			t.Errorf("Value() = %v, want %v", got, tc.want)
															+		})
															+	}
															+}
														
--- a/modules/collector-source/pkg/metric/aggregator/changes.go
+++ b/modules/collector-source/pkg/metric/aggregator/changes.go
@@ -0,0 +1,56 @@
 
															+package aggregator
														
 
															+
														
 
															+import (
														
 
															+	"sync"
														
 
															+	"time"
														
 
															+)
														
 
															+
														
 
															+// changesAggregator is a MetricAggregator counting how often the sample
															+// value differs from the previously accepted sample's value, modeled on
															+// PromQL's changes(). Updates are expected in timestamp order: an update
															+// whose timestamp is not strictly after the last accepted one (out-of-order
															+// or duplicate) is ignored.
															+type changesAggregator struct {
															+	// lock is held by Update and Value while they touch the state below.
															+	lock sync.Mutex
															+
															+	// labelValues is handed back unchanged by LabelValues.
															+	labelValues []string
															+
															+	// initialized is false until the first sample has been accepted.
															+	initialized bool
															+	// lastValue and lastTime describe the most recently accepted sample.
															+	lastValue float64
															+	lastTime  time.Time
															+
															+	// changes is the running count of value transitions.
															+	changes float64
															+}
														
 
															+
														
 
															+// Changes returns a MetricAggregator for the given label values that counts
															+// how many times the sample value changed between consecutive samples.
															+func Changes(labelValues []string) MetricAggregator {
															+	agg := new(changesAggregator)
															+	agg.labelValues = labelValues
															+	return agg
															+}
														
 
															+
														
 
															+// AdditionInfo always returns nil: this aggregator attaches no additional
															+// info to its value.
															+func (a *changesAggregator) AdditionInfo() map[string]string {
															+	return nil
															+}
														
 
															+
														
 
															+// LabelValues returns the label values stored on the aggregator. The slice
															+// is returned as-is, not copied.
															+func (a *changesAggregator) LabelValues() []string {
															+	return a.labelValues
															+}
														
 
															+
														
 
															+// Update feeds one sample into the aggregator. The first sample only
															+// establishes the baseline. Every later sample must carry a timestamp
															+// strictly after the last accepted one, otherwise it is ignored; an
															+// accepted sample increments the change count when its value differs from
															+// the previous accepted value. As in PromQL's changes(), a NaN following a
															+// NaN is not a change. additionalInfo is ignored.
															+func (a *changesAggregator) Update(value float64, timestamp time.Time, additionalInfo map[string]string) {
															+	a.lock.Lock()
															+	defer a.lock.Unlock()
															+
															+	if a.initialized {
															+		// Out-of-order and duplicate timestamps are dropped.
															+		if !timestamp.After(a.lastTime) {
															+			return
															+		}
															+		// NaN is the only float64 that compares unequal to itself. Without
															+		// this guard every NaN -> NaN step would be counted, because
															+		// NaN != NaN is always true.
															+		bothNaN := value != value && a.lastValue != a.lastValue
															+		if value != a.lastValue && !bothNaN {
															+			a.changes++
															+		}
															+	}
															+	a.initialized = true
															+	a.lastValue = value
															+	a.lastTime = timestamp
															+}
														
 
															+
														
 
															+// Value returns a single MetricValue holding the number of changes counted
															+// so far (0 when fewer than two samples were accepted).
															+func (a *changesAggregator) Value() []MetricValue {
															+	a.lock.Lock()
															+	defer a.lock.Unlock()
															+
															+	total := MetricValue{Value: a.changes}
															+	return []MetricValue{total}
															+}
														
--- a/modules/collector-source/pkg/metric/aggregator/changes_test.go
+++ b/modules/collector-source/pkg/metric/aggregator/changes_test.go
@@ -0,0 +1,75 @@
 
															+package aggregator
														
 
															+
														
 
															+import (
														
 
															+	"reflect"
														
 
															+	"testing"
														
 
															+	"time"
														
 
															+)
														
 
															+
														
 
															+// TestChangesAggregator_Value feeds table-driven sample sequences into a
															+// Changes aggregator and compares Value() against the expected count.
															+func TestChangesAggregator_Value(t *testing.T) {
															+	// minute returns a fixed instant m minutes past the reference time.
															+	minute := func(m int) time.Time {
															+		return time.Date(1, 1, 1, 0, m, 0, 0, time.UTC)
															+	}
															+
															+	type sample struct {
															+		value float64
															+		at    time.Time
															+	}
															+	cases := map[string]struct {
															+		samples []sample
															+		want    []MetricValue
															+	}{
															+		"no update": {
															+			samples: []sample{},
															+			want:    []MetricValue{{Value: 0}},
															+		},
															+		"single sample is zero changes": {
															+			samples: []sample{{value: 13, at: minute(0)}},
															+			want:    []MetricValue{{Value: 0}},
															+		},
															+		"constant value is zero changes": {
															+			samples: []sample{
															+				{value: 0, at: minute(0)},
															+				{value: 0, at: minute(1)},
															+				{value: 0, at: minute(2)},
															+			},
															+			want: []MetricValue{{Value: 0}},
															+		},
															+		"each transition counts": {
															+			samples: []sample{
															+				{value: 0, at: minute(0)},
															+				{value: 13, at: minute(1)},
															+				{value: 13, at: minute(2)},
															+				{value: 31, at: minute(3)},
															+			},
															+			want: []MetricValue{{Value: 2}},
															+		},
															+		"out of order updates are ignored": {
															+			samples: []sample{
															+				{value: 0, at: minute(1)},
															+				{value: 13, at: minute(0)},
															+			},
															+			want: []MetricValue{{Value: 0}},
															+		},
															+		"duplicate timestamp is ignored": {
															+			samples: []sample{
															+				{value: 0, at: minute(0)},
															+				{value: 13, at: minute(0)},
															+			},
															+			want: []MetricValue{{Value: 0}},
															+		},
															+	}
															+
															+	for name, tc := range cases {
															+		t.Run(name, func(t *testing.T) {
															+			agg := Changes([]string{})
															+			for _, s := range tc.samples {
															+				agg.Update(s.value, s.at, nil)
															+			}
															+			got := agg.Value()
															+			if reflect.DeepEqual(got, tc.want) {
															+				return
															+			}
															+			t.Errorf("Value() = %v, want %v", got, tc.want)
															+		})
															+	}
															+}
														
--- a/modules/collector-source/pkg/metric/collector.go
+++ b/modules/collector-source/pkg/metric/collector.go
@@ -75,6 +75,28 @@ const (
 
															 	GPUsAllocatedID                            MetricCollectorID = "GPUsAllocated"
														
 
															 	IsGPUSharedID                              MetricCollectorID = "IsGPUShared"
														
 
															 	GPUInfoID                                  MetricCollectorID = "GPUInfo"
														
 
															+	GPUThrottleViolationPowerID                MetricCollectorID = "GPUThrottleViolationPower"
														
 
															+	GPUThrottleViolationThermalID              MetricCollectorID = "GPUThrottleViolationThermal"
														
 
															+	GPUThrottleViolationSyncBoostID            MetricCollectorID = "GPUThrottleViolationSyncBoost"
														
 
															+	GPUThrottleViolationBoardLimitID           MetricCollectorID = "GPUThrottleViolationBoardLimit"
														
 
															+	GPUMemoryUsedAvgID                         MetricCollectorID = "GPUMemoryUsedAvg"
														
 
															+	GPUMemoryUsedMaxID                         MetricCollectorID = "GPUMemoryUsedMax"
														
 
															+	GPUMemoryPressureRatioID                   MetricCollectorID = "GPUMemoryPressureRatio"
														
 
															+	GPUXIDErrorCountID                         MetricCollectorID = "GPUXIDErrorCount"
														
 
															+	GPUDRAMActiveAvgID                         MetricCollectorID = "GPUDRAMActiveAvg"
														
 
															+	GPUDRAMActiveMaxID                         MetricCollectorID = "GPUDRAMActiveMax"
														
 
															+	GPUSMActiveAvgID                           MetricCollectorID = "GPUSMActiveAvg"
														
 
															+	GPUSMOccupancyAvgID                        MetricCollectorID = "GPUSMOccupancyAvg"
														
 
															+	GPUPCIeTxBytesAvgID                        MetricCollectorID = "GPUPCIeTxBytesAvg"
														
 
															+	GPUPCIeRxBytesAvgID                        MetricCollectorID = "GPUPCIeRxBytesAvg"
														
 
															+	GPUNVLinkTxBytesAvgID                      MetricCollectorID = "GPUNVLinkTxBytesAvg"
														
 
															+	GPUNVLinkRxBytesAvgID                      MetricCollectorID = "GPUNVLinkRxBytesAvg"
														
 
															+	GPUDevicePowerAvgID                        MetricCollectorID = "GPUDevicePowerAvg"
														
 
															+	GPUDeviceTempAvgID                         MetricCollectorID = "GPUDeviceTempAvg"
														
 
															+	GPUDeviceUsageAvgID                        MetricCollectorID = "GPUDeviceUsageAvg"
														
 
															+	GPUDeviceUsageMaxID                        MetricCollectorID = "GPUDeviceUsageMax"
														
 
															+	GPUDeviceMemoryUsedAvgID                   MetricCollectorID = "GPUDeviceMemoryUsedAvg"
														
 
															+	GPUDeviceMemoryUsedMaxID                   MetricCollectorID = "GPUDeviceMemoryUsedMax"
														
 
															 	NodeCPUPricePerHourID                      MetricCollectorID = "NodeCPUPricePerHour"
														
 
															 	NodeRAMPricePerGiBHourID                   MetricCollectorID = "NodeRAMPricePerGiBHour"
														
 
															 	NodeGPUPricePerHourID                      MetricCollectorID = "NodeGPUPricePerHour"
														
@@ -170,6 +192,14 @@ const (
 
															 	ResourceQuotaStatusUsedRAMLimitMaxID       MetricCollectorID = "ResourceQuotaStatusUsedRAMLimitMax"
														
 
															 )
														
 
															+// GPUThrottleReasonCollectorID returns the deterministic collector ID for the
														
 
															+// throttle reason bit collector over the given DCGM bitmask metric name. One
														
 
															+// collector exists per (bitmask metric name, reason) pair because the DCGM
														
 
															+// field was renamed in 3.3+ and only one of the two names is ever scraped.
														
 
															+func GPUThrottleReasonCollectorID(metricName, reason string) MetricCollectorID {
														
 
															+	return MetricCollectorID("GPUThrottleReason/" + metricName + "/" + reason)
														
 
															+}
														
 
															+
														
 
															 // MetricCollector is a data structure that represents a specific MetricCollector metric instance that contains its own breakdown
														
 
															 // of stored metrics by a specific label set.
														
 
															 type MetricCollector struct {
														
--- a/modules/collector-source/pkg/metric/metrics.go
+++ b/modules/collector-source/pkg/metric/metrics.go
@@ -63,6 +63,39 @@ const (
 
															 	DCGMFIPROFGRENGINEACTIVE = "DCGM_FI_PROF_GR_ENGINE_ACTIVE"
														
 
															 	DCGMFIDEVDECUTIL         = "DCGM_FI_DEV_DEC_UTIL"
														
 
															+	// DCGM saturation metrics (default dcgm-exporter configuration)
														
 
															+	DCGMFIDEVPOWERVIOLATION      = "DCGM_FI_DEV_POWER_VIOLATION"
														
 
															+	DCGMFIDEVTHERMALVIOLATION    = "DCGM_FI_DEV_THERMAL_VIOLATION"
														
 
															+	DCGMFIDEVSYNCBOOSTVIOLATION  = "DCGM_FI_DEV_SYNC_BOOST_VIOLATION"
														
 
															+	DCGMFIDEVBOARDLIMITVIOLATION = "DCGM_FI_DEV_BOARD_LIMIT_VIOLATION"
														
 
															+	DCGMFIDEVFBUSED              = "DCGM_FI_DEV_FB_USED"
														
 
															+	DCGMFIDEVFBFREE              = "DCGM_FI_DEV_FB_FREE"
														
 
															+	DCGMFIDEVXIDERRORS           = "DCGM_FI_DEV_XID_ERRORS"
														
 
															+	DCGMFIDEVPOWERUSAGE          = "DCGM_FI_DEV_POWER_USAGE"
														
 
															+	DCGMFIDEVGPUTEMP             = "DCGM_FI_DEV_GPU_TEMP"
														
 
															+
														
 
															+	// DCGM saturation metrics requiring explicit enablement in the
														
 
															+	// dcgm-exporter configuration. The clock throttle reasons bitmask was
														
 
															+	// renamed in DCGM 3.3+; both names are scraped, at most one exists.
														
 
															+	DCGMFIDEVCLOCKTHROTTLEREASONS = "DCGM_FI_DEV_CLOCK_THROTTLE_REASONS"
														
 
															+	DCGMFIDEVCLOCKSEVENTREASONS   = "DCGM_FI_DEV_CLOCKS_EVENT_REASONS"
														
 
															+
														
 
															+	// DCGM DCP profiling saturation metrics (require Volta+ GPUs;
														
 
															+	// SM_ACTIVE, SM_OCCUPANCY, and NVLINK additionally require explicit
														
 
															+	// enablement in the dcgm-exporter configuration)
														
 
															+	DCGMFIPROFDRAMACTIVE    = "DCGM_FI_PROF_DRAM_ACTIVE"
														
 
															+	DCGMFIPROFSMACTIVE      = "DCGM_FI_PROF_SM_ACTIVE"
														
 
															+	DCGMFIPROFSMOCCUPANCY   = "DCGM_FI_PROF_SM_OCCUPANCY"
														
 
															+	DCGMFIPROFPCIETXBYTES   = "DCGM_FI_PROF_PCIE_TX_BYTES"
														
 
															+	DCGMFIPROFPCIERXBYTES   = "DCGM_FI_PROF_PCIE_RX_BYTES"
														
 
															+	DCGMFIPROFNVLINKTXBYTES = "DCGM_FI_PROF_NVLINK_TX_BYTES"
														
 
															+	DCGMFIPROFNVLINKRXBYTES = "DCGM_FI_PROF_NVLINK_RX_BYTES"
														
 
															+
														
 
															+	// Synthetic metrics generated from DCGM scrapes (see pkg/metric/synthetic)
														
 
															+	// OpencostGPUMemoryUsedRatio is the per-sample framebuffer occupancy
														
 
															+	// ratio FB_USED / (FB_USED + FB_FREE), joined per scrape
														
 
															+	OpencostGPUMemoryUsedRatio = "opencost_gpu_memory_used_ratio"
														
 
															+
														
 
															 	// Network Metrics
														
 
															 	KubecostPodNetworkEgressBytesTotal  = "kubecost_pod_network_egress_bytes_total"
														
 
															 	KubecostPodNetworkIngressBytesTotal = "kubecost_pod_network_ingress_bytes_total"
														
--- a/modules/collector-source/pkg/metric/synthetic/gpumemory.go
+++ b/modules/collector-source/pkg/metric/synthetic/gpumemory.go
@@ -0,0 +1,104 @@
 
															+package synthetic
														
 
															+
														
 
															+import (
														
 
															+	"maps"
														
 
															+	"math"
														
 
															+	"strings"
														
 
															+	"time"
														
 
															+
														
 
															+	"github.com/opencost/opencost/core/pkg/source"
														
 
															+	"github.com/opencost/opencost/modules/collector-source/pkg/metric"
														
 
															+)
														
 
															+
														
 
															+// gpuFramebufferSample holds the framebuffer used and free updates seen for
														
 
															+// a single GPU (or MIG instance) and container during one scrape. A field
														
 
															+// is nil until the corresponding metric has been recorded.
														
 
															+type gpuFramebufferSample struct {
														
 
															+	used, free *metric.Update
														
 
															+}
														
 
															+
														
 
															+// GPUMemoryUsedRatioSynthesizer joins DCGM_FI_DEV_FB_USED and
														
 
															+// DCGM_FI_DEV_FB_FREE within each scrape and synthesizes a per-sample
														
 
															+// framebuffer occupancy ratio metric, used / (used + free). Joining per
														
 
															+// scrape is what makes time-over-threshold memory pressure computable
														
 
															+// downstream; post-aggregation joins cannot recover the per-sample ratio.
														
 
															+//
														
 
															+// NOTE(review): no locking is visible on this type; presumably it is driven
														
 
															+// from a single goroutine per scrape - confirm against the caller.
														
 
															+type GPUMemoryUsedRatioSynthesizer struct {
														
 
															+	// byDevice holds the samples recorded since construction or the last
														
 
															+	// Clear, keyed by gpuDeviceKey.
														
 
															+	byDevice map[string]*gpuFramebufferSample
														
 
															+}
														
 
															+
														
 
															+// NewGPUMemoryUsedRatioSynthesizer returns a synthesizer with empty
														
 
															+// per-scrape state, ready to turn the DCGM framebuffer metrics into
														
 
															+// OpencostGPUMemoryUsedRatio updates.
														
 
															+func NewGPUMemoryUsedRatioSynthesizer() *GPUMemoryUsedRatioSynthesizer {
														
 
															+	s := new(GPUMemoryUsedRatioSynthesizer)
														
 
															+	s.byDevice = map[string]*gpuFramebufferSample{}
														
 
															+	return s
														
 
															+}
														
 
															+
														
 
															+// gpuDeviceKey identifies one GPU (or MIG instance) attached to one
														
 
															+// container: dcgm-exporter emits one used/free series per such pairing.
														
 
															+func gpuDeviceKey(labels map[string]string) string {
														
 
															+	return strings.Join([]string{
														
 
															+		labels[source.UUIDLabel],
														
 
															+		labels[source.MIGInstanceLabel],
														
 
															+		labels[source.PodUIDLabel],
														
 
															+		labels[source.ContainerLabel],
														
 
															+	}, "|")
														
 
															+}
														
 
															+
														
 
															+// Process records framebuffer used/free updates; all other metrics are
														
 
															+// ignored.
														
 
															+func (s *GPUMemoryUsedRatioSynthesizer) Process(t time.Time, update *metric.Update) {
														
 
															+	var sample *gpuFramebufferSample
														
 
															+	switch update.Name {
														
 
															+	case metric.DCGMFIDEVFBUSED, metric.DCGMFIDEVFBFREE:
														
 
															+		key := gpuDeviceKey(update.Labels)
														
 
															+		if _, ok := s.byDevice[key]; !ok {
														
 
															+			s.byDevice[key] = &gpuFramebufferSample{}
														
 
															+		}
														
 
															+		sample = s.byDevice[key]
														
 
															+	default:
														
 
															+		return
														
 
															+	}
														
 
															+
														
 
															+	if update.Name == metric.DCGMFIDEVFBUSED {
														
 
															+		sample.used = update
														
 
															+	} else {
														
 
															+		sample.free = update
														
 
															+	}
														
 
															+}
														
 
															+
														
 
															+// Synthesize returns one occupancy ratio update for every device that
														
 
															+// reported both framebuffer metrics in the current scrape. A device is
														
 
															+// skipped when either half is missing, when either value is negative, or
														
 
															+// when used + free is NaN, infinite, or not positive. Each emitted update
														
 
															+// carries a copy of the FB_USED labels. Results follow map iteration order,
														
 
															+// so their order is unspecified.
														
 
															+func (s *GPUMemoryUsedRatioSynthesizer) Synthesize() []metric.Update {
														
 
															+	var ratios []metric.Update
														
 
															+
														
 
															+	for _, pair := range s.byDevice {
														
 
															+		if pair.used == nil || pair.free == nil {
														
 
															+			continue
														
 
															+		}
														
 
															+
														
 
															+		usedFB, freeFB := pair.used.Value, pair.free.Value
														
 
															+		sum := usedFB + freeFB
														
 
															+
														
 
															+		switch {
														
 
															+		case usedFB < 0, freeFB < 0:
														
 
															+			// A negative component can still give a positive sum (e.g.
														
 
															+			// used=100, free=-50) and a ratio above 1, outside the
														
 
															+			// documented [0, 1] occupancy range.
														
 
															+			continue
														
 
															+		case math.IsNaN(sum), math.IsInf(sum, 0), sum <= 0:
														
 
															+			continue
														
 
															+		}
														
 
															+
														
 
															+		ratios = append(ratios, metric.Update{
														
 
															+			Name:   metric.OpencostGPUMemoryUsedRatio,
														
 
															+			Labels: maps.Clone(pair.used.Labels),
														
 
															+			Value:  usedFB / sum,
														
 
															+		})
														
 
															+	}
														
 
															+
														
 
															+	return ratios
														
 
															+}
														
 
															+
														
 
															+// Clear discards everything recorded so far by installing a fresh, empty
														
 
															+// map, so samples never join across scrapes.
														
 
															+func (s *GPUMemoryUsedRatioSynthesizer) Clear() {
														
 
															+	s.byDevice = map[string]*gpuFramebufferSample{}
														
 
															+}
														
--- a/modules/collector-source/pkg/metric/synthetic/gpumemory_test.go
+++ b/modules/collector-source/pkg/metric/synthetic/gpumemory_test.go
@@ -0,0 +1,163 @@
 
															+package synthetic
														
 
															+
														
 
															+import (
														
 
															+	"math"
														
 
															+	"testing"
														
 
															+	"time"
														
 
															+
														
 
															+	"github.com/opencost/opencost/modules/collector-source/pkg/metric"
														
 
															+)
														
 
															+
														
 
															+// capturingUpdater is a test double for the stage that follows the
														
 
															+// synthesizer pipeline: it keeps the UpdateSet it was most recently handed.
														
 
															+type capturingUpdater struct {
														
 
															+	set *metric.UpdateSet
														
 
															+}
														
 
															+
														
 
															+// Update stores set, replacing any previously captured UpdateSet.
														
 
															+func (c *capturingUpdater) Update(set *metric.UpdateSet) {
														
 
															+	c.set = set
														
 
															+}
														
 
															+
														
 
															+// gpuFBUpdate builds an update named name with the given value for the GPU
														
 
															+// identified by uuid and migInstance. The pod, container, and namespace
														
 
															+// labels are fixed, so updates built here differ only by device identity.
														
 
															+func gpuFBUpdate(name string, uuid, migInstance string, value float64) *metric.Update {
														
 
															+	labels := map[string]string{
														
 
															+		"UUID":      uuid,
														
 
															+		"GPU_I_ID":  migInstance,
														
 
															+		"pod_uid":   "pod-uuid1",
														
 
															+		"container": "container1",
														
 
															+		"namespace": "namespace1",
														
 
															+		"pod":       "pod1",
														
 
															+	}
														
 
															+	return &metric.Update{Name: name, Labels: labels, Value: value}
														
 
															+}
														
 
															+
														
 
															+// TestGPUMemoryUsedRatioSynthesizer covers the used/free join, MIG
														
 
															+// separation, rejection of incomplete or invalid samples, dispatch through
														
 
															+// the MetricSynthesizers pipeline, and state reset via Clear.
														
 
															+func TestGPUMemoryUsedRatioSynthesizer(t *testing.T) {
														
 
															+	now := time.Now()
														
 
															+
														
 
															+	t.Run("joins used and free into a ratio", func(t *testing.T) {
														
 
															+		s := NewGPUMemoryUsedRatioSynthesizer()
														
 
															+		s.Process(now, gpuFBUpdate(metric.DCGMFIDEVFBUSED, "GPU-1", "", 12000))
														
 
															+		s.Process(now, gpuFBUpdate(metric.DCGMFIDEVFBFREE, "GPU-1", "", 4000))
														
 
															+
														
 
															+		updates := s.Synthesize()
														
 
															+		if len(updates) != 1 {
														
 
															+			t.Fatalf("expected 1 synthetic update, got %d", len(updates))
														
 
															+		}
														
 
															+		got := updates[0]
														
 
															+		if got.Name != metric.OpencostGPUMemoryUsedRatio {
														
 
															+			t.Errorf("Name = %q, want %q", got.Name, metric.OpencostGPUMemoryUsedRatio)
														
 
															+		}
														
 
															+		if got.Value != 0.75 {
														
 
															+			t.Errorf("Value = %v, want 0.75", got.Value)
														
 
															+		}
														
 
															+		if got.Labels["UUID"] != "GPU-1" || got.Labels["container"] != "container1" {
														
 
															+			t.Errorf("labels not carried through: %v", got.Labels)
														
 
															+		}
														
 
															+	})
														
 
															+
														
 
															+	t.Run("MIG instances synthesize independently", func(t *testing.T) {
														
 
															+		s := NewGPUMemoryUsedRatioSynthesizer()
														
 
															+		s.Process(now, gpuFBUpdate(metric.DCGMFIDEVFBUSED, "GPU-1", "1", 5000))
														
 
															+		s.Process(now, gpuFBUpdate(metric.DCGMFIDEVFBFREE, "GPU-1", "1", 5000))
														
 
															+		s.Process(now, gpuFBUpdate(metric.DCGMFIDEVFBUSED, "GPU-1", "2", 2000))
														
 
															+		s.Process(now, gpuFBUpdate(metric.DCGMFIDEVFBFREE, "GPU-1", "2", 8000))
														
 
															+
														
 
															+		updates := s.Synthesize()
														
 
															+		if len(updates) != 2 {
														
 
															+			t.Fatalf("expected 2 synthetic updates, got %d", len(updates))
														
 
															+		}
														
 
															+		byInstance := map[string]float64{}
														
 
															+		for _, u := range updates {
														
 
															+			byInstance[u.Labels["GPU_I_ID"]] = u.Value
														
 
															+		}
														
 
															+		if byInstance["1"] != 0.5 || byInstance["2"] != 0.2 {
														
 
															+			t.Errorf("per-instance ratios = %v, want {1:0.5, 2:0.2}", byInstance)
														
 
															+		}
														
 
															+	})
														
 
															+
														
 
															+	t.Run("missing half emits nothing", func(t *testing.T) {
														
 
															+		s := NewGPUMemoryUsedRatioSynthesizer()
														
 
															+		s.Process(now, gpuFBUpdate(metric.DCGMFIDEVFBUSED, "GPU-1", "", 12000))
														
 
															+		if updates := s.Synthesize(); len(updates) != 0 {
														
 
															+			t.Errorf("expected no updates without FB_FREE, got %v", updates)
														
 
															+		}
														
 
															+	})
														
 
															+
														
 
															+	t.Run("invalid totals emit nothing", func(t *testing.T) {
														
 
															+		cases := map[string][2]float64{
														
 
															+			"zero total":     {0, 0},
														
 
															+			"negative used":  {-1, 100},
														
 
															+			"NaN free":       {100, math.NaN()},
														
 
															+			"infinite total": {math.Inf(1), 100},
														
 
															+			// negative free with positive total would yield ratio > 1
														
 
															+			// (100/(100-50) = 2.0) if only the total were validated
														
 
															+			"negative free": {100, -50},
														
 
															+		}
														
 
															+		for name, values := range cases {
														
 
															+			s := NewGPUMemoryUsedRatioSynthesizer()
														
 
															+			s.Process(now, gpuFBUpdate(metric.DCGMFIDEVFBUSED, "GPU-1", "", values[0]))
														
 
															+			s.Process(now, gpuFBUpdate(metric.DCGMFIDEVFBFREE, "GPU-1", "", values[1]))
														
 
															+			if updates := s.Synthesize(); len(updates) != 0 {
														
 
															+				t.Errorf("%s: expected no updates, got %v", name, updates)
														
 
															+			}
														
 
															+		}
														
 
															+	})
														
 
															+
														
 
															+	t.Run("unrelated metrics are ignored", func(t *testing.T) {
														
 
															+		s := NewGPUMemoryUsedRatioSynthesizer()
														
 
															+		s.Process(now, gpuFBUpdate(metric.DCGMFIPROFGRENGINEACTIVE, "GPU-1", "", 0.9))
														
 
															+		if updates := s.Synthesize(); len(updates) != 0 {
														
 
															+			t.Errorf("expected no updates for unrelated metric, got %v", updates)
														
 
															+		}
														
 
															+	})
														
 
															+
														
 
															+	t.Run("joins correctly through the MetricSynthesizers pipeline", func(t *testing.T) {
														
 
															+		// Exercises the real dispatch path: MetricSynthesizers.Update copies
														
 
															+		// each Update into a loop-body variable and passes its address to
														
 
															+		// Process. The body-scoped declaration yields a distinct allocation
														
 
															+		// per iteration, so stored pointers never alias; this test pins that
														
 
															+		// by pushing two devices' used/free pairs through one UpdateSet and
														
 
															+		// asserting each synthesized ratio reflects its own samples.
														
 
															+		captured := &capturingUpdater{}
														
 
															+		pipeline := NewMetricSynthesizers(captured, NewGPUMemoryUsedRatioSynthesizer())
														
 
															+
														
 
															+		pipeline.Update(&metric.UpdateSet{
														
 
															+			Timestamp: now,
														
 
															+			Updates: []metric.Update{
														
 
															+				*gpuFBUpdate(metric.DCGMFIDEVFBUSED, "GPU-1", "", 12000),
														
 
															+				*gpuFBUpdate(metric.DCGMFIDEVFBFREE, "GPU-1", "", 4000),
														
 
															+				*gpuFBUpdate(metric.DCGMFIDEVFBUSED, "GPU-2", "", 2000),
														
 
															+				*gpuFBUpdate(metric.DCGMFIDEVFBFREE, "GPU-2", "", 8000),
														
 
															+			},
														
 
															+		})
														
 
															+
														
 
															+		// Fail cleanly instead of panicking on a nil dereference when the
														
 
															+		// pipeline never forwards to the next stage.
														
 
															+		if captured.set == nil {
														
 
															+			t.Fatal("pipeline did not forward an UpdateSet to the next stage")
														
 
															+		}
														
 
															+
														
 
															+		ratios := map[string]float64{}
														
 
															+		for _, u := range captured.set.Updates {
														
 
															+			if u.Name == metric.OpencostGPUMemoryUsedRatio {
														
 
															+				ratios[u.Labels["UUID"]] = u.Value
														
 
															+			}
														
 
															+		}
														
 
															+		if len(ratios) != 2 {
														
 
															+			t.Fatalf("expected 2 synthesized ratios, got %d: %v", len(ratios), ratios)
														
 
															+		}
														
 
															+		if ratios["GPU-1"] != 0.75 || ratios["GPU-2"] != 0.2 {
														
 
															+			t.Errorf("ratios = %v, want {GPU-1:0.75, GPU-2:0.2}", ratios)
														
 
															+		}
														
 
															+		// original updates must pass through untouched alongside synthetics
														
 
															+		if len(captured.set.Updates) != 6 {
														
 
															+			t.Errorf("expected 4 originals + 2 synthetics, got %d", len(captured.set.Updates))
														
 
															+		}
														
 
															+	})
														
 
															+
														
 
															+	t.Run("Clear resets state between scrapes", func(t *testing.T) {
														
 
															+		s := NewGPUMemoryUsedRatioSynthesizer()
														
 
															+		s.Process(now, gpuFBUpdate(metric.DCGMFIDEVFBUSED, "GPU-1", "", 12000))
														
 
															+		s.Clear()
														
 
															+		s.Process(now, gpuFBUpdate(metric.DCGMFIDEVFBFREE, "GPU-1", "", 4000))
														
 
															+		if updates := s.Synthesize(); len(updates) != 0 {
														
 
															+			t.Errorf("expected no join across Clear, got %v", updates)
														
 
															+		}
														
 
															+	})
														
 
															+}
														
--- a/modules/collector-source/pkg/scrape/dcgm.go
+++ b/modules/collector-source/pkg/scrape/dcgm.go
@@ -26,6 +26,26 @@ func newDCGMTargetScraper(provider target.TargetProvider) *TargetScraper {
 
															 		[]string{
														
 
															 			metric.DCGMFIPROFGRENGINEACTIVE,
														
 
															 			metric.DCGMFIDEVDECUTIL,
														
 
															+			// GPU saturation signals; fields absent from the dcgm-exporter
														
 
															+			// configuration simply never appear in the scrape
														
 
															+			metric.DCGMFIDEVPOWERVIOLATION,
														
 
															+			metric.DCGMFIDEVTHERMALVIOLATION,
														
 
															+			metric.DCGMFIDEVSYNCBOOSTVIOLATION,
														
 
															+			metric.DCGMFIDEVBOARDLIMITVIOLATION,
														
 
															+			metric.DCGMFIDEVFBUSED,
														
 
															+			metric.DCGMFIDEVFBFREE,
														
 
															+			metric.DCGMFIDEVXIDERRORS,
														
 
															+			metric.DCGMFIDEVPOWERUSAGE,
														
 
															+			metric.DCGMFIDEVGPUTEMP,
														
 
															+			metric.DCGMFIDEVCLOCKTHROTTLEREASONS,
														
 
															+			metric.DCGMFIDEVCLOCKSEVENTREASONS,
														
 
															+			metric.DCGMFIPROFDRAMACTIVE,
														
 
															+			metric.DCGMFIPROFSMACTIVE,
														
 
															+			metric.DCGMFIPROFSMOCCUPANCY,
														
 
															+			metric.DCGMFIPROFPCIETXBYTES,
														
 
															+			metric.DCGMFIPROFPCIERXBYTES,
														
 
															+			metric.DCGMFIPROFNVLINKTXBYTES,
														
 
															+			metric.DCGMFIPROFNVLINKRXBYTES,
														
 
															 		},
														
 
															 		true)
														
 
															 }
														
--- a/modules/prometheus-source/go.mod
+++ b/modules/prometheus-source/go.mod
@@ -25,12 +25,15 @@ require (
 
															 	github.com/go-viper/mapstructure/v2 v2.5.0 // indirect
														
 
															 	github.com/goccy/go-json v0.10.5 // indirect
														
 
															 	github.com/google/uuid v1.6.0 // indirect
														
 
															+	github.com/hashicorp/errwrap v1.1.0 // indirect
														
 
															+	github.com/hashicorp/go-multierror v1.1.1 // indirect
														
 
															 	github.com/json-iterator/go v1.1.12 // indirect
														
 
															 	github.com/mattn/go-colorable v0.1.14 // indirect
														
 
															 	github.com/mattn/go-isatty v0.0.20 // indirect
														
 
															 	github.com/modern-go/concurrent v0.0.0-20180306012644-bacd9c7ef1dd // indirect
														
 
															 	github.com/modern-go/reflect2 v1.0.3-0.20250322232337-35a7c28c31ee // indirect
														
 
															 	github.com/munnerz/goautoneg v0.0.0-20191010083416-a7dc8b61c822 // indirect
														
 
															+	github.com/patrickmn/go-cache v2.1.0+incompatible // indirect
														
 
															 	github.com/pelletier/go-toml/v2 v2.2.4 // indirect
														
 
															 	github.com/prometheus/client_model v0.6.2 // indirect
														
 
															 	github.com/prometheus/common v0.67.5 // indirect
														
@@ -43,6 +46,7 @@ require (
 
															 	github.com/x448/float16 v0.8.4 // indirect
														
 
															 	go.yaml.in/yaml/v2 v2.4.3 // indirect
														
 
															 	go.yaml.in/yaml/v3 v3.0.4 // indirect
														
 
															+	golang.org/x/exp v0.0.0-20260218203240-3dfff04db8fa // indirect
														
 
															 	golang.org/x/net v0.52.0 // indirect
														
 
															 	golang.org/x/oauth2 v0.35.0 // indirect
														
 
															 	golang.org/x/sys v0.42.0 // indirect
														
--- a/modules/prometheus-source/go.sum
+++ b/modules/prometheus-source/go.sum
@@ -61,6 +61,11 @@ github.com/google/go-cmp v0.7.0/go.mod h1:pXiqmnSA92OHEEa9HXL2W4E7lf9JzCmGVUdgjX
 
															 github.com/google/gofuzz v1.0.0/go.mod h1:dBl0BpW6vV/+mYPU4Po3pmUjxk6FQPldtuIdl/M65Eg=
														
 
															 github.com/google/uuid v1.6.0 h1:NIvaJDMOsjHA8n1jAhLSgzrAzy1Hgr+hNrb57e+94F0=
														
 
															 github.com/google/uuid v1.6.0/go.mod h1:TIyPZe4MgqvfeYDBFedMoGGpEw/LqOeaOT+nhxU+yHo=
														
 
															+github.com/hashicorp/errwrap v1.0.0/go.mod h1:YH+1FKiLXxHSkmPseP+kNlulaMuP3n2brvKWEqk/Jc4=
														
 
															+github.com/hashicorp/errwrap v1.1.0 h1:OxrOeh75EUXMY8TBjag2fzXGZ40LB6IKw45YeGUDY2I=
														
 
															+github.com/hashicorp/errwrap v1.1.0/go.mod h1:YH+1FKiLXxHSkmPseP+kNlulaMuP3n2brvKWEqk/Jc4=
														
 
															+github.com/hashicorp/go-multierror v1.1.1 h1:H5DkEtf6CXdFp0N0Em5UCwQpXMWke8IA0+lD48awMYo=
														
 
															+github.com/hashicorp/go-multierror v1.1.1/go.mod h1:iw975J/qwKPdAO1clOe2L8331t/9/fmwbPZ6JB6eMoM=
														
 
															 github.com/jpillora/backoff v1.0.0 h1:uvFg412JmmHBHw7iwprIxkPMI+sGQ4kzOWsMeHnm2EA=
														
 
															 github.com/jpillora/backoff v1.0.0/go.mod h1:J/6gKK9jxlEcS3zixgDgUAsiuZ7yrSoa/FX5e0EB2j4=
														
 
															 github.com/json-iterator/go v1.1.12 h1:PV8peI4a0ysnczrg+LtxykD8LfKY9ML6u2jnxaEnrnM=
														
@@ -88,6 +93,8 @@ github.com/munnerz/goautoneg v0.0.0-20191010083416-a7dc8b61c822 h1:C3w9PqII01/Oq
 
															 github.com/munnerz/goautoneg v0.0.0-20191010083416-a7dc8b61c822/go.mod h1:+n7T8mK8HuQTcFwEeznm/DIxMOiR9yIdICNftLE1DvQ=
														
 
															 github.com/mwitkow/go-conntrack v0.0.0-20190716064945-2f068394615f h1:KUppIJq7/+SVif2QVs3tOP0zanoHgBEVAwHxUSIzRqU=
														
 
															 github.com/mwitkow/go-conntrack v0.0.0-20190716064945-2f068394615f/go.mod h1:qRWi+5nqEBWmkhHvq77mSJWrCKwh8bxhgT7d/eI7P4U=
														
 
															+github.com/patrickmn/go-cache v2.1.0+incompatible h1:HRMgzkcYKYpi3C8ajMPV8OFXaaRUnok+kx1WdO15EQc=
														
 
															+github.com/patrickmn/go-cache v2.1.0+incompatible/go.mod h1:3Qf8kWWT7OJRJbdiICTKqZju1ZixQ/KpMGzzAfe6+WQ=
														
 
															 github.com/pelletier/go-toml/v2 v2.2.4 h1:mye9XuhQ6gvn5h28+VilKrrPoQVanw5PMw/TB0t5Ec4=
														
 
															 github.com/pelletier/go-toml/v2 v2.2.4/go.mod h1:2gIqNv+qfxSVS7cM2xJQKtLSTLUE9V8t9Stt+h56mCY=
														
 
															 github.com/pkg/errors v0.9.1/go.mod h1:bwawxfHBFNV+L2hUp1rHADufV3IMtnDRdf1r5NINEl0=
														
@@ -131,6 +138,8 @@ go.yaml.in/yaml/v2 v2.4.3 h1:6gvOSjQoTB3vt1l+CU+tSyi/HOjfOjRLJ4YwYZGwRO0=
 
															 go.yaml.in/yaml/v2 v2.4.3/go.mod h1:zSxWcmIDjOzPXpjlTTbAsKokqkDNAVtZO0WOMiT90s8=
														
 
															 go.yaml.in/yaml/v3 v3.0.4 h1:tfq32ie2Jv2UxXFdLJdh3jXuOzWiL1fo0bu/FbuKpbc=
														
 
															 go.yaml.in/yaml/v3 v3.0.4/go.mod h1:DhzuOOF2ATzADvBadXxruRBLzYTpT36CKvDb3+aBEFg=
														
 
															+golang.org/x/exp v0.0.0-20260218203240-3dfff04db8fa h1:Zt3DZoOFFYkKhDT3v7Lm9FDMEV06GpzjG2jrqW+QTE0=
														
 
															+golang.org/x/exp v0.0.0-20260218203240-3dfff04db8fa/go.mod h1:K79w1Vqn7PoiZn+TkNpx3BUWUQksGO3JcVX6qIjytmA=
														
 
															 golang.org/x/net v0.52.0 h1:He/TN1l0e4mmR3QqHMT2Xab3Aj3L9qjbhRm78/6jrW0=
														
 
															 golang.org/x/net v0.52.0/go.mod h1:R1MAz7uMZxVMualyPXb+VaqGSa3LIaUqk0eEt3w36Sw=
														
 
															 golang.org/x/oauth2 v0.35.0 h1:Mv2mzuHuZuY2+bkyWXIHMfhNdJAdwW3FuWeCPYN5GVQ=
														
--- a/modules/prometheus-source/pkg/prom/config.go
+++ b/modules/prometheus-source/pkg/prom/config.go
@@ -34,6 +34,9 @@ type OpenCostPrometheusConfig struct {
 
															 	ClusterFilter         string
														
 
															 	DataResolution        time.Duration
														
 
															 	DataResolutionMinutes int
														
 
															+	// GPUMemorySaturationThreshold is the framebuffer occupancy ratio in
														
 
															+	// (0, 1] above which GPU memory is considered pressured.
														
 
															+	GPUMemorySaturationThreshold float64
														
 
															 }
														
 
															 func (ocpc *OpenCostPrometheusConfig) IsRateLimitRetryEnabled() bool {
														
@@ -151,5 +154,9 @@ func NewOpenCostPrometheusConfigFromEnv() (*OpenCostPrometheusConfig, error) {
 
															 		ClusterFilter:         clusterFilter,
														
 
															 		DataResolution:        dataResolution,
														
 
															 		DataResolutionMinutes: resolutionMinutes,
														
 
															+
														
 
															+		// shared with collector-source via core env so both data sources
														
 
															+		// apply the identical threshold
														
 
															+		GPUMemorySaturationThreshold: coreenv.GetGPUMemorySaturationThreshold(),
														
 
															 	}, nil
														
 
															 }
														
--- a/modules/prometheus-source/pkg/prom/gpudevicequerier.go
+++ b/modules/prometheus-source/pkg/prom/gpudevicequerier.go
@@ -0,0 +1,67 @@
 
															+package prom
														
 
															+
														
 
															+import (
														
 
															+	"fmt"
														
 
															+	"time"
														
 
															+
														
 
															+	"github.com/opencost/opencost/core/pkg/source"
														
 
															+)
														
 
															+
														
 
															+// Device-level GPU metric queries supporting the DeviceInfo and
														
 
															+// DevicePerformance contracts on DCGMDevice: power draw, temperature,
														
 
															+// device-level compute utilization, and absolute memory used. Unlike the
														
 
															+// container-attributed saturation queries these group by device identity
														
 
															+// only, since the values describe the whole device (or MIG instance)
														
 
															+// regardless of which containers share it. All source fields are in the
														
 
															+// default dcgm-exporter configuration.
														
 
															+
														
 
															+// gpuDeviceByLabels groups series by device identity (and MIG instance)
														
 
															+// without container attribution.
														
 
															+const gpuDeviceByLabels = `device, modelName, UUID, GPU_I_PROFILE, GPU_I_ID`
														
 
															+
														
 
															+// queryGPUDeviceGauge issues an agg(agg_over_time(...)) query for a
														
 
															+// device-level DCGM gauge.
														
 
															+func (pds *PrometheusMetricsQuerier) queryGPUDeviceGauge(queryName, metric, agg string, start, end time.Time) *source.Future[source.GPUDeviceMetricResult] {
														
 
															+	const queryFmt = `%s(%s_over_time(%s{%s}[%s])) by (%s, %s)`
														
 
															+	cfg := pds.promConfig
														
 
															+
														
 
															+	durStr := mustDurationString(queryName, start, end)
														
 
															+	query := fmt.Sprintf(queryFmt, agg, agg, metric, cfg.ClusterFilter, durStr, gpuDeviceByLabels, cfg.ClusterLabel)
														
 
															+	return pds.queryGPUSaturation(queryName, query, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUDevicePowerAvg queries average device power draw in watts
														
 
															+// (DCGM_FI_DEV_POWER_USAGE).
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUDevicePowerAvg(start, end time.Time) *source.Future[source.GPUDeviceMetricResult] {
														
 
															+	return pds.queryGPUDeviceGauge("QueryGPUDevicePowerAvg", "DCGM_FI_DEV_POWER_USAGE", "avg", start, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUDeviceTempAvg queries average device temperature in degrees
														
 
															+// Celsius (DCGM_FI_DEV_GPU_TEMP).
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUDeviceTempAvg(start, end time.Time) *source.Future[source.GPUDeviceMetricResult] {
														
 
															+	return pds.queryGPUDeviceGauge("QueryGPUDeviceTempAvg", "DCGM_FI_DEV_GPU_TEMP", "avg", start, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUDeviceUsageAvg queries average device-level compute utilization
														
 
															+// as a 0-1 ratio (DCGM_FI_PROF_GR_ENGINE_ACTIVE without container
														
 
															+// attribution).
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUDeviceUsageAvg(start, end time.Time) *source.Future[source.GPUDeviceMetricResult] {
														
 
															+	return pds.queryGPUDeviceGauge("QueryGPUDeviceUsageAvg", "DCGM_FI_PROF_GR_ENGINE_ACTIVE", "avg", start, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUDeviceUsageMax queries peak device-level compute utilization as a
														
 
															+// 0-1 ratio.
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUDeviceUsageMax(start, end time.Time) *source.Future[source.GPUDeviceMetricResult] {
														
 
															+	return pds.queryGPUDeviceGauge("QueryGPUDeviceUsageMax", "DCGM_FI_PROF_GR_ENGINE_ACTIVE", "max", start, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUDeviceMemoryUsedAvg queries average framebuffer used in MiB
														
 
															+// (DCGM_FI_DEV_FB_USED); hydration converts to bytes.
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUDeviceMemoryUsedAvg(start, end time.Time) *source.Future[source.GPUDeviceMetricResult] {
														
 
															+	return pds.queryGPUDeviceGauge("QueryGPUDeviceMemoryUsedAvg", "DCGM_FI_DEV_FB_USED", "avg", start, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUDeviceMemoryUsedMax queries peak framebuffer used in MiB.
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUDeviceMemoryUsedMax(start, end time.Time) *source.Future[source.GPUDeviceMetricResult] {
														
 
															+	return pds.queryGPUDeviceGauge("QueryGPUDeviceMemoryUsedMax", "DCGM_FI_DEV_FB_USED", "max", start, end)
														
 
															+}
														
--- a/modules/prometheus-source/pkg/prom/gpusaturationquerier.go
+++ b/modules/prometheus-source/pkg/prom/gpusaturationquerier.go
@@ -0,0 +1,282 @@
 
															+package prom
														
 
															+
														
 
															+import (
														
 
															+	"fmt"
														
 
															+	"strings"
														
 
															+	"time"
														
 
															+
														
 
															+	"github.com/opencost/opencost/core/pkg/log"
														
 
															+	"github.com/opencost/opencost/core/pkg/opencost"
														
 
															+	"github.com/opencost/opencost/core/pkg/source"
														
 
															+	"github.com/opencost/opencost/core/pkg/util/timeutil"
														
 
															+)
														
 
															+
														
 
															+// GPU saturation queries
														
 
															+//
														
 
															+// These queries derive USE-method saturation signals for GPUs from
														
 
															+// dcgm-exporter metrics. Each query is an independent primitive; when the
														
 
															+// underlying DCGM field is not collected (no dcgm-exporter, the field is
														
 
															+// disabled in its config, or the GPU lacks DCP profiling support) the query
														
 
															+// simply returns no series, which downstream code treats as "signal absent"
														
 
															+// rather than zero.
														
 
															+//
														
 
															+// Sources by dcgm-exporter configuration:
														
 
															+//   - default config: DCGM_FI_DEV_*_VIOLATION, DCGM_FI_DEV_FB_USED/FREE,
														
 
															+//     DCGM_FI_DEV_XID_ERRORS, DCGM_FI_PROF_DRAM_ACTIVE,
														
 
															+//     DCGM_FI_PROF_PCIE_TX/RX_BYTES
														
 
															+//   - requires explicit enablement: DCGM_FI_DEV_CLOCK_THROTTLE_REASONS
														
 
															+//     (DCGM_FI_DEV_CLOCKS_EVENT_REASONS in DCGM 3.3+),
														
 
															+//     DCGM_FI_PROF_SM_ACTIVE, DCGM_FI_PROF_SM_OCCUPANCY,
														
 
															+//     DCGM_FI_PROF_NVLINK_TX/RX_BYTES
														
 
															+//
														
 
															+// All DCGM_FI_PROF_* fields additionally require DCP profiling (Volta+).
														
 
															+
														
 
															+// gpuSaturationByLabels is the grouping shared by every GPU saturation
														
 
															+// query: container attribution, GPU identity, and MIG instance labels.
														
 
															+// Grouping by a label that is absent from a series yields an empty value,
														
 
															+// so non-MIG series pass through unchanged.
														
 
															+const gpuSaturationByLabels = `container, pod, namespace, device, modelName, UUID, GPU_I_PROFILE, GPU_I_ID, pod_uid`
														
 
															+
														
 
															+// gpuThrottleViolationMetrics maps each DCGM violation counter to its
														
 
															+// canonical reason name. The counters accumulate microseconds spent
														
 
															+// throttled, so increase(counter[window]) / window-in-microseconds is the
														
 
															+// fraction of the window spent throttled for that reason.
														
 
															+var gpuThrottleViolationMetrics = []struct {
														
 
															+	Metric string
														
 
															+	Reason string
														
 
															+}{
														
 
															+	{Metric: "DCGM_FI_DEV_POWER_VIOLATION", Reason: opencost.GPUThrottleViolationPower},
														
 
															+	{Metric: "DCGM_FI_DEV_THERMAL_VIOLATION", Reason: opencost.GPUThrottleViolationThermal},
														
 
															+	{Metric: "DCGM_FI_DEV_SYNC_BOOST_VIOLATION", Reason: opencost.GPUThrottleViolationSyncBoost},
														
 
															+	{Metric: "DCGM_FI_DEV_BOARD_LIMIT_VIOLATION", Reason: opencost.GPUThrottleViolationBoardLimit},
														
 
															+}
														
 
															+
														
 
															+// buildGPUThrottleViolationQuery returns one query producing a series per
														
 
															+// (GPU, container, reason): the fraction of the window each violation
														
 
															+// counter accumulated. Branches for the four violation metrics are joined
														
 
															+// with "or" and tagged with a constant "reason" label so a single decoder
														
 
															+// handles all of them.
														
 
															+func buildGPUThrottleViolationQuery(clusterFilter, durStr, clusterLabel string, windowSeconds float64) string {
														
 
															+	windowMicros := windowSeconds * 1e6
														
 
															+	branches := make([]string, 0, len(gpuThrottleViolationMetrics))
														
 
															+	for _, violation := range gpuThrottleViolationMetrics {
														
 
															+		branches = append(branches, fmt.Sprintf(
														
 
															+			`label_replace(avg(increase(%s{container!="",%s}[%s])) by (%s, %s) / %g, "reason", "%s", "", "")`,
														
 
															+			violation.Metric, clusterFilter, durStr, gpuSaturationByLabels, clusterLabel, windowMicros, violation.Reason,
														
 
															+		))
														
 
															+	}
														
 
															+	return strings.Join(branches, " or ")
														
 
															+}
														
 
															+
														
 
															+// buildGPUThrottleReasonQuery returns one query producing a series per
														
 
															+// (GPU, container, reason): the fraction of window samples in which the
														
 
															+// reason bit was set in the clock throttle reasons bitmask. The bit test
														
 
															+// floor(mask / bit) % 2 is evaluated per sample via a subquery at the
														
 
															+// configured resolution (PromQL has no bitwise operators, hence the
														
 
															+// arithmetic). Both the pre-3.3 and post-3.3 DCGM field names are queried
														
 
															+// via `or`; at most one exists per dcgm-exporter version. The rename is
														
 
															+// handled here at the query layer because the prometheus source has no
														
 
															+// ingest step where the metric name could be normalized once — Prometheus
														
 
															+// stores whatever dcgm-exporter exposed. If a normalization layer ever
														
 
															+// exists, collapse these to the canonical name there.
														
 
															+func buildGPUThrottleReasonQuery(clusterFilter, durStr, clusterLabel string, minsPerResolution int) string {
														
 
															+	branches := make([]string, 0, len(opencost.GPUThrottleReasons))
														
 
															+	for _, reason := range opencost.GPUThrottleReasons {
														
 
															+		branches = append(branches, fmt.Sprintf(
														
 
															+			`label_replace(avg(avg_over_time(((floor((DCGM_FI_DEV_CLOCK_THROTTLE_REASONS{container!="",%s} or DCGM_FI_DEV_CLOCKS_EVENT_REASONS{container!="",%s}) / %d)) %% 2)[%s:%dm])) by (%s, %s), "reason", "%s", "", "")`,
														
 
															+			clusterFilter, clusterFilter, reason.Bit, durStr, minsPerResolution, gpuSaturationByLabels, clusterLabel, reason.Name,
														
 
															+		))
														
 
															+	}
														
 
															+	return strings.Join(branches, " or ")
														
 
															+}
														
 
															+
														
 
															+// queryGPUSaturation centralizes the shared shape of every GPU saturation
														
 
															+// query method: log it, then issue it at the window end.
														
 
															+func (pds *PrometheusMetricsQuerier) queryGPUSaturation(queryName, query string, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), query)
														
 
															+
														
 
															+	ctx := pds.promContexts.NewNamedContext(AllocationContextName)
														
 
															+	return source.NewFuture(source.DecodeGPUSaturationResult, ctx.QueryAtTime(query, end))
														
 
															+}
														
 
															+
														
 
															+// mustDurationString panics like every other querier when the window cannot
														
 
															+// be expressed as a duration string.
														
 
															+func mustDurationString(queryName string, start, end time.Time) string {
														
 
															+	durStr := timeutil.DurationString(end.Sub(start))
														
 
															+	if durStr == "" {
														
 
															+		panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
														
 
															+	}
														
 
															+	return durStr
														
 
															+}
														
 
															+
														
 
															+// QueryGPUThrottleViolationRatio queries the fraction of the window each GPU
														
 
															+// spent throttled, per reason, from the DCGM violation counters (default
														
 
															+// dcgm-exporter configuration).
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUThrottleViolationRatio(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	const queryName = "QueryGPUThrottleViolationRatio"
														
 
															+	cfg := pds.promConfig
														
 
															+
														
 
															+	durStr := mustDurationString(queryName, start, end)
														
 
															+	query := buildGPUThrottleViolationQuery(cfg.ClusterFilter, durStr, cfg.ClusterLabel, end.Sub(start).Seconds())
														
 
															+	return pds.queryGPUSaturation(queryName, query, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUThrottleReasonRatio queries the fraction of the window each
														
 
															+// saturation-relevant bit of the clock throttle reasons bitmask was set.
														
 
															+// Requires DCGM_FI_DEV_CLOCK_THROTTLE_REASONS (or its DCGM 3.3+ rename) to
														
 
															+// be enabled in the dcgm-exporter configuration.
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUThrottleReasonRatio(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	const queryName = "QueryGPUThrottleReasonRatio"
														
 
															+	cfg := pds.promConfig
														
 
															+
														
 
															+	minsPerResolution := cfg.DataResolutionMinutes
														
 
															+	durStr := pds.durationStringFor(start, end, minsPerResolution, false)
														
 
															+	if durStr == "" {
														
 
															+		panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
														
 
															+	}
														
 
															+
														
 
															+	query := buildGPUThrottleReasonQuery(cfg.ClusterFilter, durStr, cfg.ClusterLabel, minsPerResolution)
														
 
															+	return pds.queryGPUSaturation(queryName, query, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUMemoryUsedRatioAvg queries average framebuffer occupancy over the
														
 
															+// window: FB_USED / (FB_USED + FB_FREE). Default dcgm-exporter configuration.
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUMemoryUsedRatioAvg(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	const queryName = "QueryGPUMemoryUsedRatioAvg"
														
 
															+	const queryFmt = `avg(avg_over_time(DCGM_FI_DEV_FB_USED{container!="",%s}[%s])) by (%s, %s) / (avg(avg_over_time(DCGM_FI_DEV_FB_USED{container!="",%s}[%s])) by (%s, %s) + avg(avg_over_time(DCGM_FI_DEV_FB_FREE{container!="",%s}[%s])) by (%s, %s))`
														
 
															+	cfg := pds.promConfig
														
 
															+
														
 
															+	durStr := mustDurationString(queryName, start, end)
														
 
															+	query := fmt.Sprintf(queryFmt,
														
 
															+		cfg.ClusterFilter, durStr, gpuSaturationByLabels, cfg.ClusterLabel,
														
 
															+		cfg.ClusterFilter, durStr, gpuSaturationByLabels, cfg.ClusterLabel,
														
 
															+		cfg.ClusterFilter, durStr, gpuSaturationByLabels, cfg.ClusterLabel,
														
 
															+	)
														
 
															+	return pds.queryGPUSaturation(queryName, query, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUMemoryUsedRatioMax queries peak framebuffer occupancy over the
														
 
															+// window. The denominator uses window averages, which is exact because
														
 
															+// FB_USED + FB_FREE is the fixed framebuffer capacity.
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUMemoryUsedRatioMax(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	const queryName = "QueryGPUMemoryUsedRatioMax"
														
 
															+	const queryFmt = `max(max_over_time(DCGM_FI_DEV_FB_USED{container!="",%s}[%s])) by (%s, %s) / (avg(avg_over_time(DCGM_FI_DEV_FB_USED{container!="",%s}[%s])) by (%s, %s) + avg(avg_over_time(DCGM_FI_DEV_FB_FREE{container!="",%s}[%s])) by (%s, %s))`
														
 
															+	cfg := pds.promConfig
														
 
															+
														
 
															+	durStr := mustDurationString(queryName, start, end)
														
 
															+	query := fmt.Sprintf(queryFmt,
														
 
															+		cfg.ClusterFilter, durStr, gpuSaturationByLabels, cfg.ClusterLabel,
														
 
															+		cfg.ClusterFilter, durStr, gpuSaturationByLabels, cfg.ClusterLabel,
														
 
															+		cfg.ClusterFilter, durStr, gpuSaturationByLabels, cfg.ClusterLabel,
														
 
															+	)
														
 
															+	return pds.queryGPUSaturation(queryName, query, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUMemoryPressureRatio queries the fraction of window samples in
														
 
															+// which framebuffer occupancy exceeded the configured threshold.
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUMemoryPressureRatio(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	const queryName = "QueryGPUMemoryPressureRatio"
														
 
															+	const queryFmt = `avg(avg_over_time(((DCGM_FI_DEV_FB_USED{container!="",%s} / (DCGM_FI_DEV_FB_USED{container!="",%s} + DCGM_FI_DEV_FB_FREE{container!="",%s})) >= bool %g)[%s:%dm])) by (%s, %s)`
														
 
															+	cfg := pds.promConfig
														
 
															+
														
 
															+	minsPerResolution := cfg.DataResolutionMinutes
														
 
															+	durStr := pds.durationStringFor(start, end, minsPerResolution, false)
														
 
															+	if durStr == "" {
														
 
															+		panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
														
 
															+	}
														
 
															+
														
 
															+	query := fmt.Sprintf(queryFmt,
														
 
															+		cfg.ClusterFilter, cfg.ClusterFilter, cfg.ClusterFilter,
														
 
															+		cfg.GPUMemorySaturationThreshold, durStr, minsPerResolution,
														
 
															+		gpuSaturationByLabels, cfg.ClusterLabel,
														
 
															+	)
														
 
															+	return pds.queryGPUSaturation(queryName, query, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUXIDErrorCount queries the number of XID error events observed in
														
 
															+// the window. DCGM_FI_DEV_XID_ERRORS reports the most recent XID code, so
														
 
															+// this counts changes of that value; consecutive identical errors are
														
 
															+// undercounted. Default dcgm-exporter configuration.
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUXIDErrorCount(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	const queryName = "QueryGPUXIDErrorCount"
														
 
															+	const queryFmt = `sum(changes(DCGM_FI_DEV_XID_ERRORS{container!="",%s}[%s])) by (%s, %s)`
														
 
															+	cfg := pds.promConfig
														
 
															+
														
 
															+	durStr := mustDurationString(queryName, start, end)
														
 
															+	query := fmt.Sprintf(queryFmt, cfg.ClusterFilter, durStr, gpuSaturationByLabels, cfg.ClusterLabel)
														
 
															+	return pds.queryGPUSaturation(queryName, query, end)
														
 
															+}
														
 
															+
														
 
															+// queryGPUGaugeOverTime is the shared implementation for the DCP profiling
														
 
															+// gauges that need only an avg or max over the window.
														
 
															+func (pds *PrometheusMetricsQuerier) queryGPUGaugeOverTime(queryName, metric, agg string, start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	const queryFmt = `%s(%s_over_time(%s{container!="",%s}[%s])) by (%s, %s)`
														
 
															+	cfg := pds.promConfig
														
 
															+
														
 
															+	durStr := mustDurationString(queryName, start, end)
														
 
															+	query := fmt.Sprintf(queryFmt, agg, agg, metric, cfg.ClusterFilter, durStr, gpuSaturationByLabels, cfg.ClusterLabel)
														
 
															+	return pds.queryGPUSaturation(queryName, query, end)
														
 
															+}
														
 
															+
														
 
															+// queryGPUCounterRate is the shared implementation for the DCP byte
														
 
															+// counters reported as average bytes/sec over the window.
														
 
															+func (pds *PrometheusMetricsQuerier) queryGPUCounterRate(queryName, metric string, start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	const queryFmt = `avg(rate(%s{container!="",%s}[%s])) by (%s, %s)`
														
 
															+	cfg := pds.promConfig
														
 
															+
														
 
															+	durStr := mustDurationString(queryName, start, end)
														
 
															+	query := fmt.Sprintf(queryFmt, metric, cfg.ClusterFilter, durStr, gpuSaturationByLabels, cfg.ClusterLabel)
														
 
															+	return pds.queryGPUSaturation(queryName, query, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUDRAMActiveAvg queries the average ratio of cycles the device
														
 
															+// memory interface was active. Requires DCP profiling.
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUDRAMActiveAvg(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return pds.queryGPUGaugeOverTime("QueryGPUDRAMActiveAvg", "DCGM_FI_PROF_DRAM_ACTIVE", "avg", start, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUDRAMActiveMax queries the peak ratio of cycles the device memory
														
 
															+// interface was active. Requires DCP profiling.
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUDRAMActiveMax(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return pds.queryGPUGaugeOverTime("QueryGPUDRAMActiveMax", "DCGM_FI_PROF_DRAM_ACTIVE", "max", start, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUSMActiveAvg queries the average ratio of cycles at least one warp
														
 
															+// was assigned to any SM. Requires DCP profiling and explicit enablement in
														
 
															+// the dcgm-exporter configuration.
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUSMActiveAvg(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return pds.queryGPUGaugeOverTime("QueryGPUSMActiveAvg", "DCGM_FI_PROF_SM_ACTIVE", "avg", start, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUSMOccupancyAvg queries the average ratio of resident warps to the
														
 
															+// SM maximum. Requires DCP profiling and explicit enablement in the
														
 
															+// dcgm-exporter configuration.
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUSMOccupancyAvg(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return pds.queryGPUGaugeOverTime("QueryGPUSMOccupancyAvg", "DCGM_FI_PROF_SM_OCCUPANCY", "avg", start, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUPCIeTxBytesAvg queries average PCIe transmit throughput in
														
 
															+// bytes/sec. Requires DCP profiling.
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUPCIeTxBytesAvg(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return pds.queryGPUCounterRate("QueryGPUPCIeTxBytesAvg", "DCGM_FI_PROF_PCIE_TX_BYTES", start, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUPCIeRxBytesAvg queries average PCIe receive throughput in
														
 
															+// bytes/sec. Requires DCP profiling.
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUPCIeRxBytesAvg(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return pds.queryGPUCounterRate("QueryGPUPCIeRxBytesAvg", "DCGM_FI_PROF_PCIE_RX_BYTES", start, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUNVLinkTxBytesAvg queries average NVLink transmit throughput in
														
 
															+// bytes/sec. Requires DCP profiling and explicit enablement in the
														
 
															+// dcgm-exporter configuration.
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUNVLinkTxBytesAvg(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return pds.queryGPUCounterRate("QueryGPUNVLinkTxBytesAvg", "DCGM_FI_PROF_NVLINK_TX_BYTES", start, end)
														
 
															+}
														
 
															+
														
 
															+// QueryGPUNVLinkRxBytesAvg queries average NVLink receive throughput in
														
 
															+// bytes/sec. Requires DCP profiling and explicit enablement in the
														
 
															+// dcgm-exporter configuration.
														
 
															+func (pds *PrometheusMetricsQuerier) QueryGPUNVLinkRxBytesAvg(start, end time.Time) *source.Future[source.GPUSaturationResult] {
														
 
															+	return pds.queryGPUCounterRate("QueryGPUNVLinkRxBytesAvg", "DCGM_FI_PROF_NVLINK_RX_BYTES", start, end)
														
 
															+}
														
--- a/modules/prometheus-source/pkg/prom/gpusaturationquerier_test.go
+++ b/modules/prometheus-source/pkg/prom/gpusaturationquerier_test.go
@@ -0,0 +1,234 @@
 
															+package prom
														
 
															+
														
 
															+import (
														
 
															+	"strings"
														
 
															+	"testing"
														
 
															+	"time"
														
 
															+
														
 
															+	"github.com/rs/zerolog"
														
 
															+	zerologger "github.com/rs/zerolog/log"
														
 
															+)
														
 
															+
														
 
															+func TestBuildGPUThrottleViolationQuery(t *testing.T) {
														
 
															+	query := buildGPUThrottleViolationQuery(`cluster_id="c1"`, "1h", "cluster_id", 3600)
														
 
															+
														
 
															+	branches := strings.Split(query, " or ")
														
 
															+	if len(branches) != 4 {
														
 
															+		t.Fatalf("expected 4 violation branches, got %d: %s", len(branches), query)
														
 
															+	}
														
 
															+
														
 
															+	// one hour is 3.6e9 microseconds: each branch must normalize by it
														
 
															+	wantBranch := `label_replace(avg(increase(DCGM_FI_DEV_POWER_VIOLATION{container!="",cluster_id="c1"}[1h])) by (container, pod, namespace, device, modelName, UUID, GPU_I_PROFILE, GPU_I_ID, pod_uid, cluster_id) / 3.6e+09, "reason", "power", "", "")`
														
 
															+	if branches[0] != wantBranch {
														
 
															+		t.Errorf("violation branch mismatch:\n got %s\nwant %s", branches[0], wantBranch)
														
 
															+	}
														
 
															+
														
 
															+	for metric, reason := range map[string]string{
														
 
															+		"DCGM_FI_DEV_POWER_VIOLATION":       "power",
														
 
															+		"DCGM_FI_DEV_THERMAL_VIOLATION":     "thermal",
														
 
															+		"DCGM_FI_DEV_SYNC_BOOST_VIOLATION":  "sync_boost",
														
 
															+		"DCGM_FI_DEV_BOARD_LIMIT_VIOLATION": "board_limit",
														
 
															+	} {
														
 
															+		if !strings.Contains(query, metric) {
														
 
															+			t.Errorf("expected query to reference %s", metric)
														
 
															+		}
														
 
															+		if !strings.Contains(query, `"reason", "`+reason+`"`) {
														
 
															+			t.Errorf("expected query to tag reason %q", reason)
														
 
															+		}
														
 
															+	}
														
 
															+}
														
 
															+
														
 
															+func TestBuildGPUThrottleReasonQuery(t *testing.T) {
														
 
															+	query := buildGPUThrottleReasonQuery(`cluster_id="c1"`, "1h", "cluster_id", 5)
														
 
															+
														
 
															+	// one label_replace-wrapped branch per saturation-relevant reason bit
														
 
															+	if got := strings.Count(query, "label_replace"); got != 6 {
														
 
															+		t.Fatalf("expected 6 reason branches, got %d: %s", got, query)
														
 
															+	}
														
 
															+
														
 
															+	// the first branch tests the sw_power_cap bit (0x4 == 4) per sample at
														
 
															+	// the subquery resolution, then averages the 0/1 results over the window
														
 
															+	wantBranch := `label_replace(avg(avg_over_time(((floor((DCGM_FI_DEV_CLOCK_THROTTLE_REASONS{container!="",cluster_id="c1"} or DCGM_FI_DEV_CLOCKS_EVENT_REASONS{container!="",cluster_id="c1"}) / 4)) % 2)[1h:5m])) by (container, pod, namespace, device, modelName, UUID, GPU_I_PROFILE, GPU_I_ID, pod_uid, cluster_id), "reason", "sw_power_cap", "", "")`
														
 
															+	if !strings.HasPrefix(query, wantBranch+" or ") {
														
 
															+		t.Errorf("reason query does not start with expected sw_power_cap branch:\n got %s\nwant prefix %s", query, wantBranch)
														
 
															+	}
														
 
															+
														
 
															+	for reason, bit := range map[string]string{
														
 
															+		"sw_power_cap":   "/ 4",
														
 
															+		"hw_slowdown":    "/ 8",
														
 
															+		"sync_boost":     "/ 16",
														
 
															+		"sw_thermal":     "/ 32",
														
 
															+		"hw_thermal":     "/ 64",
														
 
															+		"hw_power_brake": "/ 128",
														
 
															+	} {
														
 
															+		if !strings.Contains(query, `"reason", "`+reason+`"`) {
														
 
															+			t.Errorf("expected query to tag reason %q", reason)
														
 
															+		}
														
 
															+		if !strings.Contains(query, bit) {
														
 
															+			t.Errorf("expected query to test bit via %q for reason %q", bit, reason)
														
 
															+		}
														
 
															+	}
														
 
															+}
														
 
															+
														
 
															+// TestGPUSaturationQueries issues every GPU saturation query and every
														
 
															+// device-level GPU query against the no-op client and inspects the text
														
 
															+// captured from the debug log. Saturation queries must log their own name,
														
 
															+// reference the expected DCGM source metric (plus any extra fragment),
														
 
															+// carry the cluster filter, and group by the saturation label set.
														
 
															+// Device-level queries must reference their metric, carry the cluster
														
 
															+// filter, and group by the device label set without container attribution.
														
 
															+func TestGPUSaturationQueries(t *testing.T) {
														
 
															+	initLogging(t, "debug", false)
														
 
															+
														
 
															+	// Redirect the global zerolog logger into logWriter so the text each
														
 
															+	// querier method logs can be inspected. Timestamp, level and caller
														
 
															+	// parts are excluded from the console output.
														
 
															+	logWriter := new(SingleLogWriter)
														
 
															+	zerologger.Logger = zerologger.Output(zerolog.ConsoleWriter{
														
 
															+		Out:        logWriter,
														
 
															+		TimeFormat: "",
														
 
															+		NoColor:    true,
														
 
															+		PartsExclude: []string{
														
 
															+			zerolog.TimestampFieldName,
														
 
															+			zerolog.LevelFieldName,
														
 
															+			zerolog.CallerFieldName,
														
 
															+		},
														
 
															+	})
														
 
															+	defer initLogging(t, "debug", false)
														
 
															+
														
 
															+	t.Setenv("PROMETHEUS_SERVER_ENDPOINT", "nowhere")
														
 
															+	t.Setenv("CURRENT_CLUSTER_ID_FILTER_ENABLED", "true")
														
 
															+	t.Setenv("CLUSTER_ID", "test-cluster")
														
 
															+	t.Setenv("GPU_MEMORY_SATURATION_THRESHOLD", "0.8")
														
 
															+
														
 
															+	config, err := NewOpenCostPrometheusConfigFromEnv()
														
 
															+	if err != nil {
														
 
															+		t.Fatalf("Failed to create OpenCost Prometheus config: %v", err)
														
 
															+	}
														
 
															+
														
 
															+	mock := new(NoOpPromClient)
														
 
															+	contextFactory := NewContextFactory(mock, config)
														
 
															+	querier := newPrometheusMetricsQuerier(config, mock, contextFactory)
														
 
															+
														
 
															+	queryEnd := time.Now().UTC().Truncate(time.Hour).Add(time.Hour)
														
 
															+	queryStart := queryEnd.Add(-24 * time.Hour)
														
 
															+
														
 
															+	// capture clears the recorded log before issuing the query, so a query
														
 
															+	// that logs nothing cannot pass on output left behind by an earlier
														
 
															+	// subtest (several subtests share a metric and all share the filter).
														
 
															+	// NOTE(review): assumes SingleLogWriter.Log is a plain string field
														
 
															+	// holding the captured output; confirm against its definition.
														
 
															+	capture := func(query func(time.Time, time.Time)) string {
														
 
															+		logWriter.Log = ""
														
 
															+		query(queryStart, queryEnd)
														
 
															+		return logWriter.Log
														
 
															+	}
														
 
															+
														
 
															+	// Saturation queries: wantMetric must appear in the logged query, and
														
 
															+	// wantExtra too when it is non-empty.
														
 
															+	tests := map[string]struct {
														
 
															+		query      func(time.Time, time.Time)
														
 
															+		wantMetric string
														
 
															+		wantExtra  string
														
 
															+	}{
														
 
															+		"QueryGPUThrottleViolationRatio": {
														
 
															+			query:      func(s, e time.Time) { querier.QueryGPUThrottleViolationRatio(s, e) },
														
 
															+			wantMetric: "DCGM_FI_DEV_POWER_VIOLATION",
														
 
															+		},
														
 
															+		"QueryGPUThrottleReasonRatio": {
														
 
															+			query:      func(s, e time.Time) { querier.QueryGPUThrottleReasonRatio(s, e) },
														
 
															+			wantMetric: "DCGM_FI_DEV_CLOCK_THROTTLE_REASONS",
														
 
															+			wantExtra:  "DCGM_FI_DEV_CLOCKS_EVENT_REASONS",
														
 
															+		},
														
 
															+		"QueryGPUMemoryUsedRatioAvg": {
														
 
															+			query:      func(s, e time.Time) { querier.QueryGPUMemoryUsedRatioAvg(s, e) },
														
 
															+			wantMetric: "DCGM_FI_DEV_FB_USED",
														
 
															+			wantExtra:  "DCGM_FI_DEV_FB_FREE",
														
 
															+		},
														
 
															+		"QueryGPUMemoryUsedRatioMax": {
														
 
															+			query:      func(s, e time.Time) { querier.QueryGPUMemoryUsedRatioMax(s, e) },
														
 
															+			wantMetric: "DCGM_FI_DEV_FB_USED",
														
 
															+			wantExtra:  "max_over_time",
														
 
															+		},
														
 
															+		"QueryGPUMemoryPressureRatio": {
														
 
															+			query:      func(s, e time.Time) { querier.QueryGPUMemoryPressureRatio(s, e) },
														
 
															+			wantMetric: "DCGM_FI_DEV_FB_USED",
														
 
															+			wantExtra:  ">= bool 0.8",
														
 
															+		},
														
 
															+		"QueryGPUXIDErrorCount": {
														
 
															+			query:      func(s, e time.Time) { querier.QueryGPUXIDErrorCount(s, e) },
														
 
															+			wantMetric: "DCGM_FI_DEV_XID_ERRORS",
														
 
															+			wantExtra:  "changes(",
														
 
															+		},
														
 
															+		"QueryGPUDRAMActiveAvg": {
														
 
															+			query:      func(s, e time.Time) { querier.QueryGPUDRAMActiveAvg(s, e) },
														
 
															+			wantMetric: "DCGM_FI_PROF_DRAM_ACTIVE",
														
 
															+			wantExtra:  "avg_over_time",
														
 
															+		},
														
 
															+		"QueryGPUDRAMActiveMax": {
														
 
															+			query:      func(s, e time.Time) { querier.QueryGPUDRAMActiveMax(s, e) },
														
 
															+			wantMetric: "DCGM_FI_PROF_DRAM_ACTIVE",
														
 
															+			wantExtra:  "max_over_time",
														
 
															+		},
														
 
															+		"QueryGPUSMActiveAvg": {
														
 
															+			query:      func(s, e time.Time) { querier.QueryGPUSMActiveAvg(s, e) },
														
 
															+			wantMetric: "DCGM_FI_PROF_SM_ACTIVE",
														
 
															+		},
														
 
															+		"QueryGPUSMOccupancyAvg": {
														
 
															+			query:      func(s, e time.Time) { querier.QueryGPUSMOccupancyAvg(s, e) },
														
 
															+			wantMetric: "DCGM_FI_PROF_SM_OCCUPANCY",
														
 
															+		},
														
 
															+		"QueryGPUPCIeTxBytesAvg": {
														
 
															+			query:      func(s, e time.Time) { querier.QueryGPUPCIeTxBytesAvg(s, e) },
														
 
															+			wantMetric: "DCGM_FI_PROF_PCIE_TX_BYTES",
														
 
															+			wantExtra:  "rate(",
														
 
															+		},
														
 
															+		"QueryGPUPCIeRxBytesAvg": {
														
 
															+			query:      func(s, e time.Time) { querier.QueryGPUPCIeRxBytesAvg(s, e) },
														
 
															+			wantMetric: "DCGM_FI_PROF_PCIE_RX_BYTES",
														
 
															+		},
														
 
															+		"QueryGPUNVLinkTxBytesAvg": {
														
 
															+			query:      func(s, e time.Time) { querier.QueryGPUNVLinkTxBytesAvg(s, e) },
														
 
															+			wantMetric: "DCGM_FI_PROF_NVLINK_TX_BYTES",
														
 
															+		},
														
 
															+		"QueryGPUNVLinkRxBytesAvg": {
														
 
															+			query:      func(s, e time.Time) { querier.QueryGPUNVLinkRxBytesAvg(s, e) },
														
 
															+			wantMetric: "DCGM_FI_PROF_NVLINK_RX_BYTES",
														
 
															+		},
														
 
															+	}
														
 
															+
														
 
															+	// Device-level queries: only the metric, cluster filter and grouping
														
 
															+	// are checked for these.
														
 
															+	deviceTests := map[string]struct {
														
 
															+		query      func(time.Time, time.Time)
														
 
															+		wantMetric string
														
 
															+	}{
														
 
															+		"QueryGPUDevicePowerAvg":      {func(s, e time.Time) { querier.QueryGPUDevicePowerAvg(s, e) }, "DCGM_FI_DEV_POWER_USAGE"},
														
 
															+		"QueryGPUDeviceTempAvg":       {func(s, e time.Time) { querier.QueryGPUDeviceTempAvg(s, e) }, "DCGM_FI_DEV_GPU_TEMP"},
														
 
															+		"QueryGPUDeviceUsageAvg":      {func(s, e time.Time) { querier.QueryGPUDeviceUsageAvg(s, e) }, "DCGM_FI_PROF_GR_ENGINE_ACTIVE"},
														
 
															+		"QueryGPUDeviceUsageMax":      {func(s, e time.Time) { querier.QueryGPUDeviceUsageMax(s, e) }, "DCGM_FI_PROF_GR_ENGINE_ACTIVE"},
														
 
															+		"QueryGPUDeviceMemoryUsedAvg": {func(s, e time.Time) { querier.QueryGPUDeviceMemoryUsedAvg(s, e) }, "DCGM_FI_DEV_FB_USED"},
														
 
															+		"QueryGPUDeviceMemoryUsedMax": {func(s, e time.Time) { querier.QueryGPUDeviceMemoryUsedMax(s, e) }, "DCGM_FI_DEV_FB_USED"},
														
 
															+	}
														
 
															+
														
 
															+	// Both query families are expected to carry the same cluster filter,
														
 
															+	// built from the CLUSTER_ID value set above.
														
 
															+	const wantFilter = `cluster_id="test-cluster"`
														
 
															+
														
 
															+	for testName, tc := range deviceTests {
														
 
															+		t.Run(testName, func(t *testing.T) {
														
 
															+			logged := capture(tc.query)
														
 
															+
														
 
															+			if !strings.Contains(logged, tc.wantMetric) {
														
 
															+				t.Errorf("expected query to reference %q, got: %s", tc.wantMetric, logged)
														
 
															+			}
														
 
															+			if !strings.Contains(logged, wantFilter) {
														
 
															+				t.Errorf("expected query to contain cluster filter %q, got: %s", wantFilter, logged)
														
 
															+			}
														
 
															+			// device-level grouping: no container attribution
														
 
															+			if !strings.Contains(logged, gpuDeviceByLabels) || strings.Contains(logged, "container,") {
														
 
															+				t.Errorf("expected device-level grouping %q without container, got: %s", gpuDeviceByLabels, logged)
														
 
															+			}
														
 
															+		})
														
 
															+	}
														
 
															+
														
 
															+	for testName, tc := range tests {
														
 
															+		t.Run(testName, func(t *testing.T) {
														
 
															+			logged := capture(tc.query)
														
 
															+
														
 
															+			if !strings.Contains(logged, testName) {
														
 
															+				t.Errorf("expected log to contain query name %q, got: %s", testName, logged)
														
 
															+			}
														
 
															+			if !strings.Contains(logged, tc.wantMetric) {
														
 
															+				t.Errorf("expected query to reference %q, got: %s", tc.wantMetric, logged)
														
 
															+			}
														
 
															+			if tc.wantExtra != "" && !strings.Contains(logged, tc.wantExtra) {
														
 
															+				t.Errorf("expected query to contain %q, got: %s", tc.wantExtra, logged)
														
 
															+			}
														
 
															+			if !strings.Contains(logged, wantFilter) {
														
 
															+				t.Errorf("expected query to contain cluster filter %q, got: %s", wantFilter, logged)
														
 
															+			}
														
 
															+			if !strings.Contains(logged, gpuSaturationByLabels) {
														
 
															+				t.Errorf("expected query to group by %q, got: %s", gpuSaturationByLabels, logged)
														
 
															+			}
														
 
															+		})
														
 
															+	}
														
 
															+}