metricsquerier.go 137 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227722782279228022812282228322842285228622872288228922902291229222932294229522962297229822992300230123022303230423052306230723082309231023112312231323142315231623172318231923202321232223232324232523262327232823292330233123322333233423352336233723382339234023412342234323442345234623472348234923502351235223532354235523562357235823592360236123622363236423652366236723682369237023712372237323742375237623772378237923802381238223832384238523862387238823892390239123922393239423952396239723982399240024012402240324042405240624072408240924102411241224132414241524162417241824192420242124222423242424252426242724282429243024312432243324342435243624372438243924402441244224432444244524462447244824492450245124522453245424552456245724582459246024612462246324642465246624672468246924702471247224732474247524762477247824792480248124822483248424852486248724882489249024912492249324942495249624972498249925002501250225032504250525062507250825092510251125122513251425152516251725182519252025212522252325242525252625272528252925302531253225332534253525362537253825392540254125422543254425452546254725482549255025512552255325542555255625572558255925602561256225632564256525662567256825692570257125722573257425752576257725782579258025812582258325842585258625872588258925902591259225932594259525962597259825992600260126022603260426052606260726082609261026112612261326142615261626172618261926202621262226232624262526262627262826292630263126322633263426352636263726382639264026412642264326442645264626472648264926502651265226532654265526562657265826592660266126622663266426652666266726682669267026712672267326742675267626772678267926802681268226832684268526862687268826892690269126922693269426952696269726982699270027012702270327042705270627072708270927102711271227132714271527162717271827192720272127222723272427252726272727282729273027312732273327342735273627372738273927402741274227432744274527462747274827492750275127522753275427552756275727582759276027612762276327642765276627672768276927702771277227732774277527762777277827792780278127822783278427852786278727882789279027912792279327942795279627972798279928002801280228032804280528062807280828092810281128122813281428152816281728182819282028212822282328242825282628272828282928302831283228332834283528362837283828392840284128422843284428452846284728482849285028512852285328542855285628572858285928602861286228632864286528662867286828692870287128722873287428752876287728782879288028812882288328842885288628872888288928902891289228932894289528962897289828992900290129022903290429052906290729082909291029112912
  1. package prom
  2. import (
  3. "fmt"
  4. "time"
  5. "github.com/opencost/opencost/core/pkg/log"
  6. "github.com/opencost/opencost/core/pkg/source"
  7. "github.com/opencost/opencost/core/pkg/util/timeutil"
  8. prometheus "github.com/prometheus/client_golang/api"
  9. )
  10. //--------------------------------------------------------------------------
  11. // PrometheusMetricsQuerier
  12. //--------------------------------------------------------------------------
  13. // PrometheusMetricsQueryLogFormat is the log format used to log metric queries before being sent to the prometheus
  14. // instance
  15. const PrometheusMetricsQueryLogFormat = `[PrometheusMetricsQuerier][%s][At Time: %d]: %s`
  16. // PrometheusMetricsQuerier is the implementation of the data source's MetricsQuerier interface for Prometheus.
  17. type PrometheusMetricsQuerier struct {
  18. promConfig *OpenCostPrometheusConfig
  19. promClient prometheus.Client
  20. promContexts *ContextFactory
  21. }
  22. func newPrometheusMetricsQuerier(
  23. promConfig *OpenCostPrometheusConfig,
  24. promClient prometheus.Client,
  25. promContexts *ContextFactory,
  26. ) *PrometheusMetricsQuerier {
  27. return &PrometheusMetricsQuerier{
  28. promConfig: promConfig,
  29. promClient: promClient,
  30. promContexts: promContexts,
  31. }
  32. }
  33. func (pds *PrometheusMetricsQuerier) QueryPVPricePerGiBHour(start, end time.Time) *source.Future[source.PVPricePerGiBHourResult] {
  34. const queryName = "QueryPVPricePerGiBHour"
  35. const pvCostQuery = `avg(avg_over_time(pv_hourly_cost{%s}[%s])) by (%s, persistentvolume, volumename, uid, provider_id)`
  36. cfg := pds.promConfig
  37. durStr := timeutil.DurationString(end.Sub(start))
  38. if durStr == "" {
  39. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  40. }
  41. queryPVCost := fmt.Sprintf(pvCostQuery, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  42. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPVCost)
  43. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  44. return source.NewFuture(source.DecodePVPricePerGiBHourResult, ctx.QueryAtTime(queryPVCost, end))
  45. }
  46. func (pds *PrometheusMetricsQuerier) QueryPVUsedAverage(start, end time.Time) *source.Future[source.PVUsedAvgResult] {
  47. const queryName = "QueryPVUsedAverage"
  48. const pvUsedAverageQuery = `avg(avg_over_time(kubelet_volume_stats_used_bytes{%s}[%s])) by (%s, persistentvolumeclaim, namespace, uid)`
  49. cfg := pds.promConfig
  50. durStr := timeutil.DurationString(end.Sub(start))
  51. if durStr == "" {
  52. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  53. }
  54. queryPVUsedAvg := fmt.Sprintf(pvUsedAverageQuery, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  55. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPVUsedAvg)
  56. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  57. return source.NewFuture(source.DecodePVUsedAvgResult, ctx.QueryAtTime(queryPVUsedAvg, end))
  58. }
  59. func (pds *PrometheusMetricsQuerier) QueryPVUsedMax(start, end time.Time) *source.Future[source.PVUsedMaxResult] {
  60. const queryName = "QueryPVUsedMax"
  61. const pvUsedMaxQuery = `max(max_over_time(kubelet_volume_stats_used_bytes{%s}[%s])) by (%s, persistentvolumeclaim, namespace, uid)`
  62. cfg := pds.promConfig
  63. durStr := timeutil.DurationString(end.Sub(start))
  64. if durStr == "" {
  65. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  66. }
  67. queryPVUsedMax := fmt.Sprintf(pvUsedMaxQuery, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  68. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPVUsedMax)
  69. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  70. return source.NewFuture(source.DecodePVUsedMaxResult, ctx.QueryAtTime(queryPVUsedMax, end))
  71. }
  72. func (pds *PrometheusMetricsQuerier) QueryPVCUptime(start, end time.Time) *source.Future[source.UptimeResult] {
  73. const queryName = "QueryPVCUptime"
  74. const queryFmtPVCUptime = `avg(kube_persistentvolumeclaim_info{%s}) by (%s, uid)[%s:%dm]`
  75. cfg := pds.promConfig
  76. minsPerResolution := cfg.DataResolutionMinutes
  77. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  78. if durStr == "" {
  79. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  80. }
  81. queryPVCUptime := fmt.Sprintf(queryFmtPVCUptime, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  82. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPVCUptime)
  83. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  84. return source.NewFuture(source.DecodeUptimeResult, ctx.QueryAtTime(queryPVCUptime, end))
  85. }
  86. func (pds *PrometheusMetricsQuerier) QueryPVCInfo(start, end time.Time) *source.Future[source.PVCInfoResult] {
  87. const queryName = "QueryPVCInfo"
  88. const queryFmtPVCInfo = `avg(kube_persistentvolumeclaim_info{volumename != "", %s}) by (persistentvolumeclaim, storageclass, volumename, namespace, uid, %s)[%s:%dm]`
  89. cfg := pds.promConfig
  90. minsPerResolution := cfg.DataResolutionMinutes
  91. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  92. if durStr == "" {
  93. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  94. }
  95. queryPVCInfo := fmt.Sprintf(queryFmtPVCInfo, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  96. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPVCInfo)
  97. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  98. return source.NewFuture(source.DecodePVCInfoResult, ctx.QueryAtTime(queryPVCInfo, end))
  99. }
  100. func (pds *PrometheusMetricsQuerier) QueryKMPVCInfo(start, end time.Time) *source.Future[source.PVCInfoResult] {
  101. const queryName = "QueryKMPVCInfo"
  102. const queryFmt = `avg(avg_over_time(kube_persistentvolumeclaim_info{volumename != "", %s}[%s])) by (uid, namespace_uid, persistentvolumeclaim, namespace, storageclass, volumename, persistentvolume_uid, %s)`
  103. cfg := pds.promConfig
  104. durStr := timeutil.DurationString(end.Sub(start))
  105. if durStr == "" {
  106. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  107. }
  108. q := fmt.Sprintf(queryFmt, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  109. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), q)
  110. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  111. return source.NewFuture(source.DecodePVCInfoResult, ctx.QueryAtTime(q, end))
  112. }
  113. func (pds *PrometheusMetricsQuerier) QueryPVActiveMinutes(start, end time.Time) *source.Future[source.PVActiveMinutesResult] {
  114. const queryName = "QueryPVActiveMinutes"
  115. const pvActiveMinsQuery = `avg(kube_persistentvolume_capacity_bytes{%s}) by (%s, persistentvolume, uid)[%s:%dm]`
  116. cfg := pds.promConfig
  117. minsPerResolution := cfg.DataResolutionMinutes
  118. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  119. if durStr == "" {
  120. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  121. }
  122. queryPVActiveMins := fmt.Sprintf(pvActiveMinsQuery, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  123. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPVActiveMins)
  124. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  125. return source.NewFuture(source.DecodePVActiveMinutesResult, ctx.QueryAtTime(queryPVActiveMins, end))
  126. }
  127. func (pds *PrometheusMetricsQuerier) QueryLocalStorageUsedAvg(start, end time.Time) *source.Future[source.LocalStorageUsedAvgResult] {
  128. const queryName = "QueryLocalStorageUsedAvg"
  129. const localStorageUsedAvgQuery = `avg(sum(avg_over_time(container_fs_usage_bytes{device=~"/dev/(nvme|sda).*", id="/", %s}[%s])) by (instance, device, %s, job)) by (instance, device, %s)`
  130. cfg := pds.promConfig
  131. durStr := timeutil.DurationString(end.Sub(start))
  132. if durStr == "" {
  133. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  134. }
  135. queryLocalStorageUsedAvg := fmt.Sprintf(localStorageUsedAvgQuery, cfg.ClusterFilter, durStr, cfg.ClusterLabel, cfg.ClusterLabel)
  136. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryLocalStorageUsedAvg)
  137. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  138. return source.NewFuture(source.DecodeLocalStorageUsedAvgResult, ctx.QueryAtTime(queryLocalStorageUsedAvg, end))
  139. }
  140. func (pds *PrometheusMetricsQuerier) QueryLocalStorageUsedMax(start, end time.Time) *source.Future[source.LocalStorageUsedMaxResult] {
  141. const queryName = "QueryLocalStorageUsedMax"
  142. const localStorageUsedMaxQuery = `max(sum(max_over_time(container_fs_usage_bytes{device=~"/dev/(nvme|sda).*", id="/", %s}[%s])) by (instance, device, %s, job)) by (instance, device, %s)`
  143. cfg := pds.promConfig
  144. durStr := timeutil.DurationString(end.Sub(start))
  145. if durStr == "" {
  146. panic("failed to parse duration string passed to QueryLocalStorageUsedMax")
  147. }
  148. queryLocalStorageUsedMax := fmt.Sprintf(localStorageUsedMaxQuery, cfg.ClusterFilter, durStr, cfg.ClusterLabel, cfg.ClusterLabel)
  149. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryLocalStorageUsedMax)
  150. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  151. return source.NewFuture(source.DecodeLocalStorageUsedMaxResult, ctx.QueryAtTime(queryLocalStorageUsedMax, end))
  152. }
  153. func (pds *PrometheusMetricsQuerier) QueryLocalStorageBytes(start, end time.Time) *source.Future[source.LocalStorageBytesResult] {
  154. const queryName = "QueryLocalStorageBytes"
  155. const localStorageBytesQuery = `avg_over_time(sum(container_fs_limit_bytes{device=~"/dev/(nvme|sda).*", id="/", %s}) by (instance, device, %s)[%s:%dm])`
  156. cfg := pds.promConfig
  157. minsPerResolution := cfg.DataResolutionMinutes
  158. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  159. if durStr == "" {
  160. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  161. }
  162. queryLocalStorageBytes := fmt.Sprintf(localStorageBytesQuery, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  163. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryLocalStorageBytes)
  164. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  165. return source.NewFuture(source.DecodeLocalStorageBytesResult, ctx.QueryAtTime(queryLocalStorageBytes, end))
  166. }
  167. func (pds *PrometheusMetricsQuerier) QueryKMLocalStorageUsedAvg(start, end time.Time) *source.Future[source.NodeUIDValueResult] {
  168. const queryName = "QueryKMLocalStorageUsedAvg"
  169. const queryFmt = `avg(avg_over_time(container_fs_usage_bytes{%s}[%s])) by (node_uid, %s)`
  170. cfg := pds.promConfig
  171. durStr := timeutil.DurationString(end.Sub(start))
  172. if durStr == "" {
  173. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  174. }
  175. q := fmt.Sprintf(queryFmt, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  176. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), q)
  177. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  178. return source.NewFuture(source.DecodeNodeUIDValueResult, ctx.QueryAtTime(q, end))
  179. }
  180. func (pds *PrometheusMetricsQuerier) QueryKMLocalStorageUsedMax(start, end time.Time) *source.Future[source.NodeUIDValueResult] {
  181. const queryName = "QueryKMLocalStorageUsedMax"
  182. const queryFmt = `max(max_over_time(container_fs_usage_bytes{%s}[%s])) by (node_uid, %s)`
  183. cfg := pds.promConfig
  184. durStr := timeutil.DurationString(end.Sub(start))
  185. if durStr == "" {
  186. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  187. }
  188. q := fmt.Sprintf(queryFmt, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  189. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), q)
  190. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  191. return source.NewFuture(source.DecodeNodeUIDValueResult, ctx.QueryAtTime(q, end))
  192. }
  193. func (pds *PrometheusMetricsQuerier) QueryKMLocalStorageBytes(start, end time.Time) *source.Future[source.UIDValueResult] {
  194. const queryName = "QueryKMLocalStorageBytes"
  195. const queryFmt = `avg_over_time(node_fs_capacity_bytes{%s}[%s:%dm]) by (uid, %s)`
  196. cfg := pds.promConfig
  197. minsPerResolution := cfg.DataResolutionMinutes
  198. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  199. if durStr == "" {
  200. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  201. }
  202. q := fmt.Sprintf(queryFmt, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel)
  203. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), q)
  204. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  205. return source.NewFuture(source.DecodeUIDValueResult, ctx.QueryAtTime(q, end))
  206. }
  207. func (pds *PrometheusMetricsQuerier) QueryLocalStorageActiveMinutes(start, end time.Time) *source.Future[source.LocalStorageActiveMinutesResult] {
  208. const queryName = "QueryLocalStorageActiveMinutes"
  209. const localStorageActiveMinutesQuery = `count(node_total_hourly_cost{%s}) by (%s, node, uid, instance, provider_id)[%s:%dm]`
  210. cfg := pds.promConfig
  211. minsPerResolution := cfg.DataResolutionMinutes
  212. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  213. if durStr == "" {
  214. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  215. }
  216. queryLocalStorageActiveMins := fmt.Sprintf(localStorageActiveMinutesQuery, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  217. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryLocalStorageActiveMins)
  218. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  219. return source.NewFuture(source.DecodeLocalStorageActiveMinutesResult, ctx.QueryAtTime(queryLocalStorageActiveMins, end))
  220. }
  221. func (pds *PrometheusMetricsQuerier) QueryNodeInfo(start, end time.Time) *source.Future[source.NodeInfoResult] {
  222. const queryName = "QueryNodeInfo"
  223. const queryFmtNodeInfo = `avg(avg_over_time(node_info{%s}[%s])) by (%s, node, uid, provider_id, instance_type)`
  224. cfg := pds.promConfig
  225. durStr := timeutil.DurationString(end.Sub(start))
  226. if durStr == "" {
  227. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  228. }
  229. queryNodeInfo := fmt.Sprintf(queryFmtNodeInfo, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  230. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNodeInfo)
  231. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  232. return source.NewFuture(source.DecodeNodeInfoResult, ctx.QueryAtTime(queryNodeInfo, end))
  233. }
  234. func (pds *PrometheusMetricsQuerier) QueryNodeUptime(start, end time.Time) *source.Future[source.UptimeResult] {
  235. const queryName = "QueryNodeUptime"
  236. const queryFmtNodeUptime = `avg(node_info{%s}) by (%s, uid)[%s:%dm]`
  237. cfg := pds.promConfig
  238. minsPerResolution := cfg.DataResolutionMinutes
  239. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  240. if durStr == "" {
  241. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  242. }
  243. queryNodeUptime := fmt.Sprintf(queryFmtNodeUptime, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  244. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNodeUptime)
  245. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  246. return source.NewFuture(source.DecodeUptimeResult, ctx.QueryAtTime(queryNodeUptime, end))
  247. }
  248. func (pds *PrometheusMetricsQuerier) QueryNodeCPUCoresCapacity(start, end time.Time) *source.Future[source.NodeCPUCoresCapacityResult] {
  249. const queryName = "QueryNodeCPUCoresCapacity"
  250. const nodeCPUCoresCapacityQuery = `avg(avg_over_time(kube_node_status_capacity_cpu_cores{%s}[%s])) by (%s, node, uid)`
  251. cfg := pds.promConfig
  252. durStr := timeutil.DurationString(end.Sub(start))
  253. if durStr == "" {
  254. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  255. }
  256. queryNodeCPUCoresCapacity := fmt.Sprintf(nodeCPUCoresCapacityQuery, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  257. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNodeCPUCoresCapacity)
  258. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  259. return source.NewFuture(source.DecodeNodeCPUCoresCapacityResult, ctx.QueryAtTime(queryNodeCPUCoresCapacity, end))
  260. }
  261. func (pds *PrometheusMetricsQuerier) QueryNodeCPUCoresAllocatable(start, end time.Time) *source.Future[source.NodeCPUCoresAllocatableResult] {
  262. const queryName = "QueryNodeCPUCoresAllocatable"
  263. const nodeCPUCoresAllocatableQuery = `avg(avg_over_time(kube_node_status_allocatable_cpu_cores{%s}[%s])) by (%s, node, uid)`
  264. // `avg(avg_over_time(container_cpu_allocation{container!="", container!="POD", node!="", %s}[%s])) by (container, pod, namespace, node, %s)`
  265. cfg := pds.promConfig
  266. durStr := timeutil.DurationString(end.Sub(start))
  267. if durStr == "" {
  268. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  269. }
  270. queryNodeCPUCoresAllocatable := fmt.Sprintf(nodeCPUCoresAllocatableQuery, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  271. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNodeCPUCoresAllocatable)
  272. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  273. return source.NewFuture(source.DecodeNodeCPUCoresAllocatableResult, ctx.QueryAtTime(queryNodeCPUCoresAllocatable, end))
  274. }
  275. func (pds *PrometheusMetricsQuerier) QueryNodeRAMBytesCapacity(start, end time.Time) *source.Future[source.NodeRAMBytesCapacityResult] {
  276. const queryName = "QueryNodeRAMBytesCapacity"
  277. const nodeRAMBytesCapacityQuery = `avg(avg_over_time(kube_node_status_capacity_memory_bytes{%s}[%s])) by (%s, node, uid)`
  278. cfg := pds.promConfig
  279. durStr := timeutil.DurationString(end.Sub(start))
  280. if durStr == "" {
  281. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  282. }
  283. queryNodeRAMBytesCapacity := fmt.Sprintf(nodeRAMBytesCapacityQuery, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  284. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNodeRAMBytesCapacity)
  285. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  286. return source.NewFuture(source.DecodeNodeRAMBytesCapacityResult, ctx.QueryAtTime(queryNodeRAMBytesCapacity, end))
  287. }
  288. func (pds *PrometheusMetricsQuerier) QueryNodeRAMBytesAllocatable(start, end time.Time) *source.Future[source.NodeRAMBytesAllocatableResult] {
  289. const queryName = "QueryNodeRAMBytesAllocatable"
  290. const nodeRAMBytesAllocatableQuery = `avg(avg_over_time(kube_node_status_allocatable_memory_bytes{%s}[%s])) by (%s, node, uid)`
  291. cfg := pds.promConfig
  292. durStr := timeutil.DurationString(end.Sub(start))
  293. if durStr == "" {
  294. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  295. }
  296. queryNodeRAMBytesAllocatable := fmt.Sprintf(nodeRAMBytesAllocatableQuery, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  297. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNodeRAMBytesAllocatable)
  298. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  299. return source.NewFuture(source.DecodeNodeRAMBytesAllocatableResult, ctx.QueryAtTime(queryNodeRAMBytesAllocatable, end))
  300. }
  301. func (pds *PrometheusMetricsQuerier) QueryNodeGPUCount(start, end time.Time) *source.Future[source.NodeGPUCountResult] {
  302. const queryName = "QueryNodeGPUCount"
  303. const nodeGPUCountQuery = `avg(avg_over_time(node_gpu_count{%s}[%s])) by (%s, node, uid, provider_id)`
  304. cfg := pds.promConfig
  305. durStr := timeutil.DurationString(end.Sub(start))
  306. if durStr == "" {
  307. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  308. }
  309. queryNodeGPUCount := fmt.Sprintf(nodeGPUCountQuery, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  310. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNodeGPUCount)
  311. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  312. return source.NewFuture(source.DecodeNodeGPUCountResult, ctx.QueryAtTime(queryNodeGPUCount, end))
  313. }
  314. func (pds *PrometheusMetricsQuerier) QueryNodeLabels(start, end time.Time) *source.Future[source.NodeLabelsResult] {
  315. const queryName = "QueryNodeLabels"
  316. const labelsQuery = `avg_over_time(kube_node_labels{%s}[%s])`
  317. cfg := pds.promConfig
  318. durStr := timeutil.DurationString(end.Sub(start))
  319. if durStr == "" {
  320. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  321. }
  322. queryLabels := fmt.Sprintf(labelsQuery, cfg.ClusterFilter, durStr)
  323. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryLabels)
  324. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  325. return source.NewFuture(source.DecodeNodeLabelsResult, ctx.QueryAtTime(queryLabels, end))
  326. }
  327. func (pds *PrometheusMetricsQuerier) QueryNodeActiveMinutes(start, end time.Time) *source.Future[source.NodeActiveMinutesResult] {
  328. const queryName = "QueryNodeActiveMinutes"
  329. const activeMinsQuery = `avg(node_total_hourly_cost{%s}) by (node, uid, %s, provider_id)[%s:%dm]`
  330. cfg := pds.promConfig
  331. minsPerResolution := cfg.DataResolutionMinutes
  332. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  333. if durStr == "" {
  334. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  335. }
  336. queryActiveMins := fmt.Sprintf(activeMinsQuery, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  337. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryActiveMins)
  338. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  339. return source.NewFuture(source.DecodeNodeActiveMinutesResult, ctx.QueryAtTime(queryActiveMins, end))
  340. }
  341. func (pds *PrometheusMetricsQuerier) QueryNodeCPUModeTotal(start, end time.Time) *source.Future[source.NodeCPUModeTotalResult] {
  342. const queryName = "QueryNodeCPUModeTotal"
  343. const nodeCPUModeTotalQuery = `sum(rate(node_cpu_seconds_total{%s}[%s:%dm])) by (kubernetes_node, uid, %s, mode)`
  344. cfg := pds.promConfig
  345. minsPerResolution := cfg.DataResolutionMinutes
  346. durStr := pds.durationStringFor(start, end, minsPerResolution, true)
  347. if durStr == "" {
  348. panic("failed to parse duration string passed to QueryNodeCPUModeTotal")
  349. }
  350. queryCPUModeTotal := fmt.Sprintf(nodeCPUModeTotalQuery, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel)
  351. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryCPUModeTotal)
  352. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  353. return source.NewFuture(source.DecodeNodeCPUModeTotalResult, ctx.QueryAtTime(queryCPUModeTotal, end))
  354. }
  355. func (pds *PrometheusMetricsQuerier) QueryNodeRAMSystemPercent(start, end time.Time) *source.Future[source.NodeRAMSystemPercentResult] {
  356. const queryName = "QueryNodeRAMSystemPercent"
  357. const nodeRAMSystemPctQuery = `sum(sum_over_time(container_memory_working_set_bytes{container_name!="POD",container_name!="",namespace="kube-system", %s}[%s:%dm])) by (instance, uid, %s) / avg(label_replace(sum(sum_over_time(kube_node_status_capacity_memory_bytes{%s}[%s:%dm])) by (node, uid, %s), "instance", "$1", "node", "(.*)")) by (instance, uid, %s)`
  358. cfg := pds.promConfig
  359. minsPerResolution := cfg.DataResolutionMinutes
  360. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  361. if durStr == "" {
  362. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  363. }
  364. queryRAMSystemPct := fmt.Sprintf(nodeRAMSystemPctQuery, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel, cfg.ClusterLabel)
  365. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryRAMSystemPct)
  366. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  367. return source.NewFuture(source.DecodeNodeRAMSystemPercentResult, ctx.QueryAtTime(queryRAMSystemPct, end))
  368. }
  369. func (pds *PrometheusMetricsQuerier) QueryNodeRAMUserPercent(start, end time.Time) *source.Future[source.NodeRAMUserPercentResult] {
  370. const queryName = "QueryNodeRAMUserPercent"
  371. const nodeRAMUserPctQuery = `sum(sum_over_time(container_memory_working_set_bytes{container_name!="POD",container_name!="",namespace!="kube-system", %s}[%s:%dm])) by (instance, uid, %s) / avg(label_replace(sum(sum_over_time(kube_node_status_capacity_memory_bytes{%s}[%s:%dm])) by (node, uid, %s), "instance", "$1", "node", "(.*)")) by (instance, uid, %s)`
  372. cfg := pds.promConfig
  373. minsPerResolution := cfg.DataResolutionMinutes
  374. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  375. if durStr == "" {
  376. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  377. }
  378. queryRAMUserPct := fmt.Sprintf(nodeRAMUserPctQuery, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel, cfg.ClusterLabel)
  379. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryRAMUserPct)
  380. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  381. return source.NewFuture(source.DecodeNodeRAMUserPercentResult, ctx.QueryAtTime(queryRAMUserPct, end))
  382. }
  383. func (pds *PrometheusMetricsQuerier) QueryNodeResourceCapacities(start, end time.Time) *source.Future[source.ResourceResult] {
  384. const queryName = "QueryNodeResourceCapacities"
  385. const queryFmtNodeResourceCapacities = `avg(avg_over_time(kube_node_status_capacity{%s}[%s])) by (%s, node, uid, resource, unit)`
  386. cfg := pds.promConfig
  387. durStr := timeutil.DurationString(end.Sub(start))
  388. if durStr == "" {
  389. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  390. }
  391. queryNodeResourceCapacities := fmt.Sprintf(queryFmtNodeResourceCapacities, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  392. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNodeResourceCapacities)
  393. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  394. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryNodeResourceCapacities, end))
  395. }
  396. func (pds *PrometheusMetricsQuerier) QueryNodeResourcesAllocatable(start, end time.Time) *source.Future[source.ResourceResult] {
  397. const queryName = "QueryNodeResourcesAllocatable"
  398. const queryFmtNodeResourcesAllocatable = `avg(avg_over_time(kube_node_status_allocatable{%s}[%s])) by (%s, node, uid, resource, unit)`
  399. cfg := pds.promConfig
  400. durStr := timeutil.DurationString(end.Sub(start))
  401. if durStr == "" {
  402. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  403. }
  404. queryNodeResourcesAllocatable := fmt.Sprintf(queryFmtNodeResourcesAllocatable, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  405. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNodeResourcesAllocatable)
  406. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  407. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryNodeResourcesAllocatable, end))
  408. }
  409. func (pds *PrometheusMetricsQuerier) QueryLBPricePerHr(start, end time.Time) *source.Future[source.LBPricePerHrResult] {
  410. const queryName = "QueryLBPricePerHr"
  411. const queryFmtLBCostPerHr = `avg(avg_over_time(kubecost_load_balancer_cost{%s}[%s])) by (namespace, service_name, ingress_ip, uid, %s)`
  412. cfg := pds.promConfig
  413. durStr := timeutil.DurationString(end.Sub(start))
  414. if durStr == "" {
  415. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  416. }
  417. queryLBCostPerHr := fmt.Sprintf(queryFmtLBCostPerHr, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  418. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryLBCostPerHr)
  419. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  420. return source.NewFuture(source.DecodeLBPricePerHrResult, ctx.QueryAtTime(queryLBCostPerHr, end))
  421. }
  422. func (pds *PrometheusMetricsQuerier) QueryLBActiveMinutes(start, end time.Time) *source.Future[source.LBActiveMinutesResult] {
  423. const queryName = "QueryLBActiveMinutes"
  424. const lbActiveMinutesQuery = `avg(kubecost_load_balancer_cost{%s}) by (namespace, service_name, uid, %s, ingress_ip)[%s:%dm]`
  425. cfg := pds.promConfig
  426. minsPerResolution := cfg.DataResolutionMinutes
  427. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  428. if durStr == "" {
  429. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  430. }
  431. queryLBActiveMins := fmt.Sprintf(lbActiveMinutesQuery, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  432. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryLBActiveMins)
  433. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  434. return source.NewFuture(source.DecodeLBActiveMinutesResult, ctx.QueryAtTime(queryLBActiveMins, end))
  435. }
  436. func (pds *PrometheusMetricsQuerier) QueryClusterInfo(start, end time.Time) *source.Future[source.ClusterInfoResult] {
  437. const queryName = "QueryClusterInfo"
  438. const queryFmtClusterInfo = `avg(avg_over_time(cluster_info{%s}[%s])) by (%s, uid, provider, account_id, provisioner_name, region)`
  439. cfg := pds.promConfig
  440. durStr := timeutil.DurationString(end.Sub(start))
  441. if durStr == "" {
  442. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  443. }
  444. queryClusterInfo := fmt.Sprintf(queryFmtClusterInfo, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  445. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryClusterInfo)
  446. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  447. return source.NewFuture(source.DecodeClusterInfoResult, ctx.QueryAtTime(queryClusterInfo, end))
  448. }
  449. func (pds *PrometheusMetricsQuerier) QueryClusterUptime(start, end time.Time) *source.Future[source.UptimeResult] {
  450. const queryName = "QueryClusterUptime"
  451. const queryFmtClusterUptime = `avg(cluster_info{%s}) by (%s, uid)[%s:%dm]`
  452. cfg := pds.promConfig
  453. minsPerResolution := cfg.DataResolutionMinutes
  454. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  455. if durStr == "" {
  456. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  457. }
  458. queryClusterUptime := fmt.Sprintf(queryFmtClusterUptime, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  459. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryFmtClusterUptime)
  460. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  461. return source.NewFuture(source.DecodeUptimeResult, ctx.QueryAtTime(queryClusterUptime, end))
  462. }
  463. func (pds *PrometheusMetricsQuerier) QueryClusterManagementDuration(start, end time.Time) *source.Future[source.ClusterManagementDurationResult] {
  464. const queryName = "QueryClusterManagementDuration"
  465. const clusterManagementDurationQuery = `avg(kubecost_cluster_management_cost{%s}) by (%s, provisioner_name)[%s:%dm]`
  466. cfg := pds.promConfig
  467. minsPerResolution := cfg.DataResolutionMinutes
  468. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  469. if durStr == "" {
  470. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  471. }
  472. queryClusterManagementDuration := fmt.Sprintf(clusterManagementDurationQuery, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  473. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryClusterManagementDuration)
  474. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  475. return source.NewFuture(source.DecodeClusterManagementDurationResult, ctx.QueryAtTime(queryClusterManagementDuration, end))
  476. }
  477. func (pds *PrometheusMetricsQuerier) QueryClusterManagementPricePerHr(start, end time.Time) *source.Future[source.ClusterManagementPricePerHrResult] {
  478. const queryName = "QueryClusterManagementPricePerHr"
  479. const clusterManagementCostQuery = `avg(avg_over_time(kubecost_cluster_management_cost{%s}[%s])) by (%s, provisioner_name)`
  480. cfg := pds.promConfig
  481. durStr := timeutil.DurationString(end.Sub(start))
  482. if durStr == "" {
  483. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  484. }
  485. queryClusterManagementCost := fmt.Sprintf(clusterManagementCostQuery, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  486. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryClusterManagementCost)
  487. ctx := pds.promContexts.NewNamedContext(ClusterContextName)
  488. return source.NewFuture(source.DecodeClusterManagementPricePerHrResult, ctx.QueryAtTime(queryClusterManagementCost, end))
  489. }
  490. // AllocationMetricQuerier
  491. func (pds *PrometheusMetricsQuerier) QueryPods(start, end time.Time) *source.Future[source.PodsResult] {
  492. const queryName = "QueryPods"
  493. const queryFmtPods = `avg(kube_pod_container_status_running{%s} != 0) by (pod, namespace, uid, %s)[%s:%dm]`
  494. cfg := pds.promConfig
  495. minsPerResolution := cfg.DataResolutionMinutes
  496. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  497. if durStr == "" {
  498. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  499. }
  500. queryPods := fmt.Sprintf(queryFmtPods, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  501. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPods)
  502. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  503. return source.NewFuture(source.DecodePodsResult, ctx.QueryAtTime(queryPods, end))
  504. }
  505. func (pds *PrometheusMetricsQuerier) QueryPodsUID(start, end time.Time) *source.Future[source.PodsResult] {
  506. const queryName = "QueryPodsUID"
  507. const queryFmtPodsUID = `avg(kube_pod_container_status_running{%s} != 0) by (pod, namespace, uid, %s)[%s:%dm]`
  508. cfg := pds.promConfig
  509. minsPerResolution := cfg.DataResolutionMinutes
  510. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  511. if durStr == "" {
  512. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  513. }
  514. queryPodsUID := fmt.Sprintf(queryFmtPodsUID, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  515. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPodsUID)
  516. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  517. return source.NewFuture(source.DecodePodsResult, ctx.QueryAtTime(queryPodsUID, end))
  518. }
  519. func (pds *PrometheusMetricsQuerier) QueryPodInfo(start, end time.Time) *source.Future[source.PodInfoResult] {
  520. const queryName = "QueryPodInfo"
  521. const queryFmtPodInfo = `avg(avg_over_time(pod_info{%s}[%s])) by (%s, pod, uid, namespace_uid, node_uid)`
  522. cfg := pds.promConfig
  523. durStr := timeutil.DurationString(end.Sub(start))
  524. if durStr == "" {
  525. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  526. }
  527. queryPodInfo := fmt.Sprintf(queryFmtPodInfo, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  528. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPodInfo)
  529. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  530. return source.NewFuture(source.DecodePodInfoResult, ctx.QueryAtTime(queryPodInfo, end))
  531. }
  532. func (pds *PrometheusMetricsQuerier) QueryPodUptime(start, end time.Time) *source.Future[source.UptimeResult] {
  533. const queryName = "QueryPodUptime"
  534. const queryFmtPodUptime = `avg(pod_info{%s}) by (%s, uid)[%s:%dm]`
  535. cfg := pds.promConfig
  536. minsPerResolution := cfg.DataResolutionMinutes
  537. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  538. if durStr == "" {
  539. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  540. }
  541. queryPodUptime := fmt.Sprintf(queryFmtPodUptime, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  542. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPodUptime)
  543. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  544. return source.NewFuture(source.DecodeUptimeResult, ctx.QueryAtTime(queryPodUptime, end))
  545. }
  546. func (pds *PrometheusMetricsQuerier) QueryPodOwners(start, end time.Time) *source.Future[source.OwnerResult] {
  547. const queryName = "QueryPodOwners"
  548. const queryFmtPodOwners = `avg(avg_over_time(kube_pod_owner{%s}[%s])) by (%s, uid, owner_uid, owner_kind)`
  549. cfg := pds.promConfig
  550. durStr := timeutil.DurationString(end.Sub(start))
  551. if durStr == "" {
  552. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  553. }
  554. queryPodOwners := fmt.Sprintf(queryFmtPodOwners, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  555. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPodOwners)
  556. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  557. return source.NewFuture(source.DecodeOwnerResult, ctx.QueryAtTime(queryPodOwners, end))
  558. }
  559. func (pds *PrometheusMetricsQuerier) QueryPodPVCVolumes(start, end time.Time) *source.Future[source.PodPVCVolumeResult] {
  560. const queryName = "QueryPodPVCVolumes"
  561. const queryFmtPodPVCVolumes = `avg(avg_over_time(pod_pvc_volume{%s}[%s])) by (%s, uid, persistentvolumeclaim_uid, pod_volume_name)`
  562. cfg := pds.promConfig
  563. durStr := timeutil.DurationString(end.Sub(start))
  564. if durStr == "" {
  565. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  566. }
  567. queryPodPVCVolumes := fmt.Sprintf(queryFmtPodPVCVolumes, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  568. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPodPVCVolumes)
  569. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  570. return source.NewFuture(source.DecodePodPVCVolumeResult, ctx.QueryAtTime(queryPodPVCVolumes, end))
  571. }
  572. func (pds *PrometheusMetricsQuerier) QueryPodNetworkEgressBytes(start, end time.Time) *source.Future[source.PodNetworkBytesResult] {
  573. const queryName = "QueryPodNetworkEgressBytes"
  574. const queryFmt = `sum(increase(kubecost_pod_network_egress_bytes_total{uid!="", %s}[%s:%dm])) by (uid, service, internet, same_region, same_zone, nat_gateway, %s)`
  575. cfg := pds.promConfig
  576. minsPerResolution := cfg.DataResolutionMinutes
  577. durStr := pds.durationStringFor(start, end, minsPerResolution, true)
  578. if durStr == "" {
  579. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  580. }
  581. q := fmt.Sprintf(queryFmt, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel)
  582. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), q)
  583. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  584. return source.NewFuture(source.DecodePodNetworkBytesResult, ctx.QueryAtTime(q, end))
  585. }
  586. func (pds *PrometheusMetricsQuerier) QueryPodNetworkIngressBytes(start, end time.Time) *source.Future[source.PodNetworkBytesResult] {
  587. const queryName = "QueryPodNetworkIngressBytes"
  588. const queryFmt = `sum(increase(kubecost_pod_network_ingress_bytes_total{uid!="", %s}[%s:%dm])) by (uid, service, internet, same_region, same_zone, nat_gateway, %s)`
  589. cfg := pds.promConfig
  590. minsPerResolution := cfg.DataResolutionMinutes
  591. durStr := pds.durationStringFor(start, end, minsPerResolution, true)
  592. if durStr == "" {
  593. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  594. }
  595. q := fmt.Sprintf(queryFmt, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel)
  596. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), q)
  597. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  598. return source.NewFuture(source.DecodePodNetworkBytesResult, ctx.QueryAtTime(q, end))
  599. }
  600. func (pds *PrometheusMetricsQuerier) QueryContainerUptime(start, end time.Time) *source.Future[source.ContainerUptimeResult] {
  601. const queryName = "QueryContainerUptime"
  602. const queryFmtContainerUptime = `avg(kube_pod_container_status_running{container!="", %s} != 0) by (container, uid, %s)[%s:%dm]`
  603. cfg := pds.promConfig
  604. minsPerResolution := cfg.DataResolutionMinutes
  605. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  606. if durStr == "" {
  607. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  608. }
  609. queryContainerUptime := fmt.Sprintf(queryFmtContainerUptime, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  610. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryContainerUptime)
  611. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  612. return source.NewFuture(source.DecodeContainerUptimeResult, ctx.QueryAtTime(queryContainerUptime, end))
  613. }
  614. func (pds *PrometheusMetricsQuerier) QueryContainerResourceRequests(start, end time.Time) *source.Future[source.ContainerResourceResult] {
  615. const queryName = "QueryContainerResourceRequests"
  616. const queryFmtContainerResourceRequests = `avg(avg_over_time(kube_pod_container_resource_requests{container!="", container!="POD", node!="", %s}[%s])) by (container, uid, resource, unit, %s)`
  617. cfg := pds.promConfig
  618. durStr := timeutil.DurationString(end.Sub(start))
  619. if durStr == "" {
  620. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  621. }
  622. queryContainerResourceRequests := fmt.Sprintf(queryFmtContainerResourceRequests, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  623. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryContainerResourceRequests)
  624. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  625. return source.NewFuture(source.DecodeContainerResourceResult, ctx.QueryAtTime(queryContainerResourceRequests, end))
  626. }
  627. func (pds *PrometheusMetricsQuerier) QueryContainerResourceLimits(start, end time.Time) *source.Future[source.ContainerResourceResult] {
  628. const queryName = "QueryContainerResourceLimits"
  629. const queryFmtContainerResourceLimits = `avg(avg_over_time(kube_pod_container_resource_limits{container!="", container!="POD", node!="", %s}[%s])) by (container, uid, resource, unit, %s)`
  630. cfg := pds.promConfig
  631. durStr := timeutil.DurationString(end.Sub(start))
  632. if durStr == "" {
  633. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  634. }
  635. queryContainerResourceLimits := fmt.Sprintf(queryFmtContainerResourceLimits, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  636. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryContainerResourceLimits)
  637. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  638. return source.NewFuture(source.DecodeContainerResourceResult, ctx.QueryAtTime(queryContainerResourceLimits, end))
  639. }
  640. func (pds *PrometheusMetricsQuerier) QueryRAMBytesAllocated(start, end time.Time) *source.Future[source.RAMBytesAllocatedResult] {
  641. const queryName = "QueryRAMBytesAllocated"
  642. const queryFmtRAMBytesAllocated = `avg(avg_over_time(container_memory_allocation_bytes{container!="", container!="POD", node!="", %s}[%s])) by (container, pod, namespace, node, uid, %s, provider_id)`
  643. cfg := pds.promConfig
  644. durStr := timeutil.DurationString(end.Sub(start))
  645. if durStr == "" {
  646. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  647. }
  648. queryRAMBytesAllocated := fmt.Sprintf(queryFmtRAMBytesAllocated, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  649. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryRAMBytesAllocated)
  650. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  651. return source.NewFuture(source.DecodeRAMBytesAllocatedResult, ctx.QueryAtTime(queryRAMBytesAllocated, end))
  652. }
  653. func (pds *PrometheusMetricsQuerier) QueryRAMRequests(start, end time.Time) *source.Future[source.RAMRequestsResult] {
  654. const queryName = "QueryRAMRequests"
  655. const queryFmtRAMRequests = `avg(avg_over_time(kube_pod_container_resource_requests{resource="memory", unit="byte", container!="", container!="POD", node!="", %s}[%s])) by (container, pod, namespace, node, uid, %s)`
  656. cfg := pds.promConfig
  657. durStr := timeutil.DurationString(end.Sub(start))
  658. if durStr == "" {
  659. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  660. }
  661. queryRAMRequests := fmt.Sprintf(queryFmtRAMRequests, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  662. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryRAMRequests)
  663. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  664. return source.NewFuture(source.DecodeRAMRequestsResult, ctx.QueryAtTime(queryRAMRequests, end))
  665. }
  666. func (pds *PrometheusMetricsQuerier) QueryRAMLimits(start, end time.Time) *source.Future[source.RAMLimitsResult] {
  667. const queryName = "QueryRAMLimits"
  668. const queryFmtRAMLimits = `avg(avg_over_time(kube_pod_container_resource_limits{resource="memory", unit="byte", container!="", container!="POD", node!="", %s}[%s])) by (container, pod, namespace, node, %s)`
  669. cfg := pds.promConfig
  670. durStr := timeutil.DurationString(end.Sub(start))
  671. if durStr == "" {
  672. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  673. }
  674. queryRAMLimits := fmt.Sprintf(queryFmtRAMLimits, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  675. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryRAMLimits)
  676. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  677. return source.NewFuture(source.DecodeRAMLimitsResult, ctx.QueryAtTime(queryRAMLimits, end))
  678. }
  679. func (pds *PrometheusMetricsQuerier) QueryRAMUsageAvg(start, end time.Time) *source.Future[source.RAMUsageAvgResult] {
  680. const queryName = "QueryRAMUsageAvg"
  681. const queryFmtRAMUsageAvg = `avg(avg_over_time(container_memory_working_set_bytes{container!="", container_name!="POD", container!="POD", %s}[%s])) by (container_name, container, pod_name, pod, namespace, node, instance, uid, %s)`
  682. cfg := pds.promConfig
  683. durStr := timeutil.DurationString(end.Sub(start))
  684. if durStr == "" {
  685. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  686. }
  687. queryRAMUsageAvg := fmt.Sprintf(queryFmtRAMUsageAvg, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  688. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryRAMUsageAvg)
  689. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  690. return source.NewFuture(source.DecodeRAMUsageAvgResult, ctx.QueryAtTime(queryRAMUsageAvg, end))
  691. }
  692. func (pds *PrometheusMetricsQuerier) QueryRAMUsageMax(start, end time.Time) *source.Future[source.RAMUsageMaxResult] {
  693. const queryName = "QueryRAMUsageMax"
  694. const queryFmtRAMUsageMax = `max(max_over_time(container_memory_working_set_bytes{container!="", container_name!="POD", container!="POD", %s}[%s])) by (container_name, container, pod_name, pod, namespace, node, instance, uid, %s)`
  695. cfg := pds.promConfig
  696. durStr := timeutil.DurationString(end.Sub(start))
  697. if durStr == "" {
  698. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  699. }
  700. queryRAMUsageMax := fmt.Sprintf(queryFmtRAMUsageMax, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  701. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryRAMUsageMax)
  702. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  703. return source.NewFuture(source.DecodeRAMUsageMaxResult, ctx.QueryAtTime(queryRAMUsageMax, end))
  704. }
  705. func (pds *PrometheusMetricsQuerier) QueryCPUCoresAllocated(start, end time.Time) *source.Future[source.CPUCoresAllocatedResult] {
  706. const queryName = "QueryCPUCoresAllocated"
  707. const queryFmtCPUCoresAllocated = `avg(avg_over_time(container_cpu_allocation{container!="", container!="POD", node!="", %s}[%s])) by (container, pod, namespace, node, uid, %s)`
  708. cfg := pds.promConfig
  709. durStr := timeutil.DurationString(end.Sub(start))
  710. if durStr == "" {
  711. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  712. }
  713. queryCPUCoresAllocated := fmt.Sprintf(queryFmtCPUCoresAllocated, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  714. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryCPUCoresAllocated)
  715. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  716. return source.NewFuture(source.DecodeCPUCoresAllocatedResult, ctx.QueryAtTime(queryCPUCoresAllocated, end))
  717. }
  718. func (pds *PrometheusMetricsQuerier) QueryCPURequests(start, end time.Time) *source.Future[source.CPURequestsResult] {
  719. const queryName = "QueryCPURequests"
  720. const queryFmtCPURequests = `avg(avg_over_time(kube_pod_container_resource_requests{resource="cpu", unit="core", container!="", container!="POD", node!="", %s}[%s])) by (container, pod, namespace, node, uid, %s)`
  721. cfg := pds.promConfig
  722. durStr := timeutil.DurationString(end.Sub(start))
  723. if durStr == "" {
  724. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  725. }
  726. queryCPURequests := fmt.Sprintf(queryFmtCPURequests, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  727. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryCPURequests)
  728. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  729. return source.NewFuture(source.DecodeCPURequestsResult, ctx.QueryAtTime(queryCPURequests, end))
  730. }
  731. func (pds *PrometheusMetricsQuerier) QueryCPULimits(start, end time.Time) *source.Future[source.CPULimitsResult] {
  732. const queryName = "QueryCPULimits"
  733. const queryFmtCPULimits = `avg(avg_over_time(kube_pod_container_resource_limits{resource="cpu", unit="core", container!="", container!="POD", node!="", %s}[%s])) by (container, pod, namespace, node, %s)`
  734. cfg := pds.promConfig
  735. durStr := timeutil.DurationString(end.Sub(start))
  736. if durStr == "" {
  737. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  738. }
  739. queryCPULimits := fmt.Sprintf(queryFmtCPULimits, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  740. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryCPULimits)
  741. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  742. return source.NewFuture(source.DecodeCPULimitsResult, ctx.QueryAtTime(queryCPULimits, end))
  743. }
  744. func (pds *PrometheusMetricsQuerier) QueryCPUUsageAvg(start, end time.Time) *source.Future[source.CPUUsageAvgResult] {
  745. const queryName = "QueryCPUUsageAvg"
  746. const queryFmtCPUUsageAvg = `avg(rate(container_cpu_usage_seconds_total{container!="", container_name!="POD", container!="POD", %s}[%s])) by (container_name, container, pod_name, pod, namespace, node, instance, uid, %s)`
  747. cfg := pds.promConfig
  748. durStr := timeutil.DurationString(end.Sub(start))
  749. if durStr == "" {
  750. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  751. }
  752. queryCPUUsageAvg := fmt.Sprintf(queryFmtCPUUsageAvg, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  753. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryCPUUsageAvg)
  754. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  755. return source.NewFuture(source.DecodeCPUUsageAvgResult, ctx.QueryAtTime(queryCPUUsageAvg, end))
  756. }
  757. func (pds *PrometheusMetricsQuerier) QueryCPUUsageMax(start, end time.Time) *source.Future[source.CPUUsageMaxResult] {
  758. const queryName = "QueryCPUUsageMax"
  759. // Because we use container_cpu_usage_seconds_total to calculate CPU usage
  760. // at any given "instant" of time, we need to use an irate or rate. To then
  761. // calculate a max (or any aggregation) we have to perform an aggregation
  762. // query on top of an instant-by-instant maximum. Prometheus supports this
  763. // type of query with a "subquery" [1], however it is reportedly expensive
  764. // to make such a query. By default, Kubecost's Prometheus config includes
  765. // a recording rule that keeps track of the instant-by-instant irate for CPU
  766. // usage. The metric in this query is created by that recording rule.
  767. //
  768. // [1] https://prometheus.io/blog/2019/01/28/subquery-support/
  769. //
  770. // If changing the name of the recording rule, make sure to update the
  771. // corresponding diagnostic query to avoid confusion.
  772. const queryFmtCPUUsageMaxRecordingRule = `max(max_over_time(kubecost_container_cpu_usage_irate{%s}[%s])) by (container_name, container, pod_name, pod, namespace, node, instance, uid, %s)`
  773. // This is the subquery equivalent of the above recording rule query. It is
  774. // more expensive, but does not require the recording rule. It should be
  775. // used as a fallback query if the recording rule data does not exist.
  776. //
  777. // The parameter after the colon [:<thisone>] in the subquery affects the
  778. // resolution of the subquery.
  779. // The parameter after the metric ...{}[<thisone>] should be set to 2x
  780. // the resolution, to make sure the irate always has two points to query
  781. // in case the Prom scrape duration has been reduced to be equal to the
  782. // query resolution.
  783. const queryFmtCPUUsageMaxSubquery = `max(max_over_time(irate(container_cpu_usage_seconds_total{container!="POD", container!="", %s}[%dm])[%s:%dm])) by (container, pod_name, pod, namespace, node, instance, uid, %s)`
  784. cfg := pds.promConfig
  785. durStr := timeutil.DurationString(end.Sub(start))
  786. if durStr == "" {
  787. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  788. }
  789. queryCPUUsageMaxRecordingRule := fmt.Sprintf(queryFmtCPUUsageMaxRecordingRule, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  790. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryCPUUsageMaxRecordingRule)
  791. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  792. resCPUUsageMaxRR := ctx.QueryAtTime(queryCPUUsageMaxRecordingRule, end)
  793. resCPUUsageMax, _ := resCPUUsageMaxRR.Await()
  794. if len(resCPUUsageMax) > 0 {
  795. return source.NewFutureFrom(source.DecodeAll(resCPUUsageMax, source.DecodeCPUUsageMaxResult))
  796. }
  797. minsPerResolution := cfg.DataResolutionMinutes
  798. durStr = pds.durationStringFor(start, end, minsPerResolution, false)
  799. if durStr == "" {
  800. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  801. }
  802. queryCPUUsageMaxSubquery := fmt.Sprintf(queryFmtCPUUsageMaxSubquery, cfg.ClusterFilter, 2*minsPerResolution, durStr, minsPerResolution, cfg.ClusterLabel)
  803. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryCPUUsageMaxSubquery)
  804. return source.NewFuture(source.DecodeCPUUsageMaxResult, ctx.QueryAtTime(queryCPUUsageMaxSubquery, end))
  805. }
  806. func (pds *PrometheusMetricsQuerier) QueryGPUsRequested(start, end time.Time) *source.Future[source.GPUsRequestedResult] {
  807. const queryName = "QueryGPUsRequested"
  808. const queryFmtGPUsRequested = `avg(avg_over_time(kube_pod_container_resource_requests{resource="nvidia_com_gpu", container!="",container!="POD", node!="", %s}[%s])) by (container, pod, namespace, node, uid, %s)`
  809. cfg := pds.promConfig
  810. durStr := timeutil.DurationString(end.Sub(start))
  811. if durStr == "" {
  812. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  813. }
  814. queryGPUsRequested := fmt.Sprintf(queryFmtGPUsRequested, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  815. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryGPUsRequested)
  816. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  817. return source.NewFuture(source.DecodeGPUsRequestedResult, ctx.QueryAtTime(queryGPUsRequested, end))
  818. }
  819. func (pds *PrometheusMetricsQuerier) QueryGPUsUsageAvg(start, end time.Time) *source.Future[source.GPUsUsageAvgResult] {
  820. const queryName = "QueryGPUsUsageAvg"
  821. const queryFmtGPUsUsageAvg = `avg(avg_over_time(DCGM_FI_PROF_GR_ENGINE_ACTIVE{container!=""}[%s])) by (container, pod, namespace, pod_uid, %s)`
  822. cfg := pds.promConfig
  823. durStr := timeutil.DurationString(end.Sub(start))
  824. if durStr == "" {
  825. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  826. }
  827. queryGPUsUsageAvg := fmt.Sprintf(queryFmtGPUsUsageAvg, durStr, cfg.ClusterLabel)
  828. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryGPUsUsageAvg)
  829. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  830. return source.NewFuture(source.DecodeGPUsUsageAvgResult, ctx.QueryAtTime(queryGPUsUsageAvg, end))
  831. }
  832. func (pds *PrometheusMetricsQuerier) QueryGPUsUsageMax(start, end time.Time) *source.Future[source.GPUsUsageMaxResult] {
  833. const queryName = "QueryGPUsUsageMax"
  834. const queryFmtGPUsUsageMax = `max(max_over_time(DCGM_FI_PROF_GR_ENGINE_ACTIVE{container!=""}[%s])) by (container, pod, namespace, pod_uid, %s)`
  835. cfg := pds.promConfig
  836. durStr := timeutil.DurationString(end.Sub(start))
  837. if durStr == "" {
  838. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  839. }
  840. queryGPUsUsageMax := fmt.Sprintf(queryFmtGPUsUsageMax, durStr, cfg.ClusterLabel)
  841. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryGPUsUsageMax)
  842. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  843. return source.NewFuture(source.DecodeGPUsUsageMaxResult, ctx.QueryAtTime(queryGPUsUsageMax, end))
  844. }
  845. func (pds *PrometheusMetricsQuerier) QueryGPUsAllocated(start, end time.Time) *source.Future[source.GPUsAllocatedResult] {
  846. const queryName = "QueryGPUsAllocated"
  847. const queryFmtGPUsAllocated = `avg(avg_over_time(container_gpu_allocation{container!="", container!="POD", node!="", %s}[%s])) by (container, pod, namespace, node, uid, %s)`
  848. cfg := pds.promConfig
  849. durStr := timeutil.DurationString(end.Sub(start))
  850. if durStr == "" {
  851. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  852. }
  853. queryGPUsAllocated := fmt.Sprintf(queryFmtGPUsAllocated, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  854. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryGPUsAllocated)
  855. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  856. return source.NewFuture(source.DecodeGPUsAllocatedResult, ctx.QueryAtTime(queryGPUsAllocated, end))
  857. }
  858. func (pds *PrometheusMetricsQuerier) QueryIsGPUShared(start, end time.Time) *source.Future[source.IsGPUSharedResult] {
  859. const queryName = "QueryIsGPUShared"
  860. const queryFmtIsGPUShared = `avg(avg_over_time(kube_pod_container_resource_requests{container!="", node != "", pod != "", container!= "", unit = "integer", %s}[%s])) by (container, pod, namespace, node, resource, uid, %s)`
  861. cfg := pds.promConfig
  862. durStr := timeutil.DurationString(end.Sub(start))
  863. if durStr == "" {
  864. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  865. }
  866. queryIsGPUShared := fmt.Sprintf(queryFmtIsGPUShared, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  867. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryIsGPUShared)
  868. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  869. return source.NewFuture(source.DecodeIsGPUSharedResult, ctx.QueryAtTime(queryIsGPUShared, end))
  870. }
  871. func (pds *PrometheusMetricsQuerier) QueryDCGMDeviceInfo(start, end time.Time) *source.Future[source.DCGMDeviceInfoResult] {
  872. const queryName = "QueryDCGMDeviceInfo"
  873. const queryFmtDCGMDeviceInfo = `avg(avg_over_time(DCGM_FI_DEV_DEC_UTIL{%s}[%s])) by (UUID, device, modelName, Hostname, %s)`
  874. cfg := pds.promConfig
  875. durStr := timeutil.DurationString(end.Sub(start))
  876. if durStr == "" {
  877. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  878. }
  879. queryDCGMDeviceInfo := fmt.Sprintf(queryFmtDCGMDeviceInfo, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  880. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryDCGMDeviceInfo)
  881. ctx := pds.promContexts.NewNamedContext(ComputeCostDataContextName)
  882. return source.NewFuture(source.DecodeDCGMDeviceInfoResult, ctx.QueryAtTime(queryDCGMDeviceInfo, end))
  883. }
  884. func (pds *PrometheusMetricsQuerier) QueryDCGMDeviceUptime(start, end time.Time) *source.Future[source.DCGMDeviceUptimeResult] {
  885. const queryName = "QueryDCGMDeviceUptime"
  886. const queryFmtDCGMDeviceUptime = `avg(DCGM_FI_DEV_DEC_UTIL{%s}) by (UUID, %s)[%s:%dm]`
  887. cfg := pds.promConfig
  888. minsPerResolution := cfg.DataResolutionMinutes
  889. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  890. if durStr == "" {
  891. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  892. }
  893. queryDCGMDeviceUptime := fmt.Sprintf(queryFmtDCGMDeviceUptime, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  894. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryDCGMDeviceUptime)
  895. ctx := pds.promContexts.NewNamedContext(ComputeCostDataContextName)
  896. return source.NewFuture(source.DecodeDCGMDeviceUptimeResult, ctx.QueryAtTime(queryDCGMDeviceUptime, end))
  897. }
  898. func (pds *PrometheusMetricsQuerier) QueryDCGMContainerUsageAvg(start, end time.Time) *source.Future[source.DCGMDeviceContainerUsageResult] {
  899. const queryName = "QueryDCGMContainerUsageAvg"
  900. const queryFmtDCGMContainerUsageAvg = `avg(avg_over_time(DCGM_FI_PROF_GR_ENGINE_ACTIVE{container!="", %s}[%s])) by (UUID, pod_uid, container, %s)`
  901. cfg := pds.promConfig
  902. durStr := timeutil.DurationString(end.Sub(start))
  903. if durStr == "" {
  904. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  905. }
  906. queryDCGMContainerUsageAvg := fmt.Sprintf(queryFmtDCGMContainerUsageAvg, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  907. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryDCGMContainerUsageAvg)
  908. ctx := pds.promContexts.NewNamedContext(ComputeCostDataContextName)
  909. return source.NewFuture(source.DecodeDCGMDeviceContainerUsageResult, ctx.QueryAtTime(queryDCGMContainerUsageAvg, end))
  910. }
  911. func (pds *PrometheusMetricsQuerier) QueryDCGMContainerUsageMax(start, end time.Time) *source.Future[source.DCGMDeviceContainerUsageResult] {
  912. const queryName = "QueryDCGMContainerUsageMax"
  913. const queryFmtDCGMContainerUsageMax = `max(max_over_time(DCGM_FI_PROF_GR_ENGINE_ACTIVE{container!="", %s}[%s])) by (UUID, pod_uid, container, %s)`
  914. cfg := pds.promConfig
  915. durStr := timeutil.DurationString(end.Sub(start))
  916. if durStr == "" {
  917. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  918. }
  919. queryDCGMContainerUsageMax := fmt.Sprintf(queryFmtDCGMContainerUsageMax, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  920. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryDCGMContainerUsageMax)
  921. ctx := pds.promContexts.NewNamedContext(ComputeCostDataContextName)
  922. return source.NewFuture(source.DecodeDCGMDeviceContainerUsageResult, ctx.QueryAtTime(queryDCGMContainerUsageMax, end))
  923. }
  924. func (pds *PrometheusMetricsQuerier) QueryGPUInfo(start, end time.Time) *source.Future[source.GPUInfoResult] {
  925. const queryName = "QueryGPUInfo"
  926. const queryFmtGetGPUInfo = `avg(avg_over_time(DCGM_FI_DEV_DEC_UTIL{container!="",%s}[%s])) by (container, pod, namespace, device, modelName, UUID, pod_uid, %s)`
  927. cfg := pds.promConfig
  928. durStr := timeutil.DurationString(end.Sub(start))
  929. if durStr == "" {
  930. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  931. }
  932. queryGetGPUInfo := fmt.Sprintf(queryFmtGetGPUInfo, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  933. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryGetGPUInfo)
  934. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  935. return source.NewFuture(source.DecodeGPUInfoResult, ctx.QueryAtTime(queryGetGPUInfo, end))
  936. }
  937. func (pds *PrometheusMetricsQuerier) QueryNodeCPUPricePerHr(start, end time.Time) *source.Future[source.NodeCPUPricePerHrResult] {
  938. const queryName = "QueryNodeCPUPricePerHr"
  939. const queryFmtNodeCostPerCPUHr = `avg(avg_over_time(node_cpu_hourly_cost{%s}[%s])) by (node, uid, %s, instance_type, provider_id)`
  940. cfg := pds.promConfig
  941. durStr := timeutil.DurationString(end.Sub(start))
  942. if durStr == "" {
  943. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  944. }
  945. queryNodeCostPerCPUHr := fmt.Sprintf(queryFmtNodeCostPerCPUHr, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  946. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNodeCostPerCPUHr)
  947. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  948. return source.NewFuture(source.DecodeNodeCPUPricePerHrResult, ctx.QueryAtTime(queryNodeCostPerCPUHr, end))
  949. }
  950. func (pds *PrometheusMetricsQuerier) QueryNodeRAMPricePerGiBHr(start, end time.Time) *source.Future[source.NodeRAMPricePerGiBHrResult] {
  951. const queryName = "QueryNodeRAMPricePerGiBHr"
  952. const queryFmtNodeCostPerRAMGiBHr = `avg(avg_over_time(node_ram_hourly_cost{%s}[%s])) by (node, uid, %s, instance_type, provider_id)`
  953. cfg := pds.promConfig
  954. durStr := timeutil.DurationString(end.Sub(start))
  955. if durStr == "" {
  956. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  957. }
  958. queryNodeCostPerRAMGiBHr := fmt.Sprintf(queryFmtNodeCostPerRAMGiBHr, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  959. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNodeCostPerRAMGiBHr)
  960. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  961. return source.NewFuture(source.DecodeNodeRAMPricePerGiBHrResult, ctx.QueryAtTime(queryNodeCostPerRAMGiBHr, end))
  962. }
  963. func (pds *PrometheusMetricsQuerier) QueryNodeGPUPricePerHr(start, end time.Time) *source.Future[source.NodeGPUPricePerHrResult] {
  964. const queryName = "QueryNodeGPUPricePerHr"
  965. const queryFmtNodeCostPerGPUHr = `avg(avg_over_time(node_gpu_hourly_cost{%s}[%s])) by (node, uid, %s, instance_type, provider_id)`
  966. cfg := pds.promConfig
  967. durStr := timeutil.DurationString(end.Sub(start))
  968. if durStr == "" {
  969. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  970. }
  971. queryNodeCostPerGPUHr := fmt.Sprintf(queryFmtNodeCostPerGPUHr, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  972. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNodeCostPerGPUHr)
  973. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  974. return source.NewFuture(source.DecodeNodeGPUPricePerHrResult, ctx.QueryAtTime(queryNodeCostPerGPUHr, end))
  975. }
  976. func (pds *PrometheusMetricsQuerier) QueryNodeIsSpot(start, end time.Time) *source.Future[source.NodeIsSpotResult] {
  977. const queryName = "QueryNodeIsSpot"
  978. const queryFmtNodeIsSpot = `avg_over_time(kubecost_node_is_spot{%s}[%s])`
  979. cfg := pds.promConfig
  980. durStr := timeutil.DurationString(end.Sub(start))
  981. if durStr == "" {
  982. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  983. }
  984. queryNodeIsSpot := fmt.Sprintf(queryFmtNodeIsSpot, cfg.ClusterFilter, durStr)
  985. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNodeIsSpot)
  986. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  987. return source.NewFuture(source.DecodeNodeIsSpotResult, ctx.QueryAtTime(queryNodeIsSpot, end))
  988. }
  989. func (pds *PrometheusMetricsQuerier) QueryPodPVCAllocation(start, end time.Time) *source.Future[source.PodPVCAllocationResult] {
  990. const queryName = "QueryPodPVCAllocation"
  991. const queryFmtPodPVCAllocation = `avg(avg_over_time(pod_pvc_allocation{%s}[%s])) by (persistentvolume, persistentvolumeclaim, pod, namespace, uid, %s)`
  992. cfg := pds.promConfig
  993. durStr := timeutil.DurationString(end.Sub(start))
  994. if durStr == "" {
  995. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  996. }
  997. queryPodPVCAllocation := fmt.Sprintf(queryFmtPodPVCAllocation, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  998. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPodPVCAllocation)
  999. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1000. return source.NewFuture(source.DecodePodPVCAllocationResult, ctx.QueryAtTime(queryPodPVCAllocation, end))
  1001. }
  1002. func (pds *PrometheusMetricsQuerier) QueryPVCBytesRequested(start, end time.Time) *source.Future[source.PVCBytesRequestedResult] {
  1003. const queryName = "QueryPVCBytesRequested"
  1004. const queryFmtPVCBytesRequested = `avg(avg_over_time(kube_persistentvolumeclaim_resource_requests_storage_bytes{%s}[%s])) by (persistentvolumeclaim, namespace, uid, %s)`
  1005. cfg := pds.promConfig
  1006. durStr := timeutil.DurationString(end.Sub(start))
  1007. if durStr == "" {
  1008. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1009. }
  1010. queryPVCBytesRequested := fmt.Sprintf(queryFmtPVCBytesRequested, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1011. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPVCBytesRequested)
  1012. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1013. return source.NewFuture(source.DecodePVCBytesRequestedResult, ctx.QueryAtTime(queryPVCBytesRequested, end))
  1014. }
  1015. func (pds *PrometheusMetricsQuerier) QueryPVBytes(start, end time.Time) *source.Future[source.PVBytesResult] {
  1016. const queryName = "QueryPVBytes"
  1017. const queryFmtPVBytes = `avg(avg_over_time(kube_persistentvolume_capacity_bytes{%s}[%s])) by (persistentvolume, uid, %s)`
  1018. cfg := pds.promConfig
  1019. durStr := timeutil.DurationString(end.Sub(start))
  1020. if durStr == "" {
  1021. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1022. }
  1023. queryPVBytes := fmt.Sprintf(queryFmtPVBytes, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1024. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPVBytes)
  1025. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1026. return source.NewFuture(source.DecodePVBytesResult, ctx.QueryAtTime(queryPVBytes, end))
  1027. }
  1028. func (pds *PrometheusMetricsQuerier) QueryPVInfo(start, end time.Time) *source.Future[source.PVInfoResult] {
  1029. const queryName = "QueryPVInfo"
  1030. const queryFmtPVMeta = `avg(avg_over_time(kubecost_pv_info{%s}[%s])) by (%s, storageclass, persistentvolume, uid, provider_id)`
  1031. cfg := pds.promConfig
  1032. durStr := timeutil.DurationString(end.Sub(start))
  1033. if durStr == "" {
  1034. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1035. }
  1036. queryPVMeta := fmt.Sprintf(queryFmtPVMeta, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1037. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPVMeta)
  1038. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1039. return source.NewFuture(source.DecodePVInfoResult, ctx.QueryAtTime(queryPVMeta, end))
  1040. }
  1041. func (pds *PrometheusMetricsQuerier) QueryPVUptime(start, end time.Time) *source.Future[source.UptimeResult] {
  1042. const queryName = "QueryPVUptime"
  1043. const queryFmtPVUptime = `avg(kubecost_pv_info{%s}) by (%s, uid)[%s:%dm]`
  1044. cfg := pds.promConfig
  1045. minsPerResolution := cfg.DataResolutionMinutes
  1046. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  1047. if durStr == "" {
  1048. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1049. }
  1050. queryPVUptime := fmt.Sprintf(queryFmtPVUptime, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  1051. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPVUptime)
  1052. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1053. return source.NewFuture(source.DecodeUptimeResult, ctx.QueryAtTime(queryPVUptime, end))
  1054. }
  1055. func (pds *PrometheusMetricsQuerier) QueryNetZoneGiB(start, end time.Time) *source.Future[source.NetZoneGiBResult] {
  1056. const queryName = "QueryNetZoneGiB"
  1057. const queryFmtNetZoneGiB = `sum(increase(kubecost_pod_network_egress_bytes_total{internet="false", same_zone="false", same_region="true", %s}[%s:%dm])) by (pod_name, namespace, uid, %s) / 1024 / 1024 / 1024`
  1058. cfg := pds.promConfig
  1059. minsPerResolution := cfg.DataResolutionMinutes
  1060. durStr := pds.durationStringFor(start, end, minsPerResolution, true)
  1061. if durStr == "" {
  1062. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1063. }
  1064. queryNetZoneGiB := fmt.Sprintf(queryFmtNetZoneGiB, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel)
  1065. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetZoneGiB)
  1066. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1067. return source.NewFuture(source.DecodeNetZoneGiBResult, ctx.QueryAtTime(queryNetZoneGiB, end))
  1068. }
  1069. func (pds *PrometheusMetricsQuerier) QueryNetZonePricePerGiB(start, end time.Time) *source.Future[source.NetZonePricePerGiBResult] {
  1070. const queryName = "QueryNetZonePricePerGiB"
  1071. const queryFmtNetZoneCostPerGiB = `avg(avg_over_time(kubecost_network_zone_egress_cost{%s}[%s])) by (%s)`
  1072. cfg := pds.promConfig
  1073. durStr := timeutil.DurationString(end.Sub(start))
  1074. if durStr == "" {
  1075. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1076. }
  1077. queryNetZoneCostPerGiB := fmt.Sprintf(queryFmtNetZoneCostPerGiB, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1078. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetZoneCostPerGiB)
  1079. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1080. return source.NewFuture(source.DecodeNetZonePricePerGiBResult, ctx.QueryAtTime(queryNetZoneCostPerGiB, end))
  1081. }
  1082. func (pds *PrometheusMetricsQuerier) QueryNetRegionGiB(start, end time.Time) *source.Future[source.NetRegionGiBResult] {
  1083. const queryName = "QueryNetRegionGiB"
  1084. const queryFmtNetRegionGiB = `sum(increase(kubecost_pod_network_egress_bytes_total{internet="false", same_zone="false", same_region="false", %s}[%s:%dm])) by (pod_name, namespace, uid, %s) / 1024 / 1024 / 1024`
  1085. cfg := pds.promConfig
  1086. minsPerResolution := cfg.DataResolutionMinutes
  1087. durStr := pds.durationStringFor(start, end, minsPerResolution, true)
  1088. if durStr == "" {
  1089. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1090. }
  1091. queryNetRegionGiB := fmt.Sprintf(queryFmtNetRegionGiB, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel)
  1092. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetRegionGiB)
  1093. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1094. return source.NewFuture(source.DecodeNetRegionGiBResult, ctx.QueryAtTime(queryNetRegionGiB, end))
  1095. }
  1096. func (pds *PrometheusMetricsQuerier) QueryNetRegionPricePerGiB(start, end time.Time) *source.Future[source.NetRegionPricePerGiBResult] {
  1097. const queryName = "QueryNetRegionPricePerGiB"
  1098. const queryFmtNetRegionCostPerGiB = `avg(avg_over_time(kubecost_network_region_egress_cost{%s}[%s])) by (%s)`
  1099. cfg := pds.promConfig
  1100. durStr := timeutil.DurationString(end.Sub(start))
  1101. if durStr == "" {
  1102. panic("failed to parse duration string passed to QueryNetRegionPricePerGiB")
  1103. }
  1104. queryNetRegionCostPerGiB := fmt.Sprintf(queryFmtNetRegionCostPerGiB, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1105. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetRegionCostPerGiB)
  1106. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1107. return source.NewFuture(source.DecodeNetRegionPricePerGiBResult, ctx.QueryAtTime(queryNetRegionCostPerGiB, end))
  1108. }
  1109. func (pds *PrometheusMetricsQuerier) QueryNetInternetGiB(start, end time.Time) *source.Future[source.NetInternetGiBResult] {
  1110. const queryName = "QueryNetInternetGiB"
  1111. const queryFmtNetInternetGiB = `sum(increase(kubecost_pod_network_egress_bytes_total{internet="true", %s}[%s:%dm])) by (pod_name, namespace, uid, %s) / 1024 / 1024 / 1024`
  1112. cfg := pds.promConfig
  1113. minsPerResolution := cfg.DataResolutionMinutes
  1114. durStr := pds.durationStringFor(start, end, minsPerResolution, true)
  1115. if durStr == "" {
  1116. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1117. }
  1118. queryNetInternetGiB := fmt.Sprintf(queryFmtNetInternetGiB, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel)
  1119. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetInternetGiB)
  1120. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1121. return source.NewFuture(source.DecodeNetInternetGiBResult, ctx.QueryAtTime(queryNetInternetGiB, end))
  1122. }
  1123. func (pds *PrometheusMetricsQuerier) QueryNetInternetPricePerGiB(start, end time.Time) *source.Future[source.NetInternetPricePerGiBResult] {
  1124. const queryName = "QueryNetInternetPricePerGiB"
  1125. const queryFmtNetInternetCostPerGiB = `avg(avg_over_time(kubecost_network_internet_egress_cost{%s}[%s])) by (%s)`
  1126. cfg := pds.promConfig
  1127. durStr := timeutil.DurationString(end.Sub(start))
  1128. if durStr == "" {
  1129. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1130. }
  1131. queryNetInternetCostPerGiB := fmt.Sprintf(queryFmtNetInternetCostPerGiB, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1132. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetInternetCostPerGiB)
  1133. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1134. return source.NewFuture(source.DecodeNetInternetPricePerGiBResult, ctx.QueryAtTime(queryNetInternetCostPerGiB, end))
  1135. }
  1136. func (pds *PrometheusMetricsQuerier) QueryNetInternetServiceGiB(start, end time.Time) *source.Future[source.NetInternetServiceGiBResult] {
  1137. const queryName = "QueryNetInternetServiceGiB"
  1138. const queryFmtNetInternetGiB = `sum(increase(kubecost_pod_network_egress_bytes_total{internet="true", %s}[%s:%dm])) by (pod_name, namespace, service, uid, %s) / 1024 / 1024 / 1024`
  1139. cfg := pds.promConfig
  1140. minsPerResolution := cfg.DataResolutionMinutes
  1141. durStr := pds.durationStringFor(start, end, minsPerResolution, true)
  1142. if durStr == "" {
  1143. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1144. }
  1145. queryNetInternetGiB := fmt.Sprintf(queryFmtNetInternetGiB, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel)
  1146. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetInternetGiB)
  1147. ctx := pds.promContexts.NewNamedContext(NetworkInsightsContextName)
  1148. return source.NewFuture(source.DecodeNetInternetServiceGiBResult, ctx.QueryAtTime(queryNetInternetGiB, end))
  1149. }
  1150. func (pds *PrometheusMetricsQuerier) QueryNetNatGatewayPricePerGiB(start, end time.Time) *source.Future[source.NetNatGatewayPricePerGiBResult] {
  1151. const queryName = "QueryNetNatGatewayPricePerGiB"
  1152. const queryFmtNetNatGatewayPricePerGiB = `avg(avg_over_time(kubecost_network_nat_gateway_egress_cost{%s}[%s])) by (%s)`
  1153. cfg := pds.promConfig
  1154. durStr := timeutil.DurationString(end.Sub(start))
  1155. if durStr == "" {
  1156. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1157. }
  1158. queryNetNatGatewayPricePerGiB := fmt.Sprintf(queryFmtNetNatGatewayPricePerGiB, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1159. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetNatGatewayPricePerGiB)
  1160. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1161. return source.NewFuture(source.DecodeNetNatGatewayPricePerGiBResult, ctx.QueryAtTime(queryNetNatGatewayPricePerGiB, end))
  1162. }
  1163. func (pds *PrometheusMetricsQuerier) QueryNetNatGatewayGiB(start, end time.Time) *source.Future[source.NetNatGatewayGiBResult] {
  1164. const queryName = "QueryNetNatGatewayGiB"
  1165. const queryFmtNetNatGatewayGiB = `sum(increase(kubecost_pod_network_egress_bytes_total{nat_gateway="true", %s}[%s:%dm])) by (pod_name, namespace, service, uid, %s) / 1024 / 1024 / 1024`
  1166. cfg := pds.promConfig
  1167. minsPerResolution := cfg.DataResolutionMinutes
  1168. durStr := pds.durationStringFor(start, end, minsPerResolution, true)
  1169. if durStr == "" {
  1170. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1171. }
  1172. queryNetNatGatewayGiB := fmt.Sprintf(queryFmtNetNatGatewayGiB, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel)
  1173. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetNatGatewayGiB)
  1174. ctx := pds.promContexts.NewNamedContext(NetworkInsightsContextName)
  1175. return source.NewFuture(source.DecodeNetNatGatewayGiBResult, ctx.QueryAtTime(queryNetNatGatewayGiB, end))
  1176. }
  1177. func (pds *PrometheusMetricsQuerier) QueryNetTransferBytes(start, end time.Time) *source.Future[source.NetTransferBytesResult] {
  1178. const queryName = "QueryNetTransferBytes"
  1179. const queryFmtNetTransferBytes = `sum(increase(container_network_transmit_bytes_total{pod!="", %s}[%s:%dm])) by (pod_name, pod, namespace, uid, %s)`
  1180. cfg := pds.promConfig
  1181. minsPerResolution := cfg.DataResolutionMinutes
  1182. durStr := pds.durationStringFor(start, end, minsPerResolution, true)
  1183. if durStr == "" {
  1184. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1185. }
  1186. queryNetTransferBytes := fmt.Sprintf(queryFmtNetTransferBytes, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel)
  1187. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetTransferBytes)
  1188. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1189. return source.NewFuture(source.DecodeNetTransferBytesResult, ctx.QueryAtTime(queryNetTransferBytes, end))
  1190. }
  1191. func (pds *PrometheusMetricsQuerier) QueryNetZoneIngressGiB(start, end time.Time) *source.Future[source.NetZoneIngressGiBResult] {
  1192. const queryName = "QueryNetZoneIngressGiB"
  1193. const queryFmtIngNetZoneGiB = `sum(increase(kubecost_pod_network_ingress_bytes_total{internet="false", same_zone="false", same_region="true", %s}[%s:%dm])) by (pod_name, namespace, uid, %s) / 1024 / 1024 / 1024`
  1194. cfg := pds.promConfig
  1195. minsPerResolution := cfg.DataResolutionMinutes
  1196. durStr := pds.durationStringFor(start, end, minsPerResolution, true)
  1197. if durStr == "" {
  1198. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1199. }
  1200. queryNetZoneCostPerGiB := fmt.Sprintf(queryFmtIngNetZoneGiB, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel)
  1201. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetZoneCostPerGiB)
  1202. ctx := pds.promContexts.NewNamedContext(NetworkInsightsContextName)
  1203. return source.NewFuture(source.DecodeNetZoneIngressGiBResult, ctx.QueryAtTime(queryNetZoneCostPerGiB, end))
  1204. }
  1205. func (pds *PrometheusMetricsQuerier) QueryNetRegionIngressGiB(start, end time.Time) *source.Future[source.NetRegionIngressGiBResult] {
  1206. const queryName = "QueryNetRegionIngressGiB"
  1207. const queryFmtIngNetRegionGiB = `sum(increase(kubecost_pod_network_ingress_bytes_total{internet="false", same_zone="false", same_region="false", %s}[%s:%dm])) by (pod_name, namespace, uid, %s) / 1024 / 1024 / 1024`
  1208. cfg := pds.promConfig
  1209. minsPerResolution := cfg.DataResolutionMinutes
  1210. durStr := pds.durationStringFor(start, end, minsPerResolution, true)
  1211. if durStr == "" {
  1212. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1213. }
  1214. queryNetRegionIngGiB := fmt.Sprintf(queryFmtIngNetRegionGiB, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel)
  1215. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetRegionIngGiB)
  1216. ctx := pds.promContexts.NewNamedContext(NetworkInsightsContextName)
  1217. return source.NewFuture(source.DecodeNetRegionIngressGiBResult, ctx.QueryAtTime(queryNetRegionIngGiB, end))
  1218. }
  1219. func (pds *PrometheusMetricsQuerier) QueryNetInternetIngressGiB(start, end time.Time) *source.Future[source.NetInternetIngressGiBResult] {
  1220. const queryName = "QueryNetInternetIngressGiB"
  1221. const queryFmtNetIngInternetGiB = `sum(increase(kubecost_pod_network_ingress_bytes_total{internet="true", %s}[%s:%dm])) by (pod_name, namespace, uid, %s) / 1024 / 1024 / 1024`
  1222. cfg := pds.promConfig
  1223. minsPerResolution := cfg.DataResolutionMinutes
  1224. durStr := pds.durationStringFor(start, end, minsPerResolution, true)
  1225. if durStr == "" {
  1226. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1227. }
  1228. queryNetIngInternetGiB := fmt.Sprintf(queryFmtNetIngInternetGiB, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel)
  1229. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetIngInternetGiB)
  1230. ctx := pds.promContexts.NewNamedContext(NetworkInsightsContextName)
  1231. return source.NewFuture(source.DecodeNetInternetIngressGiBResult, ctx.QueryAtTime(queryNetIngInternetGiB, end))
  1232. }
  1233. func (pds *PrometheusMetricsQuerier) QueryNetInternetServiceIngressGiB(start, end time.Time) *source.Future[source.NetInternetServiceIngressGiBResult] {
  1234. const queryName = "QueryNetInternetServiceIngressGiB"
  1235. const queryFmtIngNetInternetGiB = `sum(increase(kubecost_pod_network_ingress_bytes_total{internet="true", %s}[%s:%dm])) by (pod_name, namespace, service, uid, %s) / 1024 / 1024 / 1024`
  1236. cfg := pds.promConfig
  1237. minsPerResolution := cfg.DataResolutionMinutes
  1238. durStr := pds.durationStringFor(start, end, minsPerResolution, true)
  1239. if durStr == "" {
  1240. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1241. }
  1242. queryNetIngInternetGiB := fmt.Sprintf(queryFmtIngNetInternetGiB, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel)
  1243. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetIngInternetGiB)
  1244. ctx := pds.promContexts.NewNamedContext(NetworkInsightsContextName)
  1245. return source.NewFuture(source.DecodeNetInternetServiceIngressGiBResult, ctx.QueryAtTime(queryNetIngInternetGiB, end))
  1246. }
  1247. func (pds *PrometheusMetricsQuerier) QueryNetNatGatewayIngressPricePerGiB(start, end time.Time) *source.Future[source.NetNatGatewayPricePerGiBResult] {
  1248. const queryName = "QueryNetNatGatewayIngressPricePerGiB"
  1249. const queryFmtNetNatGatewayIngressPricePerGiB = `avg(avg_over_time(kubecost_network_nat_gateway_ingress_cost{%s}[%s])) by (%s)`
  1250. cfg := pds.promConfig
  1251. durStr := timeutil.DurationString(end.Sub(start))
  1252. if durStr == "" {
  1253. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1254. }
  1255. queryNetNatGatewayIngressPricePerGiB := fmt.Sprintf(queryFmtNetNatGatewayIngressPricePerGiB, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1256. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetNatGatewayIngressPricePerGiB)
  1257. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1258. return source.NewFuture(source.DecodeNetNatGatewayPricePerGiBResult, ctx.QueryAtTime(queryNetNatGatewayIngressPricePerGiB, end))
  1259. }
  1260. func (pds *PrometheusMetricsQuerier) QueryNetNatGatewayIngressGiB(start, end time.Time) *source.Future[source.NetNatGatewayIngressGiBResult] {
  1261. const queryName = "QueryNetNatGatewayIngressGiB"
  1262. const queryFmtNetNatGatewayIngressGiB = `sum(increase(kubecost_pod_network_ingress_bytes_total{nat_gateway="true", %s}[%s:%dm])) by (pod_name, namespace, service, uid, %s) / 1024 / 1024 / 1024`
  1263. cfg := pds.promConfig
  1264. minsPerResolution := cfg.DataResolutionMinutes
  1265. durStr := pds.durationStringFor(start, end, minsPerResolution, true)
  1266. if durStr == "" {
  1267. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1268. }
  1269. queryNetNatGatewayIngressGiB := fmt.Sprintf(queryFmtNetNatGatewayIngressGiB, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel)
  1270. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetNatGatewayIngressGiB)
  1271. ctx := pds.promContexts.NewNamedContext(NetworkInsightsContextName)
  1272. return source.NewFuture(source.DecodeNetNatGatewayIngressGiBResult, ctx.QueryAtTime(queryNetNatGatewayIngressGiB, end))
  1273. }
  1274. func (pds *PrometheusMetricsQuerier) QueryNetReceiveBytes(start, end time.Time) *source.Future[source.NetReceiveBytesResult] {
  1275. const queryName = "QueryNetReceiveBytes"
  1276. const queryFmtNetReceiveBytes = `sum(increase(container_network_receive_bytes_total{pod!="", %s}[%s:%dm])) by (pod_name, pod, namespace, uid, %s)`
  1277. cfg := pds.promConfig
  1278. minsPerResolution := cfg.DataResolutionMinutes
  1279. durStr := pds.durationStringFor(start, end, minsPerResolution, true)
  1280. if durStr == "" {
  1281. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1282. }
  1283. queryNetReceiveBytes := fmt.Sprintf(queryFmtNetReceiveBytes, cfg.ClusterFilter, durStr, minsPerResolution, cfg.ClusterLabel)
  1284. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNetReceiveBytes)
  1285. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1286. return source.NewFuture(source.DecodeNetReceiveBytesResult, ctx.QueryAtTime(queryNetReceiveBytes, end))
  1287. }
  1288. func (pds *PrometheusMetricsQuerier) QueryNamespaceInfo(start, end time.Time) *source.Future[source.NamespaceInfoResult] {
  1289. const queryName = "QueryNamespaceInfo"
  1290. const queryFmtNamespaceInfo = `avg(avg_over_time(namespace_info{%s}[%s])) by (%s, uid, namespace)`
  1291. cfg := pds.promConfig
  1292. durStr := timeutil.DurationString(end.Sub(start))
  1293. if durStr == "" {
  1294. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1295. }
  1296. queryNamespaceInfo := fmt.Sprintf(queryFmtNamespaceInfo, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1297. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNamespaceInfo)
  1298. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1299. return source.NewFuture(source.DecodeNamespaceInfoResult, ctx.QueryAtTime(queryNamespaceInfo, end))
  1300. }
  1301. // Note: namespace_info is not currently emitted
  1302. func (pds *PrometheusMetricsQuerier) QueryNamespaceUptime(start, end time.Time) *source.Future[source.UptimeResult] {
  1303. const queryName = "QueryNamespaceUptime"
  1304. const queryFmtNamespaceUptime = `avg(namespace_info{%s}) by (%s, uid)[%s:%dm]`
  1305. cfg := pds.promConfig
  1306. minsPerResolution := cfg.DataResolutionMinutes
  1307. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  1308. if durStr == "" {
  1309. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1310. }
  1311. queryNamespaceUptime := fmt.Sprintf(queryFmtNamespaceUptime, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  1312. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryFmtNamespaceUptime)
  1313. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1314. return source.NewFuture(source.DecodeUptimeResult, ctx.QueryAtTime(queryNamespaceUptime, end))
  1315. }
  1316. func (pds *PrometheusMetricsQuerier) QueryNamespaceLabels(start, end time.Time) *source.Future[source.NamespaceLabelsResult] {
  1317. const queryName = "QueryNamespaceLabels"
  1318. const queryFmtNamespaceLabels = `avg_over_time(kube_namespace_labels{%s}[%s])`
  1319. cfg := pds.promConfig
  1320. durStr := timeutil.DurationString(end.Sub(start))
  1321. if durStr == "" {
  1322. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1323. }
  1324. queryNamespaceLabels := fmt.Sprintf(queryFmtNamespaceLabels, cfg.ClusterFilter, durStr)
  1325. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNamespaceLabels)
  1326. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1327. return source.NewFuture(source.DecodeNamespaceLabelsResult, ctx.QueryAtTime(queryNamespaceLabels, end))
  1328. }
  1329. func (pds *PrometheusMetricsQuerier) QueryNamespaceAnnotations(start, end time.Time) *source.Future[source.NamespaceAnnotationsResult] {
  1330. const queryName = "QueryNamespaceAnnotations"
  1331. const queryFmtNamespaceAnnotations = `avg_over_time(kube_namespace_annotations{%s}[%s])`
  1332. cfg := pds.promConfig
  1333. durStr := timeutil.DurationString(end.Sub(start))
  1334. if durStr == "" {
  1335. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1336. }
  1337. queryNamespaceAnnotations := fmt.Sprintf(queryFmtNamespaceAnnotations, cfg.ClusterFilter, durStr)
  1338. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryNamespaceAnnotations)
  1339. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1340. return source.NewFuture(source.DecodeNamespaceAnnotationsResult, ctx.QueryAtTime(queryNamespaceAnnotations, end))
  1341. }
  1342. func (pds *PrometheusMetricsQuerier) QueryPodLabels(start, end time.Time) *source.Future[source.PodLabelsResult] {
  1343. const queryName = "QueryPodLabels"
  1344. const queryFmtPodLabels = `avg_over_time(kube_pod_labels{%s}[%s])`
  1345. cfg := pds.promConfig
  1346. durStr := timeutil.DurationString(end.Sub(start))
  1347. if durStr == "" {
  1348. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1349. }
  1350. queryPodLabels := fmt.Sprintf(queryFmtPodLabels, cfg.ClusterFilter, durStr)
  1351. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPodLabels)
  1352. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1353. return source.NewFuture(source.DecodePodLabelsResult, ctx.QueryAtTime(queryPodLabels, end))
  1354. }
  1355. func (pds *PrometheusMetricsQuerier) QueryPodAnnotations(start, end time.Time) *source.Future[source.PodAnnotationsResult] {
  1356. const queryName = "QueryPodAnnotations"
  1357. const queryFmtPodAnnotations = `avg_over_time(kube_pod_annotations{%s}[%s])`
  1358. cfg := pds.promConfig
  1359. durStr := timeutil.DurationString(end.Sub(start))
  1360. if durStr == "" {
  1361. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1362. }
  1363. queryPodAnnotations := fmt.Sprintf(queryFmtPodAnnotations, cfg.ClusterFilter, durStr)
  1364. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPodAnnotations)
  1365. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1366. return source.NewFuture(source.DecodePodAnnotationsResult, ctx.QueryAtTime(queryPodAnnotations, end))
  1367. }
  1368. func (pds *PrometheusMetricsQuerier) QueryServiceInfo(start, end time.Time) *source.Future[source.ServiceInfoResult] {
  1369. const queryName = "QueryServiceInfo"
  1370. const queryFmtServiceInfo = `avg(avg_over_time(service_selector_labels{%s}[%s])) by (%s, uid, namespace_uid, service, service_type)`
  1371. cfg := pds.promConfig
  1372. durStr := timeutil.DurationString(end.Sub(start))
  1373. if durStr == "" {
  1374. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1375. }
  1376. queryServiceInfo := fmt.Sprintf(queryFmtServiceInfo, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1377. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryServiceInfo)
  1378. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1379. return source.NewFuture(source.DecodeServiceInfoResult, ctx.QueryAtTime(queryServiceInfo, end))
  1380. }
  1381. func (pds *PrometheusMetricsQuerier) QueryServiceUptime(start, end time.Time) *source.Future[source.UptimeResult] {
  1382. const queryName = "QueryServiceUptime"
  1383. const queryFmtServiceUptime = `avg(service_selector_labels{%s}) by (%s, uid)[%s:%dm]`
  1384. cfg := pds.promConfig
  1385. minsPerResolution := cfg.DataResolutionMinutes
  1386. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  1387. if durStr == "" {
  1388. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1389. }
  1390. queryServiceUptime := fmt.Sprintf(queryFmtServiceUptime, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  1391. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryServiceUptime)
  1392. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1393. return source.NewFuture(source.DecodeUptimeResult, ctx.QueryAtTime(queryServiceUptime, end))
  1394. }
  1395. func (pds *PrometheusMetricsQuerier) QueryServiceSelectorLabels(start, end time.Time) *source.Future[source.ServiceLabelsResult] {
  1396. const queryName = "QueryServiceSelectorLabels"
  1397. const queryFmtServiceSelectorLabels = `avg_over_time(service_selector_labels{%s}[%s])`
  1398. cfg := pds.promConfig
  1399. durStr := timeutil.DurationString(end.Sub(start))
  1400. if durStr == "" {
  1401. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1402. }
  1403. queryServiceSelectorLabels := fmt.Sprintf(queryFmtServiceSelectorLabels, cfg.ClusterFilter, durStr)
  1404. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryServiceSelectorLabels)
  1405. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1406. return source.NewFuture(source.DecodeServiceLabelsResult, ctx.QueryAtTime(queryServiceSelectorLabels, end))
  1407. }
  1408. func (pds *PrometheusMetricsQuerier) QueryDeploymentInfo(start, end time.Time) *source.Future[source.DeploymentInfoResult] {
  1409. const queryName = "QueryDeploymentInfo"
  1410. const queryFmtDeploymentInfo = `avg(avg_over_time(deployment_info{%s}[%s])) by (%s, uid, namespace_uid, deployment)`
  1411. cfg := pds.promConfig
  1412. durStr := timeutil.DurationString(end.Sub(start))
  1413. if durStr == "" {
  1414. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1415. }
  1416. queryDeploymentInfo := fmt.Sprintf(queryFmtDeploymentInfo, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1417. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryDeploymentInfo)
  1418. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1419. return source.NewFuture(source.DecodeDeploymentInfoResult, ctx.QueryAtTime(queryDeploymentInfo, end))
  1420. }
  1421. func (pds *PrometheusMetricsQuerier) QueryDeploymentUptime(start, end time.Time) *source.Future[source.UptimeResult] {
  1422. const queryName = "QueryDeploymentUptime"
  1423. const queryFmtDeploymentUptime = `avg(deployment_info{%s}) by (%s, uid)[%s:%dm]`
  1424. cfg := pds.promConfig
  1425. minsPerResolution := cfg.DataResolutionMinutes
  1426. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  1427. if durStr == "" {
  1428. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1429. }
  1430. queryDeploymentUptime := fmt.Sprintf(queryFmtDeploymentUptime, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  1431. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryDeploymentUptime)
  1432. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1433. return source.NewFuture(source.DecodeUptimeResult, ctx.QueryAtTime(queryDeploymentUptime, end))
  1434. }
  1435. func (pds *PrometheusMetricsQuerier) QueryDeploymentLabels(start, end time.Time) *source.Future[source.LabelsResult] {
  1436. const queryName = "QueryDeploymentLabels"
  1437. const queryFmtDeploymentLabels = `avg_over_time(deployment_labels{%s}[%s])`
  1438. cfg := pds.promConfig
  1439. durStr := timeutil.DurationString(end.Sub(start))
  1440. if durStr == "" {
  1441. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1442. }
  1443. queryDeploymentLabels := fmt.Sprintf(queryFmtDeploymentLabels, cfg.ClusterFilter, durStr)
  1444. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryDeploymentLabels)
  1445. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1446. return source.NewFuture(source.DecodeLabelsResult, ctx.QueryAtTime(queryDeploymentLabels, end))
  1447. }
  1448. func (pds *PrometheusMetricsQuerier) QueryDeploymentAnnotations(start, end time.Time) *source.Future[source.AnnotationsResult] {
  1449. const queryName = "QueryDeploymentAnnotations"
  1450. const queryFmtDeploymentAnnotations = `avg_over_time(deployment_annotations{%s}[%s])`
  1451. cfg := pds.promConfig
  1452. durStr := timeutil.DurationString(end.Sub(start))
  1453. if durStr == "" {
  1454. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1455. }
  1456. queryDeploymentAnnotations := fmt.Sprintf(queryFmtDeploymentAnnotations, cfg.ClusterFilter, durStr)
  1457. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryDeploymentAnnotations)
  1458. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1459. return source.NewFuture(source.DecodeAnnotationsResult, ctx.QueryAtTime(queryDeploymentAnnotations, end))
  1460. }
  1461. func (pds *PrometheusMetricsQuerier) QueryDeploymentMatchLabels(start, end time.Time) *source.Future[source.DeploymentLabelsResult] {
  1462. const queryName = "QueryDeploymentMatchLabels"
  1463. const queryFmtDeploymentLabels = `avg_over_time(deployment_match_labels{%s}[%s])`
  1464. cfg := pds.promConfig
  1465. durStr := timeutil.DurationString(end.Sub(start))
  1466. if durStr == "" {
  1467. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1468. }
  1469. queryDeploymentMatchLabels := fmt.Sprintf(queryFmtDeploymentLabels, cfg.ClusterFilter, durStr)
  1470. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryDeploymentMatchLabels)
  1471. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1472. return source.NewFuture(source.DecodeDeploymentLabelsResult, ctx.QueryAtTime(queryDeploymentMatchLabels, end))
  1473. }
  1474. func (pds *PrometheusMetricsQuerier) QueryStatefulSetInfo(start, end time.Time) *source.Future[source.StatefulSetInfoResult] {
  1475. const queryName = "QueryStatefulSetInfo"
  1476. const queryFmtStatefulSetInfo = `avg(avg_over_time(statefulset_info{%s}[%s])) by (%s, uid, namespace_uid, statefulSet)`
  1477. cfg := pds.promConfig
  1478. durStr := timeutil.DurationString(end.Sub(start))
  1479. if durStr == "" {
  1480. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1481. }
  1482. queryStatefulSetInfo := fmt.Sprintf(queryFmtStatefulSetInfo, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1483. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryStatefulSetInfo)
  1484. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1485. return source.NewFuture(source.DecodeStatefulSetInfoResult, ctx.QueryAtTime(queryStatefulSetInfo, end))
  1486. }
  1487. func (pds *PrometheusMetricsQuerier) QueryStatefulSetUptime(start, end time.Time) *source.Future[source.UptimeResult] {
  1488. const queryName = "QueryStatefulSetUptime"
  1489. const queryFmtStatefulSetUptime = `avg(statefulset_info{%s}) by (%s, uid)[%s:%dm]`
  1490. cfg := pds.promConfig
  1491. minsPerResolution := cfg.DataResolutionMinutes
  1492. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  1493. if durStr == "" {
  1494. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1495. }
  1496. queryStatefulSetUptime := fmt.Sprintf(queryFmtStatefulSetUptime, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  1497. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryStatefulSetUptime)
  1498. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1499. return source.NewFuture(source.DecodeUptimeResult, ctx.QueryAtTime(queryStatefulSetUptime, end))
  1500. }
  1501. func (pds *PrometheusMetricsQuerier) QueryStatefulSetLabels(start, end time.Time) *source.Future[source.LabelsResult] {
  1502. const queryName = "QueryStatefulSetLabels"
  1503. const queryFmtStatefulSetLabels = `avg_over_time(statefulset_labels{%s}[%s])`
  1504. cfg := pds.promConfig
  1505. durStr := timeutil.DurationString(end.Sub(start))
  1506. if durStr == "" {
  1507. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1508. }
  1509. queryStatefulSetLabels := fmt.Sprintf(queryFmtStatefulSetLabels, cfg.ClusterFilter, durStr)
  1510. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryStatefulSetLabels)
  1511. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1512. return source.NewFuture(source.DecodeLabelsResult, ctx.QueryAtTime(queryStatefulSetLabels, end))
  1513. }
  1514. func (pds *PrometheusMetricsQuerier) QueryStatefulSetAnnotations(start, end time.Time) *source.Future[source.AnnotationsResult] {
  1515. const queryName = "QueryStatefulSetAnnotations"
  1516. const queryFmtStatefulSetAnnotations = `avg_over_time(statefulset_annotations{%s}[%s])`
  1517. cfg := pds.promConfig
  1518. durStr := timeutil.DurationString(end.Sub(start))
  1519. if durStr == "" {
  1520. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1521. }
  1522. queryStatefulSetAnnotations := fmt.Sprintf(queryFmtStatefulSetAnnotations, cfg.ClusterFilter, durStr)
  1523. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryStatefulSetAnnotations)
  1524. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1525. return source.NewFuture(source.DecodeAnnotationsResult, ctx.QueryAtTime(queryStatefulSetAnnotations, end))
  1526. }
  1527. func (pds *PrometheusMetricsQuerier) QueryStatefulSetMatchLabels(start, end time.Time) *source.Future[source.StatefulSetLabelsResult] {
  1528. const queryName = "QueryStatefulSetMatchLabels"
  1529. const queryFmtStatefulSetMatchLabels = `avg_over_time(statefulSet_match_labels{%s}[%s])`
  1530. cfg := pds.promConfig
  1531. durStr := timeutil.DurationString(end.Sub(start))
  1532. if durStr == "" {
  1533. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1534. }
  1535. queryStatefulSetMatchLabels := fmt.Sprintf(queryFmtStatefulSetMatchLabels, cfg.ClusterFilter, durStr)
  1536. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryStatefulSetMatchLabels)
  1537. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1538. return source.NewFuture(source.DecodeStatefulSetLabelsResult, ctx.QueryAtTime(queryStatefulSetMatchLabels, end))
  1539. }
  1540. func (pds *PrometheusMetricsQuerier) QueryDaemonSetInfo(start, end time.Time) *source.Future[source.DaemonSetInfoResult] {
  1541. const queryName = "QueryDaemonSetInfo"
  1542. const queryFmtDaemonSetInfo = `avg(avg_over_time(daemonset_info{%s}[%s])) by (%s, uid, namespace_uid, daemonset)`
  1543. cfg := pds.promConfig
  1544. durStr := timeutil.DurationString(end.Sub(start))
  1545. if durStr == "" {
  1546. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1547. }
  1548. queryDaemonSetInfo := fmt.Sprintf(queryFmtDaemonSetInfo, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1549. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryDaemonSetInfo)
  1550. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1551. return source.NewFuture(source.DecodeDaemonSetInfoResult, ctx.QueryAtTime(queryDaemonSetInfo, end))
  1552. }
  1553. func (pds *PrometheusMetricsQuerier) QueryDaemonSetUptime(start, end time.Time) *source.Future[source.UptimeResult] {
  1554. const queryName = "QueryDaemonSetUptime"
  1555. const queryFmtDaemonSetUptime = `avg(daemonset_info{%s}) by (%s, uid)[%s:%dm]`
  1556. cfg := pds.promConfig
  1557. minsPerResolution := cfg.DataResolutionMinutes
  1558. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  1559. if durStr == "" {
  1560. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1561. }
  1562. queryDaemonSetUptime := fmt.Sprintf(queryFmtDaemonSetUptime, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  1563. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryDaemonSetUptime)
  1564. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1565. return source.NewFuture(source.DecodeUptimeResult, ctx.QueryAtTime(queryDaemonSetUptime, end))
  1566. }
  1567. func (pds *PrometheusMetricsQuerier) QueryDaemonSetLabels(start, end time.Time) *source.Future[source.LabelsResult] {
  1568. const queryName = "QueryDaemonSetLabels"
  1569. const queryFmtDaemonSetLabels = `avg_over_time(daemonset_labels{%s}[%s])`
  1570. cfg := pds.promConfig
  1571. durStr := timeutil.DurationString(end.Sub(start))
  1572. if durStr == "" {
  1573. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1574. }
  1575. queryDaemonSetLabels := fmt.Sprintf(queryFmtDaemonSetLabels, cfg.ClusterFilter, durStr)
  1576. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryDaemonSetLabels)
  1577. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1578. return source.NewFuture(source.DecodeLabelsResult, ctx.QueryAtTime(queryDaemonSetLabels, end))
  1579. }
  1580. func (pds *PrometheusMetricsQuerier) QueryDaemonSetAnnotations(start, end time.Time) *source.Future[source.AnnotationsResult] {
  1581. const queryName = "QueryDaemonSetAnnotations"
  1582. const queryFmtDaemonSetAnnotations = `avg_over_time(daemonset_annotations{%s}[%s])`
  1583. cfg := pds.promConfig
  1584. durStr := timeutil.DurationString(end.Sub(start))
  1585. if durStr == "" {
  1586. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1587. }
  1588. queryDaemonSetAnnotations := fmt.Sprintf(queryFmtDaemonSetAnnotations, cfg.ClusterFilter, durStr)
  1589. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryDaemonSetAnnotations)
  1590. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1591. return source.NewFuture(source.DecodeAnnotationsResult, ctx.QueryAtTime(queryDaemonSetAnnotations, end))
  1592. }
  1593. func (pds *PrometheusMetricsQuerier) QueryJobInfo(start, end time.Time) *source.Future[source.JobInfoResult] {
  1594. const queryName = "QueryJobInfo"
  1595. const queryFmtJobInfo = `avg(avg_over_time(job_info{%s}[%s])) by (%s, uid, namespace_uid, job)`
  1596. cfg := pds.promConfig
  1597. durStr := timeutil.DurationString(end.Sub(start))
  1598. if durStr == "" {
  1599. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1600. }
  1601. queryJobInfo := fmt.Sprintf(queryFmtJobInfo, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1602. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryJobInfo)
  1603. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1604. return source.NewFuture(source.DecodeJobInfoResult, ctx.QueryAtTime(queryJobInfo, end))
  1605. }
  1606. func (pds *PrometheusMetricsQuerier) QueryJobUptime(start, end time.Time) *source.Future[source.UptimeResult] {
  1607. const queryName = "QueryJobUptime"
  1608. const queryFmtJobUptime = `avg(job_info{%s}) by (%s, uid)[%s:%dm]`
  1609. cfg := pds.promConfig
  1610. minsPerResolution := cfg.DataResolutionMinutes
  1611. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  1612. if durStr == "" {
  1613. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1614. }
  1615. queryJobUptime := fmt.Sprintf(queryFmtJobUptime, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  1616. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryJobUptime)
  1617. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1618. return source.NewFuture(source.DecodeUptimeResult, ctx.QueryAtTime(queryJobUptime, end))
  1619. }
  1620. func (pds *PrometheusMetricsQuerier) QueryJobLabels(start, end time.Time) *source.Future[source.LabelsResult] {
  1621. const queryName = "QueryJobLabels"
  1622. const queryFmtJobLabels = `avg_over_time(job_labels{%s}[%s])`
  1623. cfg := pds.promConfig
  1624. durStr := timeutil.DurationString(end.Sub(start))
  1625. if durStr == "" {
  1626. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1627. }
  1628. queryJobLabels := fmt.Sprintf(queryFmtJobLabels, cfg.ClusterFilter, durStr)
  1629. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryJobLabels)
  1630. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1631. return source.NewFuture(source.DecodeLabelsResult, ctx.QueryAtTime(queryJobLabels, end))
  1632. }
  1633. func (pds *PrometheusMetricsQuerier) QueryJobAnnotations(start, end time.Time) *source.Future[source.AnnotationsResult] {
  1634. const queryName = "QueryJobAnnotations"
  1635. const queryFmtJobAnnotations = `avg_over_time(job_annotations{%s}[%s])`
  1636. cfg := pds.promConfig
  1637. durStr := timeutil.DurationString(end.Sub(start))
  1638. if durStr == "" {
  1639. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1640. }
  1641. queryJobAnnotations := fmt.Sprintf(queryFmtJobAnnotations, cfg.ClusterFilter, durStr)
  1642. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryJobAnnotations)
  1643. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1644. return source.NewFuture(source.DecodeAnnotationsResult, ctx.QueryAtTime(queryJobAnnotations, end))
  1645. }
  1646. func (pds *PrometheusMetricsQuerier) QueryCronJobInfo(start, end time.Time) *source.Future[source.CronJobInfoResult] {
  1647. const queryName = "QueryCronJobInfo"
  1648. const queryFmtCronJobInfo = `avg(avg_over_time(cronjob_info{%s}[%s])) by (%s, uid, namespace_uid, cronjob)`
  1649. cfg := pds.promConfig
  1650. durStr := timeutil.DurationString(end.Sub(start))
  1651. if durStr == "" {
  1652. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1653. }
  1654. queryCronJobInfo := fmt.Sprintf(queryFmtCronJobInfo, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1655. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryCronJobInfo)
  1656. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1657. return source.NewFuture(source.DecodeCronJobInfoResult, ctx.QueryAtTime(queryCronJobInfo, end))
  1658. }
  1659. func (pds *PrometheusMetricsQuerier) QueryCronJobUptime(start, end time.Time) *source.Future[source.UptimeResult] {
  1660. const queryName = "QueryCronJobUptime"
  1661. const queryFmtCronJobUptime = `avg(cronjob_info{%s}) by (%s, uid)[%s:%dm]`
  1662. cfg := pds.promConfig
  1663. minsPerResolution := cfg.DataResolutionMinutes
  1664. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  1665. if durStr == "" {
  1666. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1667. }
  1668. queryCronJobUptime := fmt.Sprintf(queryFmtCronJobUptime, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  1669. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryCronJobUptime)
  1670. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1671. return source.NewFuture(source.DecodeUptimeResult, ctx.QueryAtTime(queryCronJobUptime, end))
  1672. }
  1673. func (pds *PrometheusMetricsQuerier) QueryCronJobLabels(start, end time.Time) *source.Future[source.LabelsResult] {
  1674. const queryName = "QueryCronJobLabels"
  1675. const queryFmtCronJobLabels = `avg_over_time(cronjob_labels{%s}[%s])`
  1676. cfg := pds.promConfig
  1677. durStr := timeutil.DurationString(end.Sub(start))
  1678. if durStr == "" {
  1679. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1680. }
  1681. queryCronJobLabels := fmt.Sprintf(queryFmtCronJobLabels, cfg.ClusterFilter, durStr)
  1682. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryCronJobLabels)
  1683. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1684. return source.NewFuture(source.DecodeLabelsResult, ctx.QueryAtTime(queryCronJobLabels, end))
  1685. }
  1686. func (pds *PrometheusMetricsQuerier) QueryCronJobAnnotations(start, end time.Time) *source.Future[source.AnnotationsResult] {
  1687. const queryName = "QueryCronJobAnnotations"
  1688. const queryFmtCronJobAnnotations = `avg_over_time(cronjob_annotations{%s}[%s])`
  1689. cfg := pds.promConfig
  1690. durStr := timeutil.DurationString(end.Sub(start))
  1691. if durStr == "" {
  1692. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1693. }
  1694. queryCronJobAnnotations := fmt.Sprintf(queryFmtCronJobAnnotations, cfg.ClusterFilter, durStr)
  1695. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryCronJobAnnotations)
  1696. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1697. return source.NewFuture(source.DecodeAnnotationsResult, ctx.QueryAtTime(queryCronJobAnnotations, end))
  1698. }
  1699. func (pds *PrometheusMetricsQuerier) QueryReplicaSetInfo(start, end time.Time) *source.Future[source.ReplicaSetInfoResult] {
  1700. const queryName = "QueryReplicaSetInfo"
  1701. const queryFmtReplicaSetInfo = `avg(avg_over_time(replicaset_info{%s}[%s])) by (%s, uid, namespace_uid, replicaset)`
  1702. cfg := pds.promConfig
  1703. durStr := timeutil.DurationString(end.Sub(start))
  1704. if durStr == "" {
  1705. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1706. }
  1707. queryReplicaSetInfo := fmt.Sprintf(queryFmtReplicaSetInfo, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1708. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryReplicaSetInfo)
  1709. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1710. return source.NewFuture(source.DecodeReplicaSetInfoResult, ctx.QueryAtTime(queryReplicaSetInfo, end))
  1711. }
  1712. func (pds *PrometheusMetricsQuerier) QueryReplicaSetUptime(start, end time.Time) *source.Future[source.UptimeResult] {
  1713. const queryName = "QueryReplicaSetUptime"
  1714. const queryFmtReplicaSetUptime = `avg(replicaset_info{%s}) by (%s, uid)[%s:%dm]`
  1715. cfg := pds.promConfig
  1716. minsPerResolution := cfg.DataResolutionMinutes
  1717. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  1718. if durStr == "" {
  1719. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1720. }
  1721. queryReplicaSetUptime := fmt.Sprintf(queryFmtReplicaSetUptime, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  1722. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryReplicaSetUptime)
  1723. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1724. return source.NewFuture(source.DecodeUptimeResult, ctx.QueryAtTime(queryReplicaSetUptime, end))
  1725. }
  1726. func (pds *PrometheusMetricsQuerier) QueryReplicaSetLabels(start, end time.Time) *source.Future[source.LabelsResult] {
  1727. const queryName = "QueryReplicaSetLabels"
  1728. const queryFmtReplicaSetLabels = `avg_over_time(replicaset_labels{%s}[%s])`
  1729. cfg := pds.promConfig
  1730. durStr := timeutil.DurationString(end.Sub(start))
  1731. if durStr == "" {
  1732. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1733. }
  1734. queryReplicaSetLabels := fmt.Sprintf(queryFmtReplicaSetLabels, cfg.ClusterFilter, durStr)
  1735. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryReplicaSetLabels)
  1736. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1737. return source.NewFuture(source.DecodeLabelsResult, ctx.QueryAtTime(queryReplicaSetLabels, end))
  1738. }
  1739. func (pds *PrometheusMetricsQuerier) QueryReplicaSetAnnotations(start, end time.Time) *source.Future[source.AnnotationsResult] {
  1740. const queryName = "QueryReplicaSetAnnotations"
  1741. const queryFmtReplicaSetAnnotations = `avg_over_time(replicaset_annotations{%s}[%s])`
  1742. cfg := pds.promConfig
  1743. durStr := timeutil.DurationString(end.Sub(start))
  1744. if durStr == "" {
  1745. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1746. }
  1747. queryReplicaSetAnnotations := fmt.Sprintf(queryFmtReplicaSetAnnotations, cfg.ClusterFilter, durStr)
  1748. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryReplicaSetAnnotations)
  1749. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1750. return source.NewFuture(source.DecodeAnnotationsResult, ctx.QueryAtTime(queryReplicaSetAnnotations, end))
  1751. }
  1752. func (pds *PrometheusMetricsQuerier) QueryReplicaSetOwners(start, end time.Time) *source.Future[source.OwnerResult] {
  1753. const queryName = "QueryReplicaSetOwners"
  1754. const queryFmtReplicaSetOwners = `avg(avg_over_time(kube_replicaset_owner{%s}[%s])) by (%s, uid, owner_uid, owner_kind)`
  1755. cfg := pds.promConfig
  1756. durStr := timeutil.DurationString(end.Sub(start))
  1757. if durStr == "" {
  1758. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1759. }
  1760. queryReplicaSetOwners := fmt.Sprintf(queryFmtReplicaSetOwners, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1761. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryReplicaSetOwners)
  1762. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1763. return source.NewFuture(source.DecodeOwnerResult, ctx.QueryAtTime(queryReplicaSetOwners, end))
  1764. }
  1765. func (pds *PrometheusMetricsQuerier) QueryPodsWithDaemonSetOwner(start, end time.Time) *source.Future[source.PodsWithDaemonSetOwnerResult] {
  1766. const queryName = "QueryPodsWithDaemonSetOwner"
  1767. const queryFmtPodsWithDaemonSetOwner = `sum(avg_over_time(kube_pod_owner{owner_kind="DaemonSet", %s}[%s])) by (pod, owner_name, namespace, uid, %s)`
  1768. cfg := pds.promConfig
  1769. durStr := timeutil.DurationString(end.Sub(start))
  1770. if durStr == "" {
  1771. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1772. }
  1773. queryPodsWithDaemonSetOwner := fmt.Sprintf(queryFmtPodsWithDaemonSetOwner, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1774. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPodsWithDaemonSetOwner)
  1775. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1776. return source.NewFuture(source.DecodePodsWithDaemonSetOwnerResult, ctx.QueryAtTime(queryPodsWithDaemonSetOwner, end))
  1777. }
  1778. func (pds *PrometheusMetricsQuerier) QueryPodsWithJobOwner(start, end time.Time) *source.Future[source.PodsWithJobOwnerResult] {
  1779. const queryName = "QueryPodsWithJobOwner"
  1780. const queryFmtPodsWithJobOwner = `sum(avg_over_time(kube_pod_owner{owner_kind="Job", %s}[%s])) by (pod, owner_name, namespace, uid, %s)`
  1781. cfg := pds.promConfig
  1782. durStr := timeutil.DurationString(end.Sub(start))
  1783. if durStr == "" {
  1784. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1785. }
  1786. queryPodsWithJobOwner := fmt.Sprintf(queryFmtPodsWithJobOwner, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1787. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPodsWithJobOwner)
  1788. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1789. return source.NewFuture(source.DecodePodsWithJobOwnerResult, ctx.QueryAtTime(queryPodsWithJobOwner, end))
  1790. }
  1791. func (pds *PrometheusMetricsQuerier) QueryPodsWithReplicaSetOwner(start, end time.Time) *source.Future[source.PodsWithReplicaSetOwnerResult] {
  1792. const queryName = "QueryPodsWithReplicaSetOwner"
  1793. const queryFmtPodsWithReplicaSetOwner = `sum(avg_over_time(kube_pod_owner{owner_kind="ReplicaSet", %s}[%s])) by (pod, owner_name, namespace, uid, %s)`
  1794. cfg := pds.promConfig
  1795. durStr := timeutil.DurationString(end.Sub(start))
  1796. if durStr == "" {
  1797. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1798. }
  1799. queryPodsWithReplicaSetOwner := fmt.Sprintf(queryFmtPodsWithReplicaSetOwner, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1800. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryPodsWithReplicaSetOwner)
  1801. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1802. return source.NewFuture(source.DecodePodsWithReplicaSetOwnerResult, ctx.QueryAtTime(queryPodsWithReplicaSetOwner, end))
  1803. }
  1804. func (pds *PrometheusMetricsQuerier) QueryReplicaSetsWithoutOwners(start, end time.Time) *source.Future[source.ReplicaSetsWithoutOwnersResult] {
  1805. const queryName = "QueryReplicaSetsWithoutOwners"
  1806. const queryFmtReplicaSetsWithoutOwners = `avg(avg_over_time(kube_replicaset_owner{owner_kind="<none>", owner_name="<none>", %s}[%s])) by (replicaset, namespace, uid, %s)`
  1807. cfg := pds.promConfig
  1808. durStr := timeutil.DurationString(end.Sub(start))
  1809. if durStr == "" {
  1810. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1811. }
  1812. queryReplicaSetsWithoutOwners := fmt.Sprintf(queryFmtReplicaSetsWithoutOwners, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1813. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryReplicaSetsWithoutOwners)
  1814. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1815. return source.NewFuture(source.DecodeReplicaSetsWithoutOwnersResult, ctx.QueryAtTime(queryReplicaSetsWithoutOwners, end))
  1816. }
  1817. func (pds *PrometheusMetricsQuerier) QueryReplicaSetsWithRollout(start, end time.Time) *source.Future[source.ReplicaSetsWithRolloutResult] {
  1818. const queryName = "QueryReplicaSetsWithRollout"
  1819. const queryFmtReplicaSetsWithRolloutOwner = `avg(avg_over_time(kube_replicaset_owner{owner_kind="Rollout", %s}[%s])) by (replicaset, namespace, owner_kind, owner_name, uid, %s)`
  1820. cfg := pds.promConfig
  1821. durStr := timeutil.DurationString(end.Sub(start))
  1822. if durStr == "" {
  1823. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1824. }
  1825. queryReplicaSetsWithRolloutOwner := fmt.Sprintf(queryFmtReplicaSetsWithRolloutOwner, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1826. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryReplicaSetsWithRolloutOwner)
  1827. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  1828. return source.NewFuture(source.DecodeReplicaSetsWithRolloutResult, ctx.QueryAtTime(queryReplicaSetsWithRolloutOwner, end))
  1829. }
  1830. // Note: The ResourceQuota metrics are _not_ emitted at the moment. Leaving the query implementations here in case we add metric emission later on.
  1831. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaInfo(start, end time.Time) *source.Future[source.ResourceQuotaInfoResult] {
  1832. const queryName = "QueryResourceQuotaInfo"
  1833. const queryFmtResourceQuotaInfo = `avg(avg_over_time(resourcequota_info{%s}[%s])) by (%s, uid, namespace_uid, resourcequota)`
  1834. cfg := pds.promConfig
  1835. durStr := timeutil.DurationString(end.Sub(start))
  1836. if durStr == "" {
  1837. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1838. }
  1839. queryResourceQuotaInfo := fmt.Sprintf(queryFmtResourceQuotaInfo, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1840. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaInfo)
  1841. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1842. return source.NewFuture(source.DecodeResourceQuotaInfoResult, ctx.QueryAtTime(queryResourceQuotaInfo, end))
  1843. }
  1844. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaUptime(start, end time.Time) *source.Future[source.UptimeResult] {
  1845. const queryName = "QueryResourceQuotaUptime"
  1846. const queryFmtResourceQuotaUptime = `avg(resourcequota_info{%s}) by (%s, uid)[%s:%dm]`
  1847. cfg := pds.promConfig
  1848. minsPerResolution := cfg.DataResolutionMinutes
  1849. durStr := pds.durationStringFor(start, end, minsPerResolution, false)
  1850. if durStr == "" {
  1851. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1852. }
  1853. queryResourceQuotaUptime := fmt.Sprintf(queryFmtResourceQuotaUptime, cfg.ClusterFilter, cfg.ClusterLabel, durStr, minsPerResolution)
  1854. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryFmtResourceQuotaUptime)
  1855. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1856. return source.NewFuture(source.DecodeUptimeResult, ctx.QueryAtTime(queryResourceQuotaUptime, end))
  1857. }
  1858. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaSpecCPURequestAverage(start, end time.Time) *source.Future[source.ResourceResult] {
  1859. const queryName = "QueryResourceQuotaSpecCPURequestAverage"
  1860. const queryFmtResourceQuotaSpecCPURequests = `avg(avg_over_time(resourcequota_spec_resource_requests{resource="cpu",unit="core", %s}[%s])) by (resourcequota, namespace, uid, %s)`
  1861. cfg := pds.promConfig
  1862. durStr := timeutil.DurationString(end.Sub(start))
  1863. if durStr == "" {
  1864. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1865. }
  1866. queryResourceQuotaSpecCPURequests := fmt.Sprintf(queryFmtResourceQuotaSpecCPURequests, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1867. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaSpecCPURequests)
  1868. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1869. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryResourceQuotaSpecCPURequests, end))
  1870. }
  1871. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaSpecCPURequestMax(start, end time.Time) *source.Future[source.ResourceResult] {
  1872. const queryName = "QueryResourceQuotaSpecCPURequestMax"
  1873. const queryFmtResourceQuotaSpecCPURequests = `max(max_over_time(resourcequota_spec_resource_requests{resource="cpu",unit="core", %s}[%s])) by (resourcequota, namespace, uid, %s)`
  1874. cfg := pds.promConfig
  1875. durStr := timeutil.DurationString(end.Sub(start))
  1876. if durStr == "" {
  1877. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1878. }
  1879. queryResourceQuotaSpecCPURequests := fmt.Sprintf(queryFmtResourceQuotaSpecCPURequests, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1880. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaSpecCPURequests)
  1881. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1882. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryResourceQuotaSpecCPURequests, end))
  1883. }
  1884. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaSpecRAMRequestAverage(start, end time.Time) *source.Future[source.ResourceResult] {
  1885. const queryName = "QueryResourceQuotaSpecRAMRequestAverage"
  1886. const queryFmtResourceQuotaSpecRAMRequests = `avg(avg_over_time(resourcequota_spec_resource_requests{resource="memory",unit="byte", %s}[%s])) by (resourcequota, namespace, uid, %s)`
  1887. cfg := pds.promConfig
  1888. durStr := timeutil.DurationString(end.Sub(start))
  1889. if durStr == "" {
  1890. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1891. }
  1892. queryResourceQuotaSpecRAMRequests := fmt.Sprintf(queryFmtResourceQuotaSpecRAMRequests, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1893. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaSpecRAMRequests)
  1894. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1895. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryResourceQuotaSpecRAMRequests, end))
  1896. }
  1897. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaSpecRAMRequestMax(start, end time.Time) *source.Future[source.ResourceResult] {
  1898. const queryName = "QueryResourceQuotaSpecRAMRequestMax"
  1899. const queryFmtResourceQuotaSpecRAMRequests = `max(max_over_time(resourcequota_spec_resource_requests{resource="memory",unit="byte", %s}[%s])) by (resourcequota, namespace, uid, %s)`
  1900. cfg := pds.promConfig
  1901. durStr := timeutil.DurationString(end.Sub(start))
  1902. if durStr == "" {
  1903. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1904. }
  1905. queryResourceQuotaSpecRAMRequests := fmt.Sprintf(queryFmtResourceQuotaSpecRAMRequests, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1906. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaSpecRAMRequests)
  1907. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1908. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryResourceQuotaSpecRAMRequests, end))
  1909. }
  1910. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaSpecCPULimitAverage(start, end time.Time) *source.Future[source.ResourceResult] {
  1911. const queryName = "QueryResourceQuotaSpecCPULimitAverage"
  1912. const queryFmtResourceQuotaSpecCPULimits = `avg(avg_over_time(resourcequota_spec_resource_limits{resource="cpu",unit="core", %s}[%s])) by (resourcequota, namespace, uid, %s)`
  1913. cfg := pds.promConfig
  1914. durStr := timeutil.DurationString(end.Sub(start))
  1915. if durStr == "" {
  1916. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1917. }
  1918. queryResourceQuotaSpecCPULimits := fmt.Sprintf(queryFmtResourceQuotaSpecCPULimits, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1919. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaSpecCPULimits)
  1920. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1921. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryResourceQuotaSpecCPULimits, end))
  1922. }
  1923. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaSpecCPULimitMax(start, end time.Time) *source.Future[source.ResourceResult] {
  1924. const queryName = "QueryResourceQuotaSpecCPULimitMax"
  1925. const queryFmtResourceQuotaSpecCPULimits = `max(max_over_time(resourcequota_spec_resource_limits{resource="cpu",unit="core", %s}[%s])) by (resourcequota, namespace, uid, %s)`
  1926. cfg := pds.promConfig
  1927. durStr := timeutil.DurationString(end.Sub(start))
  1928. if durStr == "" {
  1929. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1930. }
  1931. queryResourceQuotaSpecCPULimits := fmt.Sprintf(queryFmtResourceQuotaSpecCPULimits, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1932. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaSpecCPULimits)
  1933. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1934. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryResourceQuotaSpecCPULimits, end))
  1935. }
  1936. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaSpecRAMLimitAverage(start, end time.Time) *source.Future[source.ResourceResult] {
  1937. const queryName = "QueryResourceQuotaSpecRAMLimitAverage"
  1938. const queryFmtResourceQuotaSpecRAMLimits = `avg(avg_over_time(resourcequota_spec_resource_limits{resource="memory",unit="byte", %s}[%s])) by (resourcequota, namespace, uid, %s)`
  1939. cfg := pds.promConfig
  1940. durStr := timeutil.DurationString(end.Sub(start))
  1941. if durStr == "" {
  1942. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1943. }
  1944. queryResourceQuotaSpecRAMLimits := fmt.Sprintf(queryFmtResourceQuotaSpecRAMLimits, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1945. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaSpecRAMLimits)
  1946. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1947. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryResourceQuotaSpecRAMLimits, end))
  1948. }
  1949. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaSpecRAMLimitMax(start, end time.Time) *source.Future[source.ResourceResult] {
  1950. const queryName = "QueryResourceQuotaSpecRAMLimitMax"
  1951. const queryFmtResourceQuotaSpecRAMLimits = `max(max_over_time(resourcequota_spec_resource_limits{resource="memory",unit="byte", %s}[%s])) by (resourcequota, namespace, uid, %s)`
  1952. cfg := pds.promConfig
  1953. durStr := timeutil.DurationString(end.Sub(start))
  1954. if durStr == "" {
  1955. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1956. }
  1957. queryResourceQuotaSpecRAMLimits := fmt.Sprintf(queryFmtResourceQuotaSpecRAMLimits, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1958. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaSpecRAMLimits)
  1959. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1960. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryResourceQuotaSpecRAMLimits, end))
  1961. }
  1962. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaStatusUsedCPURequestAverage(start, end time.Time) *source.Future[source.ResourceResult] {
  1963. const queryName = "QueryResourceQuotaStatusUsedCPURequestAverage"
  1964. const queryFmtResourceQuotaStatusUsedCPURequests = `avg(avg_over_time(resourcequota_status_used_resource_requests{resource="cpu",unit="core", %s}[%s])) by (resourcequota, namespace, uid, %s)`
  1965. cfg := pds.promConfig
  1966. durStr := timeutil.DurationString(end.Sub(start))
  1967. if durStr == "" {
  1968. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1969. }
  1970. queryResourceQuotaStatusUsedCPURequests := fmt.Sprintf(queryFmtResourceQuotaStatusUsedCPURequests, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1971. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaStatusUsedCPURequests)
  1972. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1973. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryResourceQuotaStatusUsedCPURequests, end))
  1974. }
  1975. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaStatusUsedCPURequestMax(start, end time.Time) *source.Future[source.ResourceResult] {
  1976. const queryName = "QueryResourceQuotaStatusUsedCPURequestMax"
  1977. const queryFmtResourceQuotaStatusUsedCPURequests = `max(max_over_time(resourcequota_status_used_resource_requests{resource="cpu",unit="core", %s}[%s])) by (resourcequota, namespace, uid, %s)`
  1978. cfg := pds.promConfig
  1979. durStr := timeutil.DurationString(end.Sub(start))
  1980. if durStr == "" {
  1981. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1982. }
  1983. queryResourceQuotaStatusUsedCPURequests := fmt.Sprintf(queryFmtResourceQuotaStatusUsedCPURequests, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1984. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaStatusUsedCPURequests)
  1985. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1986. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryResourceQuotaStatusUsedCPURequests, end))
  1987. }
  1988. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaStatusUsedRAMRequestAverage(start, end time.Time) *source.Future[source.ResourceResult] {
  1989. const queryName = "QueryResourceQuotaStatusUsedRAMRequestAverage"
  1990. const queryFmtResourceQuotaStatusUsedRAMRequests = `avg(avg_over_time(resourcequota_status_used_resource_requests{resource="memory",unit="byte", %s}[%s])) by (resourcequota, namespace, uid, %s)`
  1991. cfg := pds.promConfig
  1992. durStr := timeutil.DurationString(end.Sub(start))
  1993. if durStr == "" {
  1994. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  1995. }
  1996. queryResourceQuotaStatusUsedRAMRequests := fmt.Sprintf(queryFmtResourceQuotaStatusUsedRAMRequests, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  1997. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaStatusUsedRAMRequests)
  1998. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  1999. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryResourceQuotaStatusUsedRAMRequests, end))
  2000. }
  2001. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaStatusUsedRAMRequestMax(start, end time.Time) *source.Future[source.ResourceResult] {
  2002. const queryName = "QueryResourceQuotaStatusUsedRAMRequestMax"
  2003. const queryFmtResourceQuotaStatusUsedRAMRequests = `max(max_over_time(resourcequota_status_used_resource_requests{resource="memory",unit="byte", %s}[%s])) by (resourcequota, namespace, uid, %s)`
  2004. cfg := pds.promConfig
  2005. durStr := timeutil.DurationString(end.Sub(start))
  2006. if durStr == "" {
  2007. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  2008. }
  2009. queryResourceQuotaStatusUsedRAMRequests := fmt.Sprintf(queryFmtResourceQuotaStatusUsedRAMRequests, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  2010. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaStatusUsedRAMRequests)
  2011. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  2012. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryResourceQuotaStatusUsedRAMRequests, end))
  2013. }
  2014. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaStatusUsedCPULimitAverage(start, end time.Time) *source.Future[source.ResourceResult] {
  2015. const queryName = "QueryResourceQuotaStatusUsedCPULimitAverage"
  2016. const queryFmtResourceQuotaStatusUsedCPULimits = `avg(avg_over_time(resourcequota_status_used_resource_limits{resource="cpu",unit="core", %s}[%s])) by (resourcequota, namespace, uid, %s)`
  2017. cfg := pds.promConfig
  2018. durStr := timeutil.DurationString(end.Sub(start))
  2019. if durStr == "" {
  2020. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  2021. }
  2022. queryResourceQuotaStatusUsedCPULimits := fmt.Sprintf(queryFmtResourceQuotaStatusUsedCPULimits, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  2023. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaStatusUsedCPULimits)
  2024. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  2025. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryResourceQuotaStatusUsedCPULimits, end))
  2026. }
  2027. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaStatusUsedCPULimitMax(start, end time.Time) *source.Future[source.ResourceResult] {
  2028. const queryName = "QueryResourceQuotaStatusUsedCPULimitMax"
  2029. const queryFmtResourceQuotaStatusUsedCPULimits = `max(max_over_time(resourcequota_status_used_resource_limits{resource="cpu",unit="core", %s}[%s])) by (resourcequota, namespace, uid, %s)`
  2030. cfg := pds.promConfig
  2031. durStr := timeutil.DurationString(end.Sub(start))
  2032. if durStr == "" {
  2033. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  2034. }
  2035. queryResourceQuotaStatusUsedCPULimits := fmt.Sprintf(queryFmtResourceQuotaStatusUsedCPULimits, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  2036. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaStatusUsedCPULimits)
  2037. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  2038. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryResourceQuotaStatusUsedCPULimits, end))
  2039. }
  2040. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaStatusUsedRAMLimitAverage(start, end time.Time) *source.Future[source.ResourceResult] {
  2041. const queryName = "QueryResourceQuotaStatusUsedRAMLimitAverage"
  2042. const queryFmtResourceQuotaStatusUsedRAMLimits = `avg(avg_over_time(resourcequota_status_used_resource_limits{resource="memory",unit="byte", %s}[%s])) by (resourcequota, namespace, uid, %s)`
  2043. cfg := pds.promConfig
  2044. durStr := timeutil.DurationString(end.Sub(start))
  2045. if durStr == "" {
  2046. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  2047. }
  2048. queryResourceQuotaStatusUsedRAMLimits := fmt.Sprintf(queryFmtResourceQuotaStatusUsedRAMLimits, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  2049. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaStatusUsedRAMLimits)
  2050. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  2051. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryResourceQuotaStatusUsedRAMLimits, end))
  2052. }
  2053. func (pds *PrometheusMetricsQuerier) QueryResourceQuotaStatusUsedRAMLimitMax(start, end time.Time) *source.Future[source.ResourceResult] {
  2054. const queryName = "QueryResourceQuotaStatusUsedRAMLimitMax"
  2055. const queryFmtResourceQuotaStatusUsedRAMLimits = `max(max_over_time(resourcequota_status_used_resource_limits{resource="memory",unit="byte", %s}[%s])) by (resourcequota, namespace, uid, %s)`
  2056. cfg := pds.promConfig
  2057. durStr := timeutil.DurationString(end.Sub(start))
  2058. if durStr == "" {
  2059. panic(fmt.Sprintf("failed to parse duration string passed to %s", queryName))
  2060. }
  2061. queryResourceQuotaStatusUsedRAMLimits := fmt.Sprintf(queryFmtResourceQuotaStatusUsedRAMLimits, cfg.ClusterFilter, durStr, cfg.ClusterLabel)
  2062. log.Debugf(PrometheusMetricsQueryLogFormat, queryName, end.Unix(), queryResourceQuotaStatusUsedRAMLimits)
  2063. ctx := pds.promContexts.NewNamedContext(KubeModelContextName)
  2064. return source.NewFuture(source.DecodeResourceResult, ctx.QueryAtTime(queryResourceQuotaStatusUsedRAMLimits, end))
  2065. }
  2066. func (pds *PrometheusMetricsQuerier) QueryDataCoverage(limitDays int) (time.Time, time.Time, error) {
  2067. const (
  2068. queryName = "QueryDataCoverage"
  2069. queryFmtOldestSample = `min_over_time(timestamp(group(node_cpu_hourly_cost{%s}))[%s:%s])`
  2070. queryFmtNewestSample = `max_over_time(timestamp(group(node_cpu_hourly_cost{%s}))[%s:%s])`
  2071. )
  2072. cfg := pds.promConfig
  2073. minutesPerDuration := 60
  2074. dur := time.Duration(limitDays) * timeutil.Day
  2075. end := time.Now().UTC().Truncate(timeutil.Day).Add(timeutil.Day)
  2076. start := end.Add(-dur)
  2077. durStr := pds.durationStringFor(start, end, minutesPerDuration, false)
  2078. ctx := pds.promContexts.NewNamedContext(AllocationContextName)
  2079. queryOldest := fmt.Sprintf(queryFmtOldestSample, cfg.ClusterFilter, durStr, "1h")
  2080. log.Debugf("[Prometheus][%s[Oldest]][At Time: %d]: %s", queryName, end.Unix(), queryOldest)
  2081. resOldestFut := ctx.QueryAtTime(queryOldest, end)
  2082. resOldest, err := resOldestFut.Await()
  2083. if err != nil {
  2084. return time.Time{}, time.Time{}, fmt.Errorf("querying oldest sample: %w", err)
  2085. }
  2086. if len(resOldest) == 0 || len(resOldest[0].Values) == 0 {
  2087. // If node_cpu_hourly_cost metric is not available, fallback to a reasonable time range
  2088. // This prevents CSV export from failing when the metric doesn't exist yet
  2089. log.Warnf("QueryDataCoverage: node_cpu_hourly_cost metric not available, using fallback time range")
  2090. // Use a reasonable fallback: start from 1 day ago to account for metric collection delay
  2091. fallbackEnd := time.Now().UTC().Truncate(timeutil.Day)
  2092. fallbackStart := fallbackEnd.AddDate(0, 0, -1) // 1 day ago
  2093. return fallbackStart, fallbackEnd, nil
  2094. }
  2095. oldest := time.Unix(int64(resOldest[0].Values[0].Value), 0)
  2096. queryNewest := fmt.Sprintf(queryFmtNewestSample, cfg.ClusterFilter, durStr, "1h")
  2097. log.Debugf("[Prometheus][%s[Newest]][At Time: %d]: %s", queryName, end.Unix(), queryNewest)
  2098. resNewestFut := ctx.QueryAtTime(queryNewest, end)
  2099. resNewest, err := resNewestFut.Await()
  2100. if err != nil {
  2101. return time.Time{}, time.Time{}, fmt.Errorf("querying newest sample: %w", err)
  2102. }
  2103. if len(resNewest) == 0 || len(resNewest[0].Values) == 0 {
  2104. // If newest query fails but oldest succeeded, use oldest as both start and end
  2105. // This allows CSV export to proceed with at least some time range
  2106. log.Warnf("QueryDataCoverage: newest sample query returned no results, using oldest timestamp")
  2107. return oldest, oldest, nil
  2108. }
  2109. newest := time.Unix(int64(resNewest[0].Values[0].Value), 0)
  2110. return oldest, newest, nil
  2111. }
  2112. // durationStringFor simplifies the determination of query duration based on the version of prom and if the function
  2113. // in the query needs all data points in the vector it is provided or if it will extrapolate its own. Functions
  2114. // that extrapolate will add on another resolution if given a duration that is one resolution longer than the intended
  2115. // duration.
  2116. func (pds *PrometheusMetricsQuerier) durationStringFor(start, end time.Time, minsPerResolution int, extrapolated bool) string {
  2117. dur := end.Sub(start)
  2118. // If using a version of Prometheus where the resolution needs duration offset,
  2119. // we need to apply that here.
  2120. //
  2121. // E.g. avg(node_total_hourly_cost{}) by (node, provider_id)[60m:5m] with
  2122. // time=01:00:00 will return, for a node running the entire time, 12
  2123. // timestamps where the first is 00:05:00 and the last is 01:00:00.
  2124. // However, OpenCost expects for there to be 13 timestamps where the first
  2125. // begins at 00:00:00. To achieve this, we must modify our query to
  2126. // avg(node_total_hourly_cost{}) by (node, provider_id)[65m:5m]
  2127. if pds.promConfig.IsOffsetResolution && !extrapolated {
  2128. // increase the query time by the resolution
  2129. dur = dur + (time.Duration(minsPerResolution) * time.Minute)
  2130. }
  2131. return timeutil.DurationString(dur)
  2132. }