awsprovider.go 67 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
7227822792280228122822283228422852286228722882289229022912292229322942295229622972298
  1. package cloud
import (
	"bytes"
	"compress/gzip"
	"context"
	"encoding/csv"
	"fmt"
	"io"
	"net/http"
	"os"
	"regexp"
	"sort"
	"strconv"
	"strings"
	"sync"
	"time"

	awsSDK "github.com/aws/aws-sdk-go-v2/aws"
	"github.com/aws/aws-sdk-go-v2/config"
	"github.com/aws/aws-sdk-go-v2/credentials/stscreds"
	"github.com/aws/aws-sdk-go-v2/feature/s3/manager"
	"github.com/aws/aws-sdk-go-v2/service/athena"
	athenaTypes "github.com/aws/aws-sdk-go-v2/service/athena/types"
	"github.com/aws/aws-sdk-go-v2/service/ec2"
	ec2Types "github.com/aws/aws-sdk-go-v2/service/ec2/types"
	"github.com/aws/aws-sdk-go-v2/service/s3"
	"github.com/aws/aws-sdk-go-v2/service/sts"
	"github.com/jszwec/csvutil"
	"github.com/opencost/opencost/pkg/clustercache"
	"github.com/opencost/opencost/pkg/env"
	errs "github.com/opencost/opencost/pkg/errors"
	"github.com/opencost/opencost/pkg/kubecost"
	"github.com/opencost/opencost/pkg/log"
	"github.com/opencost/opencost/pkg/util"
	"github.com/opencost/opencost/pkg/util/fileutil"
	"github.com/opencost/opencost/pkg/util/json"
	"github.com/opencost/opencost/pkg/util/timeutil"
	v1 "k8s.io/api/core/v1"
)
// Identifiers and fixed values used by the AWS provider.
const (
	// supportedSpotFeedVersion is the spot data feed version this provider accepts
	// (presumably compared with the major version captured by versionRx — confirm at the use site).
	supportedSpotFeedVersion = "1"
	// SpotInfoUpdateType and AthenaInfoUpdateType are the updateType values that
	// UpdateConfig treats as spot-feed and Athena configuration payloads.
	SpotInfoUpdateType   = "spotinfo"
	AthenaInfoUpdateType = "athenainfo"
	// PreemptibleType is the usage-type component appended to pricing keys of spot nodes.
	PreemptibleType = "preemptible"
	// Names under which pricing sources are reported.
	APIPricingSource              = "Public API"
	SpotPricingSource             = "Spot Data Feed"
	ReservedInstancePricingSource = "Savings Plan, Reserved Instance, and Out-Of-Cluster"
	// Resource state strings (NOTE(review): presumably EC2 volume / address states — confirm at the use site).
	InUseState    = "in-use"
	AttachedState = "attached"
	// AWSHourlyPublicIPCost is the hourly cost applied to a public IP
	// (currency is not stated here; presumably USD — confirm).
	AWSHourlyPublicIPCost = 0.005
	// EKSCapacityTypeLabel is the node label inspected by getUsageType, and
	// EKSCapacitySpotTypeValue is the label value that marks a node as spot.
	EKSCapacityTypeLabel     = "eks.amazonaws.com/capacityType"
	EKSCapacitySpotTypeValue = "SPOT"
)
// Regular expressions compiled once at package initialization.
var (
	// provIdRx matches provider IDs of the form aws:///us-east-2a/i-0fea4fd46592d050b.
	// Capture group 1 is the segment after "aws:///" (us-east-2a in the example) and
	// group 2 is the instance ID (i-0fea4fd46592d050b), if it exists.
	provIdRx = regexp.MustCompile("aws:///([^/]+)/([^/]+)")
	// usageTypeRegx captures (group 2) the trailing "EBS..." portion of a string,
	// where "EBS" either starts the string or follows a "-".
	usageTypeRegx = regexp.MustCompile(".*(-|^)(EBS.+)")
	// versionRx matches a whole "#Version: <major>.<minor>" line and captures the major number.
	versionRx = regexp.MustCompile("^#Version: (\\d+)\\.\\d+$")
	// regionRx captures a substring shaped like letters-letters-digit, e.g. us-east-2.
	regionRx = regexp.MustCompile("([a-z]+-[a-z]+-[0-9])")
)
  59. func (aws *AWS) PricingSourceStatus() map[string]*PricingSource {
  60. sources := make(map[string]*PricingSource)
  61. sps := &PricingSource{
  62. Name: SpotPricingSource,
  63. Enabled: true,
  64. }
  65. if !aws.SpotRefreshEnabled() {
  66. sps.Available = false
  67. sps.Error = "Spot instances not set up"
  68. sps.Enabled = false
  69. } else {
  70. sps.Error = ""
  71. if aws.SpotPricingError != nil {
  72. sps.Error = aws.SpotPricingError.Error()
  73. }
  74. if sps.Error != "" {
  75. sps.Available = false
  76. } else if len(aws.SpotPricingByInstanceID) > 0 {
  77. sps.Available = true
  78. } else {
  79. sps.Error = "No spot instances detected"
  80. }
  81. }
  82. sources[SpotPricingSource] = sps
  83. rps := &PricingSource{
  84. Name: ReservedInstancePricingSource,
  85. Enabled: true,
  86. }
  87. rps.Error = ""
  88. if aws.RIPricingError != nil {
  89. rps.Error = aws.RIPricingError.Error()
  90. }
  91. if rps.Error != "" {
  92. rps.Available = false
  93. } else {
  94. rps.Available = true
  95. }
  96. sources[ReservedInstancePricingSource] = rps
  97. return sources
  98. }
// SpotRefreshDuration is how often spot data is refreshed.
const SpotRefreshDuration = 15 * time.Minute
// awsRegions lists the AWS region identifiers known to this provider.
var awsRegions = []string{
	"us-east-2",
	"us-east-1",
	"us-west-1",
	"us-west-2",
	"ap-east-1",
	"ap-south-1",
	"ap-northeast-3",
	"ap-northeast-2",
	"ap-southeast-1",
	"ap-southeast-2",
	"ap-northeast-1",
	"ap-southeast-3",
	"ca-central-1",
	"cn-north-1",
	"cn-northwest-1",
	"eu-central-1",
	"eu-west-1",
	"eu-west-2",
	"eu-west-3",
	"eu-north-1",
	"eu-south-1",
	"me-south-1",
	"sa-east-1",
	"af-south-1",
	"us-gov-east-1",
	"us-gov-west-1",
}
// AWS represents an Amazon Provider
type AWS struct {
	// Pricing holds product terms keyed by feature string; PVPricing looks
	// entries up with PVKey.Features().
	Pricing map[string]*AWSProductTerms

	// Spot pricing state. SpotPricingError and SpotPricingByInstanceID are
	// reported through PricingSourceStatus.
	// NOTE(review): SpotPricingLock presumably guards these fields — confirm at the writers.
	SpotPricingByInstanceID map[string]*spotInfo
	SpotPricingUpdatedAt    *time.Time
	SpotRefreshRunning      bool
	SpotPricingLock         sync.RWMutex
	SpotPricingError        error

	// Reserved-instance pricing state. RIPricingError is reported through
	// PricingSourceStatus.
	RIPricingByInstanceID map[string]*RIData
	RIPricingError        error
	RIDataRunning         bool
	RIDataLock            sync.RWMutex

	// Savings plan state.
	SavingsPlanDataByInstanceID map[string]*SavingsPlanData
	SavingsPlanDataRunning      bool
	SavingsPlanDataLock         sync.RWMutex

	ValidPricingKeys map[string]bool
	// Clientset is the cluster cache used to list nodes (see GetManagementPlatform).
	Clientset clustercache.ClusterCache

	// Base prices, kept as strings.
	BaseCPUPrice     string
	BaseRAMPrice     string
	BaseGPUPrice     string
	BaseSpotCPUPrice string
	BaseSpotRAMPrice string
	BaseSpotGPUPrice string

	// SpotLabelName and SpotLabelValue are copied into every awsKey by GetKey
	// and identify spot nodes by label.
	SpotLabelName  string
	SpotLabelValue string

	// Spot data feed location.
	SpotDataRegion string
	SpotDataBucket string
	SpotDataPrefix string

	ProjectID               string
	DownloadPricingDataLock sync.RWMutex
	// Config provides access to the custom pricing configuration
	// (see GetConfig and UpdateConfig).
	Config               *ProviderConfig
	serviceAccountChecks *ServiceAccountChecks
	// clusterManagementPrice and clusterProvisioner are returned by
	// ClusterManagementPricing.
	clusterManagementPrice float64
	clusterAccountId       string
	clusterRegion          string
	clusterProvisioner     string
	*CustomProvider
}
// AWSAccessKey holds AWS credentials and fulfils the AWS SDK v2
// CredentialsProvider interface (see Retrieve).
type AWSAccessKey struct {
	// AccessKeyID is the access key identifier.
	AccessKeyID string `json:"aws_access_key_id"`
	// SecretAccessKey is the secret paired with AccessKeyID.
	SecretAccessKey string `json:"aws_secret_access_key"`
}
  172. // Retrieve returns a set of awsV2 credentials using the AWSAccessKey's key and secret.
  173. // This fulfils the awsV2.CredentialsProvider interface contract.
  174. func (accessKey AWSAccessKey) Retrieve(ctx context.Context) (awsSDK.Credentials, error) {
  175. return awsSDK.Credentials{
  176. AccessKeyID: accessKey.AccessKeyID,
  177. SecretAccessKey: accessKey.SecretAccessKey,
  178. }, nil
  179. }
  180. // CreateConfig creates an AWS SDK V2 Config for the credentials that it contains for the provided region
  181. func (accessKey AWSAccessKey) CreateConfig(region string) (awsSDK.Config, error) {
  182. var cfg awsSDK.Config
  183. var err error
  184. // If accessKey values have not been provided, attempt to load cfg from service key annotations
  185. if accessKey.AccessKeyID == "" && accessKey.SecretAccessKey == "" {
  186. cfg, err = config.LoadDefaultConfig(context.TODO(), config.WithRegion(region))
  187. if err != nil {
  188. return cfg, fmt.Errorf("failed to initialize AWS SDK config for region from annotation %s: %s", region, err)
  189. }
  190. } else {
  191. // The AWS SDK v2 requires an object fulfilling the CredentialsProvider interface, which cloud.AWSAccessKey does
  192. cfg, err = config.LoadDefaultConfig(context.TODO(), config.WithCredentialsProvider(accessKey), config.WithRegion(region))
  193. if err != nil {
  194. return cfg, fmt.Errorf("failed to initialize AWS SDK config for region %s: %s", region, err)
  195. }
  196. }
  197. return cfg, nil
  198. }
// AWSPricing maps a k8s node to an AWS Pricing "product"
type AWSPricing struct {
	// Products holds the products from the "products" JSON object, keyed by its member names.
	Products map[string]*AWSProduct `json:"products"`
	// Terms holds the OnDemand and Reserved offer terms.
	Terms AWSPricingTerms `json:"terms"`
}
// AWSProduct represents a purchased SKU
type AWSProduct struct {
	// Sku is the product's SKU identifier.
	Sku string `json:"sku"`
	// Attributes carries the metadata used to map the product to a node.
	Attributes AWSProductAttributes `json:"attributes"`
}
// AWSProductAttributes represents metadata about the product used to map to a node.
// All values are kept as the strings found in the pricing JSON.
type AWSProductAttributes struct {
	// Location is the region name as it appears in billing data
	// (see locationToRegion for the translation to region identifiers).
	Location        string `json:"location"`
	InstanceType    string `json:"instanceType"`
	Memory          string `json:"memory"`
	Storage         string `json:"storage"`
	VCpu            string `json:"vcpu"`
	UsageType       string `json:"usagetype"`
	OperatingSystem string `json:"operatingSystem"`
	PreInstalledSw  string `json:"preInstalledSw"`
	InstanceFamily  string `json:"instanceFamily"`
	CapacityStatus  string `json:"capacitystatus"`
	GPU             string `json:"gpu"` // GPU represents the number of GPU on the instance
}
// AWSPricingTerms are how you pay for the node: OnDemand, Reserved, or (TODO) Spot
// Each field is a two-level map of offer terms
// (NOTE(review): presumably SKU, then offer term code — confirm against the pricing JSON).
type AWSPricingTerms struct {
	OnDemand map[string]map[string]*AWSOfferTerm `json:"OnDemand"`
	Reserved map[string]map[string]*AWSOfferTerm `json:"Reserved"`
}
  228. // AWSOfferTerm is a sku extension used to pay for the node.
  229. type AWSOfferTerm struct {
  230. Sku string `json:"sku"`
  231. PriceDimensions map[string]*AWSRateCode `json:"priceDimensions"`
  232. }
  233. func (ot *AWSOfferTerm) String() string {
  234. var strs []string
  235. for k, rc := range ot.PriceDimensions {
  236. strs = append(strs, fmt.Sprintf("%s:%s", k, rc.String()))
  237. }
  238. return fmt.Sprintf("%s:%s", ot.Sku, strings.Join(strs, ","))
  239. }
  240. // AWSRateCode encodes data about the price of a product
  241. type AWSRateCode struct {
  242. Unit string `json:"unit"`
  243. PricePerUnit AWSCurrencyCode `json:"pricePerUnit"`
  244. }
  245. func (rc *AWSRateCode) String() string {
  246. return fmt.Sprintf("{unit: %s, pricePerUnit: %v", rc.Unit, rc.PricePerUnit)
  247. }
  248. // AWSCurrencyCode is the localized currency. (TODO: support non-USD)
  249. type AWSCurrencyCode struct {
  250. USD string `json:"USD,omitempty"`
  251. CNY string `json:"CNY,omitempty"`
  252. }
// AWSProductTerms represents the full terms of the product
type AWSProductTerms struct {
	Sku string `json:"sku"`
	// OnDemand and Reserved are the offer terms for the two purchase options.
	OnDemand *AWSOfferTerm `json:"OnDemand"`
	Reserved *AWSOfferTerm `json:"Reserved"`
	Memory   string        `json:"memory"`
	Storage  string        `json:"storage"`
	VCpu     string        `json:"vcpu"`
	GPU      string        `json:"gpu"` // GPU represents the number of GPU on the instance
	// PV is the persistent volume pricing returned by PVPricing for this entry.
	PV *PV `json:"pv"`
}
// ClusterIdEnvVar is the environment variable in which one can manually set the ClusterId
const ClusterIdEnvVar = "AWS_CLUSTER_ID"

// OnDemandRateCode is appended to a node sku
const OnDemandRateCode = ".JRTCKXETXF"

// OnDemandRateCodeCn is the "Cn" counterpart of OnDemandRateCode
// (NOTE(review): presumably for the China regions priced in CNY — confirm at the use site).
const OnDemandRateCodeCn = ".99YE2YK9UR"

// ReservedRateCode is appended to a node sku
const ReservedRateCode = ".38NPMPTW36"

// HourlyRateCode is appended to a node sku
const HourlyRateCode = ".6YS6EN2CT7"

// HourlyRateCodeCn is the "Cn" counterpart of HourlyRateCode
// (NOTE(review): presumably for the China regions priced in CNY — confirm at the use site).
const HourlyRateCodeCn = ".Q7UJUT2CE6"
// volTypes are used to map between AWS UsageTypes and
// EBS volume types, as they would appear in K8s storage class
// name and the EC2 API.
//
// The map is bidirectional: the first group goes from usage type to volume
// type, the second from volume type back to usage type. Two usage types map
// to "io1", while "io1" maps back to "EBS:VolumeUsage.piops" only.
var volTypes = map[string]string{
	// UsageType -> EBS volume type
	"EBS:VolumeUsage.gp2":    "gp2",
	"EBS:VolumeUsage.gp3":    "gp3",
	"EBS:VolumeUsage":        "standard",
	"EBS:VolumeUsage.sc1":    "sc1",
	"EBS:VolumeP-IOPS.piops": "io1",
	"EBS:VolumeUsage.st1":    "st1",
	"EBS:VolumeUsage.piops":  "io1",
	// EBS volume type -> UsageType
	"gp2":      "EBS:VolumeUsage.gp2",
	"gp3":      "EBS:VolumeUsage.gp3",
	"standard": "EBS:VolumeUsage",
	"sc1":      "EBS:VolumeUsage.sc1",
	"io1":      "EBS:VolumeUsage.piops",
	"st1":      "EBS:VolumeUsage.st1",
}
  292. // locationToRegion maps AWS region names (As they come from Billing)
  293. // to actual region identifiers
  294. var locationToRegion = map[string]string{
  295. "US East (Ohio)": "us-east-2",
  296. "US East (N. Virginia)": "us-east-1",
  297. "US West (N. California)": "us-west-1",
  298. "US West (Oregon)": "us-west-2",
  299. "Asia Pacific (Hong Kong)": "ap-east-1",
  300. "Asia Pacific (Mumbai)": "ap-south-1",
  301. "Asia Pacific (Osaka)": "ap-northeast-3",
  302. "Asia Pacific (Seoul)": "ap-northeast-2",
  303. "Asia Pacific (Singapore)": "ap-southeast-1",
  304. "Asia Pacific (Sydney)": "ap-southeast-2",
  305. "Asia Pacific (Tokyo)": "ap-northeast-1",
  306. "Asia Pacific (Jakarta)": "ap-southeast-3",
  307. "Canada (Central)": "ca-central-1",
  308. "China (Beijing)": "cn-north-1",
  309. "China (Ningxia)": "cn-northwest-1",
  310. "EU (Frankfurt)": "eu-central-1",
  311. "EU (Ireland)": "eu-west-1",
  312. "EU (London)": "eu-west-2",
  313. "EU (Paris)": "eu-west-3",
  314. "EU (Stockholm)": "eu-north-1",
  315. "EU (Milan)": "eu-south-1",
  316. "South America (Sao Paulo)": "sa-east-1",
  317. "Africa (Cape Town)": "af-south-1",
  318. "AWS GovCloud (US-East)": "us-gov-east-1",
  319. "AWS GovCloud (US-West)": "us-gov-west-1",
  320. }
  321. var regionToBillingRegionCode = map[string]string{
  322. "us-east-2": "USE2",
  323. "us-east-1": "",
  324. "us-west-1": "USW1",
  325. "us-west-2": "USW2",
  326. "ap-east-1": "APE1",
  327. "ap-south-1": "APS3",
  328. "ap-northeast-3": "APN3",
  329. "ap-northeast-2": "APN2",
  330. "ap-southeast-1": "APS1",
  331. "ap-southeast-2": "APS2",
  332. "ap-northeast-1": "APN1",
  333. "ap-southeast-3": "APS4",
  334. "ca-central-1": "CAN1",
  335. "cn-north-1": "",
  336. "cn-northwest-1": "",
  337. "eu-central-1": "EUC1",
  338. "eu-west-1": "EU",
  339. "eu-west-2": "EUW2",
  340. "eu-west-3": "EUW3",
  341. "eu-north-1": "EUN1",
  342. "eu-south-1": "EUS1",
  343. "sa-east-1": "SAE1",
  344. "af-south-1": "AFS1",
  345. "us-gov-east-1": "UGE1",
  346. "us-gov-west-1": "UGW1",
  347. }
// loadedAWSSecret and awsSecret are package-level state for an AWS access key.
// NOTE(review): presumably a load-once cache (flag plus cached value) — the
// code that reads and writes them is not visible here; confirm.
var loadedAWSSecret bool = false
var awsSecret *AWSAccessKey = nil
// GetLocalStorageQuery always returns an empty string for AWS; all arguments
// are ignored.
func (aws *AWS) GetLocalStorageQuery(window, offset time.Duration, rate bool, used bool) string {
	return ""
}
  353. // KubeAttrConversion maps the k8s labels for region to an aws region
  354. func (aws *AWS) KubeAttrConversion(location, instanceType, operatingSystem string) string {
  355. operatingSystem = strings.ToLower(operatingSystem)
  356. region := locationToRegion[location]
  357. return region + "," + instanceType + "," + operatingSystem
  358. }
// AwsSpotFeedInfo contains configuration for spot feed integration
// UpdateConfig decodes it from JSON when updateType is SpotInfoUpdateType.
type AwsSpotFeedInfo struct {
	BucketName string `json:"bucketName"`
	Prefix     string `json:"prefix"`
	Region     string `json:"region"`
	// AccountID is carried in the "projectID" JSON member.
	AccountID      string `json:"projectID"`
	ServiceKeyName string `json:"serviceKeyName"`
	// ServiceKeySecret is only applied by UpdateConfig when non-empty.
	ServiceKeySecret string `json:"serviceKeySecret"`
	SpotLabel        string `json:"spotLabel"`
	SpotLabelValue   string `json:"spotLabelValue"`
}
  370. // AwsAthenaInfo contains configuration for CUR integration
  371. type AwsAthenaInfo struct {
  372. AthenaBucketName string `json:"athenaBucketName"`
  373. AthenaRegion string `json:"athenaRegion"`
  374. AthenaDatabase string `json:"athenaDatabase"`
  375. AthenaTable string `json:"athenaTable"`
  376. AthenaWorkgroup string `json:"athenaWorkgroup"`
  377. ServiceKeyName string `json:"serviceKeyName"`
  378. ServiceKeySecret string `json:"serviceKeySecret"`
  379. AccountID string `json:"projectID"`
  380. MasterPayerARN string `json:"masterPayerARN"`
  381. }
  382. // IsEmpty returns true if all fields in config are empty, false if not.
  383. func (aai *AwsAthenaInfo) IsEmpty() bool {
  384. return aai.AthenaBucketName == "" &&
  385. aai.AthenaRegion == "" &&
  386. aai.AthenaDatabase == "" &&
  387. aai.AthenaTable == "" &&
  388. aai.AthenaWorkgroup == "" &&
  389. aai.ServiceKeyName == "" &&
  390. aai.ServiceKeySecret == "" &&
  391. aai.AccountID == "" &&
  392. aai.MasterPayerARN == ""
  393. }
  394. // CreateConfig creates an AWS SDK V2 Config for the credentials that it contains
  395. func (aai *AwsAthenaInfo) CreateConfig() (awsSDK.Config, error) {
  396. keyProvider := AWSAccessKey{AccessKeyID: aai.ServiceKeyName, SecretAccessKey: aai.ServiceKeySecret}
  397. cfg, err := keyProvider.CreateConfig(aai.AthenaRegion)
  398. if err != nil {
  399. return cfg, err
  400. }
  401. if aai.MasterPayerARN != "" {
  402. // Create the credentials from AssumeRoleProvider to assume the role
  403. // referenced by the roleARN.
  404. stsSvc := sts.NewFromConfig(cfg)
  405. creds := stscreds.NewAssumeRoleProvider(stsSvc, aai.MasterPayerARN)
  406. cfg.Credentials = awsSDK.NewCredentialsCache(creds)
  407. }
  408. return cfg, nil
  409. }
  410. func (aws *AWS) GetManagementPlatform() (string, error) {
  411. nodes := aws.Clientset.GetAllNodes()
  412. if len(nodes) > 0 {
  413. n := nodes[0]
  414. version := n.Status.NodeInfo.KubeletVersion
  415. if strings.Contains(version, "eks") {
  416. return "eks", nil
  417. }
  418. if _, ok := n.Labels["kops.k8s.io/instancegroup"]; ok {
  419. return "kops", nil
  420. }
  421. }
  422. return "", nil
  423. }
  424. func (aws *AWS) GetConfig() (*CustomPricing, error) {
  425. c, err := aws.Config.GetCustomPricingData()
  426. if err != nil {
  427. return nil, err
  428. }
  429. if c.Discount == "" {
  430. c.Discount = "0%"
  431. }
  432. if c.NegotiatedDiscount == "" {
  433. c.NegotiatedDiscount = "0%"
  434. }
  435. if c.ShareTenancyCosts == "" {
  436. c.ShareTenancyCosts = defaultShareTenancyCost
  437. }
  438. return c, nil
  439. }
  440. // GetAWSAccessKey generate an AWSAccessKey object from the config
  441. func (aws *AWS) GetAWSAccessKey() (*AWSAccessKey, error) {
  442. config, err := aws.GetConfig()
  443. if err != nil {
  444. return nil, fmt.Errorf("could not retrieve AwsAthenaInfo %s", err)
  445. }
  446. err = aws.ConfigureAuthWith(config)
  447. if err != nil {
  448. return nil, fmt.Errorf("error configuring Cloud Provider %s", err)
  449. }
  450. //Look for service key values in env if not present in config
  451. if config.ServiceKeyName == "" {
  452. config.ServiceKeyName = env.GetAWSAccessKeyID()
  453. }
  454. if config.ServiceKeySecret == "" {
  455. config.ServiceKeySecret = env.GetAWSAccessKeySecret()
  456. }
  457. if config.ServiceKeyName == "" && config.ServiceKeySecret == "" {
  458. log.DedupedInfof(1, "missing service key values for AWS cloud integration attempting to use service account integration")
  459. }
  460. return &AWSAccessKey{AccessKeyID: config.ServiceKeyName, SecretAccessKey: config.ServiceKeySecret}, nil
  461. }
  462. // GetAWSAthenaInfo generate an AWSAthenaInfo object from the config
  463. func (aws *AWS) GetAWSAthenaInfo() (*AwsAthenaInfo, error) {
  464. config, err := aws.GetConfig()
  465. if err != nil {
  466. return nil, fmt.Errorf("could not retrieve AwsAthenaInfo %s", err)
  467. }
  468. aak, err := aws.GetAWSAccessKey()
  469. if err != nil {
  470. return nil, err
  471. }
  472. return &AwsAthenaInfo{
  473. AthenaBucketName: config.AthenaBucketName,
  474. AthenaRegion: config.AthenaRegion,
  475. AthenaDatabase: config.AthenaDatabase,
  476. AthenaTable: config.AthenaTable,
  477. AthenaWorkgroup: config.AthenaWorkgroup,
  478. ServiceKeyName: aak.AccessKeyID,
  479. ServiceKeySecret: aak.SecretAccessKey,
  480. AccountID: config.AthenaProjectID,
  481. MasterPayerARN: config.MasterPayerARN,
  482. }, nil
  483. }
// UpdateConfigFromConfigMap applies the key/value pairs in cm to the provider
// config by delegating to Config.UpdateFromMap, and returns its result.
func (aws *AWS) UpdateConfigFromConfigMap(cm map[string]string) (*CustomPricing, error) {
	return aws.Config.UpdateFromMap(cm)
}
  487. func (aws *AWS) UpdateConfig(r io.Reader, updateType string) (*CustomPricing, error) {
  488. return aws.Config.Update(func(c *CustomPricing) error {
  489. if updateType == SpotInfoUpdateType {
  490. asfi := AwsSpotFeedInfo{}
  491. err := json.NewDecoder(r).Decode(&asfi)
  492. if err != nil {
  493. return err
  494. }
  495. c.ServiceKeyName = asfi.ServiceKeyName
  496. if asfi.ServiceKeySecret != "" {
  497. c.ServiceKeySecret = asfi.ServiceKeySecret
  498. }
  499. c.SpotDataPrefix = asfi.Prefix
  500. c.SpotDataBucket = asfi.BucketName
  501. c.ProjectID = asfi.AccountID
  502. c.SpotDataRegion = asfi.Region
  503. c.SpotLabel = asfi.SpotLabel
  504. c.SpotLabelValue = asfi.SpotLabelValue
  505. } else if updateType == AthenaInfoUpdateType {
  506. aai := AwsAthenaInfo{}
  507. err := json.NewDecoder(r).Decode(&aai)
  508. if err != nil {
  509. return err
  510. }
  511. c.AthenaBucketName = aai.AthenaBucketName
  512. c.AthenaRegion = aai.AthenaRegion
  513. c.AthenaDatabase = aai.AthenaDatabase
  514. c.AthenaTable = aai.AthenaTable
  515. c.AthenaWorkgroup = aai.AthenaWorkgroup
  516. c.ServiceKeyName = aai.ServiceKeyName
  517. if aai.ServiceKeySecret != "" {
  518. c.ServiceKeySecret = aai.ServiceKeySecret
  519. }
  520. if aai.MasterPayerARN != "" {
  521. c.MasterPayerARN = aai.MasterPayerARN
  522. }
  523. c.AthenaProjectID = aai.AccountID
  524. } else {
  525. a := make(map[string]interface{})
  526. err := json.NewDecoder(r).Decode(&a)
  527. if err != nil {
  528. return err
  529. }
  530. for k, v := range a {
  531. kUpper := strings.Title(k) // Just so we consistently supply / receive the same values, uppercase the first letter.
  532. vstr, ok := v.(string)
  533. if ok {
  534. err := SetCustomPricingField(c, kUpper, vstr)
  535. if err != nil {
  536. return err
  537. }
  538. } else {
  539. return fmt.Errorf("type error while updating config for %s", kUpper)
  540. }
  541. }
  542. }
  543. if env.IsRemoteEnabled() {
  544. err := UpdateClusterMeta(env.GetClusterID(), c.ClusterName)
  545. if err != nil {
  546. return err
  547. }
  548. }
  549. return nil
  550. })
  551. }
// awsKey carries the node information needed to build a pricing lookup key.
// It is created by AWS.GetKey.
type awsKey struct {
	// SpotLabelName and SpotLabelValue name the label/value pair that marks a
	// node as spot (checked in Features).
	SpotLabelName  string
	SpotLabelValue string
	// Labels are the node labels the key is derived from.
	Labels map[string]string
	// ProviderID is parsed by ID to extract the instance ID.
	ProviderID string
}
// GPUCount always returns 0 for an awsKey.
func (k *awsKey) GPUCount() int {
	return 0
}
// GPUType always returns the empty string for an awsKey.
func (k *awsKey) GPUType() string {
	return ""
}
  564. func (k *awsKey) ID() string {
  565. for matchNum, group := range provIdRx.FindStringSubmatch(k.ProviderID) {
  566. if matchNum == 2 {
  567. return group
  568. }
  569. }
  570. log.Warnf("Could not find instance ID in \"%s\"", k.ProviderID)
  571. return ""
  572. }
  573. // Features will return a comma seperated list of features for the given node
  574. // If the node has a spot label, it will be included in the list
  575. // Otherwise, the list include instance type, operating system, and the region
  576. func (k *awsKey) Features() string {
  577. instanceType, _ := util.GetInstanceType(k.Labels)
  578. operatingSystem, _ := util.GetOperatingSystem(k.Labels)
  579. region, _ := util.GetRegion(k.Labels)
  580. key := region + "," + instanceType + "," + operatingSystem
  581. usageType := k.getUsageType(k.Labels)
  582. spotKey := key + "," + usageType
  583. if l, ok := k.Labels["lifecycle"]; ok && l == "EC2Spot" {
  584. return spotKey
  585. }
  586. if l, ok := k.Labels[k.SpotLabelName]; ok && l == k.SpotLabelValue {
  587. return spotKey
  588. }
  589. if usageType == PreemptibleType {
  590. return spotKey
  591. }
  592. return key
  593. }
  594. // getUsageType returns the usage type of the instance
  595. // If the instance is a spot instance, it will return PreemptibleType
  596. // Otherwise returns an empty string
  597. func (k *awsKey) getUsageType(labels map[string]string) string {
  598. if label, ok := labels[EKSCapacityTypeLabel]; ok && label == EKSCapacitySpotTypeValue {
  599. // We currently write out spot instances as "preemptible" in the pricing data, so these need to match
  600. return PreemptibleType
  601. }
  602. return ""
  603. }
  604. func (aws *AWS) PVPricing(pvk PVKey) (*PV, error) {
  605. pricing, ok := aws.Pricing[pvk.Features()]
  606. if !ok {
  607. log.Debugf("Persistent Volume pricing not found for %s: %s", pvk.GetStorageClass(), pvk.Features())
  608. return &PV{}, nil
  609. }
  610. return pricing.PV, nil
  611. }
// awsPVKey carries the persistent volume information needed to build a
// pricing lookup key. It is created by AWS.GetPVKey.
type awsPVKey struct {
	// Labels are the labels of the persistent volume.
	Labels map[string]string
	// StorageClassParameters are the storage class parameters; Features reads
	// the "type" entry.
	StorageClassParameters map[string]string
	StorageClassName       string
	// Name is the persistent volume name (used in log messages).
	Name string
	// DefaultRegion is used when no region can be derived from Labels.
	DefaultRegion string
	// ProviderID is the EBS volume ID or CSI volume handle.
	ProviderID string
}
  620. func (aws *AWS) GetPVKey(pv *v1.PersistentVolume, parameters map[string]string, defaultRegion string) PVKey {
  621. providerID := ""
  622. if pv.Spec.AWSElasticBlockStore != nil {
  623. providerID = pv.Spec.AWSElasticBlockStore.VolumeID
  624. } else if pv.Spec.CSI != nil {
  625. providerID = pv.Spec.CSI.VolumeHandle
  626. }
  627. return &awsPVKey{
  628. Labels: pv.Labels,
  629. StorageClassName: pv.Spec.StorageClassName,
  630. StorageClassParameters: parameters,
  631. Name: pv.Name,
  632. DefaultRegion: defaultRegion,
  633. ProviderID: providerID,
  634. }
  635. }
  636. func (key *awsPVKey) ID() string {
  637. return key.ProviderID
  638. }
  639. func (key *awsPVKey) GetStorageClass() string {
  640. return key.StorageClassName
  641. }
  642. func (key *awsPVKey) Features() string {
  643. storageClass := key.StorageClassParameters["type"]
  644. if storageClass == "standard" {
  645. storageClass = "gp2"
  646. }
  647. // Storage class names are generally EBS volume types (gp2)
  648. // Keys in Pricing are based on UsageTypes (EBS:VolumeType.gp2)
  649. // Converts between the 2
  650. region, ok := util.GetRegion(key.Labels)
  651. if !ok {
  652. region = key.DefaultRegion
  653. }
  654. class, ok := volTypes[storageClass]
  655. if !ok {
  656. log.Debugf("No voltype mapping for %s's storageClass: %s", key.Name, storageClass)
  657. }
  658. return region + "," + class
  659. }
  660. // GetKey maps node labels to information needed to retrieve pricing data
  661. func (aws *AWS) GetKey(labels map[string]string, n *v1.Node) Key {
  662. return &awsKey{
  663. SpotLabelName: aws.SpotLabelName,
  664. SpotLabelValue: aws.SpotLabelValue,
  665. Labels: labels,
  666. ProviderID: labels["providerID"],
  667. }
  668. }
  669. func (aws *AWS) isPreemptible(key string) bool {
  670. s := strings.Split(key, ",")
  671. if len(s) == 4 && s[3] == PreemptibleType {
  672. return true
  673. }
  674. return false
  675. }
  676. func (aws *AWS) ClusterManagementPricing() (string, float64, error) {
  677. return aws.clusterProvisioner, aws.clusterManagementPrice, nil
  678. }
  679. // Use the pricing data from the current region. Fall back to using all region data if needed.
  680. func (aws *AWS) getRegionPricing(nodeList []*v1.Node) (*http.Response, string, error) {
  681. pricingURL := "https://pricing.us-east-1.amazonaws.com/offers/v1.0/aws/AmazonEC2/current/"
  682. region := ""
  683. multiregion := false
  684. for _, n := range nodeList {
  685. labels := n.GetLabels()
  686. currentNodeRegion := ""
  687. if r, ok := util.GetRegion(labels); ok {
  688. currentNodeRegion = r
  689. // Switch to Chinese endpoint for regions with the Chinese prefix
  690. if strings.HasPrefix(currentNodeRegion, "cn-") {
  691. pricingURL = "https://pricing.cn-north-1.amazonaws.com.cn/offers/v1.0/cn/AmazonEC2/current/"
  692. }
  693. } else {
  694. multiregion = true // We weren't able to detect the node's region, so pull all data.
  695. break
  696. }
  697. if region == "" { // We haven't set a region yet
  698. region = currentNodeRegion
  699. } else if region != "" && currentNodeRegion != region { // If two nodes have different regions here, we'll need to fetch all pricing data.
  700. multiregion = true
  701. break
  702. }
  703. }
  704. // Chinese multiregion endpoint only contains data for Chinese regions and Chinese regions are excluded from other endpoint
  705. if region != "" && !multiregion {
  706. pricingURL += region + "/"
  707. }
  708. pricingURL += "index.json"
  709. if env.GetAWSPricingURL() != "" { // Allow override of pricing URL
  710. pricingURL = env.GetAWSPricingURL()
  711. }
  712. log.Infof("starting download of \"%s\", which is quite large ...", pricingURL)
  713. resp, err := http.Get(pricingURL)
  714. if err != nil {
  715. log.Errorf("Bogus fetch of \"%s\": %v", pricingURL, err)
  716. return nil, pricingURL, err
  717. }
  718. return resp, pricingURL, err
  719. }
  720. // SpotRefreshEnabled determines whether the required configs to run the spot feed query have been set up
  721. func (aws *AWS) SpotRefreshEnabled() bool {
  722. // Need a valid value for at least one of these fields to consider spot pricing as enabled
  723. return len(aws.SpotDataBucket) != 0 || len(aws.SpotDataRegion) != 0 || len(aws.ProjectID) != 0
  724. }
  725. // DownloadPricingData fetches data from the AWS Pricing API
  726. func (aws *AWS) DownloadPricingData() error {
  727. aws.DownloadPricingDataLock.Lock()
  728. defer aws.DownloadPricingDataLock.Unlock()
  729. c, err := aws.Config.GetCustomPricingData()
  730. if err != nil {
  731. log.Errorf("Error downloading default pricing data: %s", err.Error())
  732. }
  733. aws.BaseCPUPrice = c.CPU
  734. aws.BaseRAMPrice = c.RAM
  735. aws.BaseGPUPrice = c.GPU
  736. aws.BaseSpotCPUPrice = c.SpotCPU
  737. aws.BaseSpotRAMPrice = c.SpotRAM
  738. aws.BaseSpotGPUPrice = c.SpotGPU
  739. aws.SpotLabelName = c.SpotLabel
  740. aws.SpotLabelValue = c.SpotLabelValue
  741. aws.SpotDataBucket = c.SpotDataBucket
  742. aws.SpotDataPrefix = c.SpotDataPrefix
  743. aws.ProjectID = c.ProjectID
  744. aws.SpotDataRegion = c.SpotDataRegion
  745. aws.ConfigureAuthWith(c) // load aws authentication from configuration or secret
  746. if len(aws.SpotDataBucket) != 0 && len(aws.ProjectID) == 0 {
  747. log.Warnf("using SpotDataBucket \"%s\" without ProjectID will not end well", aws.SpotDataBucket)
  748. }
  749. nodeList := aws.Clientset.GetAllNodes()
  750. inputkeys := make(map[string]bool)
  751. for _, n := range nodeList {
  752. if _, ok := n.Labels["eks.amazonaws.com/nodegroup"]; ok {
  753. aws.clusterManagementPrice = 0.10
  754. aws.clusterProvisioner = "EKS"
  755. } else if _, ok := n.Labels["kops.k8s.io/instancegroup"]; ok {
  756. aws.clusterProvisioner = "KOPS"
  757. }
  758. labels := n.GetObjectMeta().GetLabels()
  759. key := aws.GetKey(labels, n)
  760. inputkeys[key.Features()] = true
  761. }
  762. pvList := aws.Clientset.GetAllPersistentVolumes()
  763. storageClasses := aws.Clientset.GetAllStorageClasses()
  764. storageClassMap := make(map[string]map[string]string)
  765. for _, storageClass := range storageClasses {
  766. params := storageClass.Parameters
  767. storageClassMap[storageClass.ObjectMeta.Name] = params
  768. if storageClass.GetAnnotations()["storageclass.kubernetes.io/is-default-class"] == "true" || storageClass.GetAnnotations()["storageclass.beta.kubernetes.io/is-default-class"] == "true" {
  769. storageClassMap["default"] = params
  770. storageClassMap[""] = params
  771. }
  772. }
  773. pvkeys := make(map[string]PVKey)
  774. for _, pv := range pvList {
  775. params, ok := storageClassMap[pv.Spec.StorageClassName]
  776. if !ok {
  777. log.Infof("Unable to find params for storageClassName %s, falling back to default pricing", pv.Spec.StorageClassName)
  778. continue
  779. }
  780. key := aws.GetPVKey(pv, params, "")
  781. pvkeys[key.Features()] = key
  782. }
  783. // RIDataRunning establishes the existence of the goroutine. Since it's possible we
  784. // run multiple downloads, we don't want to create multiple go routines if one already exists
  785. if !aws.RIDataRunning {
  786. err = aws.GetReservationDataFromAthena() // Block until one run has completed.
  787. if err != nil {
  788. log.Errorf("Failed to lookup reserved instance data: %s", err.Error())
  789. } else { // If we make one successful run, check on new reservation data every hour
  790. go func() {
  791. defer errs.HandlePanic()
  792. aws.RIDataRunning = true
  793. for {
  794. log.Infof("Reserved Instance watcher running... next update in 1h")
  795. time.Sleep(time.Hour)
  796. err := aws.GetReservationDataFromAthena()
  797. if err != nil {
  798. log.Infof("Error updating RI data: %s", err.Error())
  799. }
  800. }
  801. }()
  802. }
  803. }
  804. if !aws.SavingsPlanDataRunning {
  805. err = aws.GetSavingsPlanDataFromAthena()
  806. if err != nil {
  807. log.Errorf("Failed to lookup savings plan data: %s", err.Error())
  808. } else {
  809. go func() {
  810. defer errs.HandlePanic()
  811. aws.SavingsPlanDataRunning = true
  812. for {
  813. log.Infof("Savings Plan watcher running... next update in 1h")
  814. time.Sleep(time.Hour)
  815. err := aws.GetSavingsPlanDataFromAthena()
  816. if err != nil {
  817. log.Infof("Error updating Savings Plan data: %s", err.Error())
  818. }
  819. }
  820. }()
  821. }
  822. }
  823. aws.Pricing = make(map[string]*AWSProductTerms)
  824. aws.ValidPricingKeys = make(map[string]bool)
  825. skusToKeys := make(map[string]string)
  826. resp, pricingURL, err := aws.getRegionPricing(nodeList)
  827. if err != nil {
  828. return err
  829. }
  830. dec := json.NewDecoder(resp.Body)
  831. for {
  832. t, err := dec.Token()
  833. if err == io.EOF {
  834. log.Infof("done loading \"%s\"\n", pricingURL)
  835. break
  836. } else if err != nil {
  837. log.Errorf("error parsing response json %v", resp.Body)
  838. break
  839. }
  840. if t == "products" {
  841. _, err := dec.Token() // this should parse the opening "{""
  842. if err != nil {
  843. return err
  844. }
  845. for dec.More() {
  846. _, err := dec.Token() // the sku token
  847. if err != nil {
  848. return err
  849. }
  850. product := &AWSProduct{}
  851. err = dec.Decode(&product)
  852. if err != nil {
  853. log.Errorf("Error parsing response from \"%s\": %v", pricingURL, err.Error())
  854. break
  855. }
  856. if product.Attributes.PreInstalledSw == "NA" &&
  857. (strings.HasPrefix(product.Attributes.UsageType, "BoxUsage") || strings.Contains(product.Attributes.UsageType, "-BoxUsage")) &&
  858. product.Attributes.CapacityStatus == "Used" {
  859. key := aws.KubeAttrConversion(product.Attributes.Location, product.Attributes.InstanceType, product.Attributes.OperatingSystem)
  860. spotKey := key + ",preemptible"
  861. if inputkeys[key] || inputkeys[spotKey] { // Just grab the sku even if spot, and change the price later.
  862. productTerms := &AWSProductTerms{
  863. Sku: product.Sku,
  864. Memory: product.Attributes.Memory,
  865. Storage: product.Attributes.Storage,
  866. VCpu: product.Attributes.VCpu,
  867. GPU: product.Attributes.GPU,
  868. }
  869. aws.Pricing[key] = productTerms
  870. aws.Pricing[spotKey] = productTerms
  871. skusToKeys[product.Sku] = key
  872. }
  873. aws.ValidPricingKeys[key] = true
  874. aws.ValidPricingKeys[spotKey] = true
  875. } else if strings.Contains(product.Attributes.UsageType, "EBS:Volume") {
  876. // UsageTypes may be prefixed with a region code - we're removing this when using
  877. // volTypes to keep lookups generic
  878. usageTypeMatch := usageTypeRegx.FindStringSubmatch(product.Attributes.UsageType)
  879. usageTypeNoRegion := usageTypeMatch[len(usageTypeMatch)-1]
  880. key := locationToRegion[product.Attributes.Location] + "," + usageTypeNoRegion
  881. spotKey := key + ",preemptible"
  882. pv := &PV{
  883. Class: volTypes[usageTypeNoRegion],
  884. Region: locationToRegion[product.Attributes.Location],
  885. }
  886. productTerms := &AWSProductTerms{
  887. Sku: product.Sku,
  888. PV: pv,
  889. }
  890. aws.Pricing[key] = productTerms
  891. aws.Pricing[spotKey] = productTerms
  892. skusToKeys[product.Sku] = key
  893. aws.ValidPricingKeys[key] = true
  894. aws.ValidPricingKeys[spotKey] = true
  895. }
  896. }
  897. }
  898. if t == "terms" {
  899. _, err := dec.Token() // this should parse the opening "{""
  900. if err != nil {
  901. return err
  902. }
  903. termType, err := dec.Token()
  904. if err != nil {
  905. return err
  906. }
  907. if termType == "OnDemand" {
  908. _, err := dec.Token()
  909. if err != nil { // again, should parse an opening "{"
  910. return err
  911. }
  912. for dec.More() {
  913. sku, err := dec.Token()
  914. if err != nil {
  915. return err
  916. }
  917. _, err = dec.Token() // another opening "{"
  918. if err != nil {
  919. return err
  920. }
  921. skuOnDemand, err := dec.Token()
  922. if err != nil {
  923. return err
  924. }
  925. offerTerm := &AWSOfferTerm{}
  926. err = dec.Decode(&offerTerm)
  927. if err != nil {
  928. log.Errorf("Error decoding AWS Offer Term: " + err.Error())
  929. }
  930. key, ok := skusToKeys[sku.(string)]
  931. spotKey := key + ",preemptible"
  932. if ok {
  933. aws.Pricing[key].OnDemand = offerTerm
  934. aws.Pricing[spotKey].OnDemand = offerTerm
  935. var cost string
  936. if sku.(string)+OnDemandRateCode == skuOnDemand {
  937. cost = offerTerm.PriceDimensions[sku.(string)+OnDemandRateCode+HourlyRateCode].PricePerUnit.USD
  938. } else if sku.(string)+OnDemandRateCodeCn == skuOnDemand {
  939. cost = offerTerm.PriceDimensions[sku.(string)+OnDemandRateCodeCn+HourlyRateCodeCn].PricePerUnit.CNY
  940. }
  941. if strings.Contains(key, "EBS:VolumeP-IOPS.piops") {
  942. // If the specific UsageType is the per IO cost used on io1 volumes
  943. // we need to add the per IO cost to the io1 PV cost
  944. // Add the per IO cost to the PV object for the io1 volume type
  945. aws.Pricing[key].PV.CostPerIO = cost
  946. } else if strings.Contains(key, "EBS:Volume") {
  947. // If volume, we need to get hourly cost and add it to the PV object
  948. costFloat, _ := strconv.ParseFloat(cost, 64)
  949. hourlyPrice := costFloat / 730
  950. aws.Pricing[key].PV.Cost = strconv.FormatFloat(hourlyPrice, 'f', -1, 64)
  951. }
  952. }
  953. _, err = dec.Token()
  954. if err != nil {
  955. return err
  956. }
  957. }
  958. _, err = dec.Token()
  959. if err != nil {
  960. return err
  961. }
  962. }
  963. }
  964. }
  965. log.Infof("Finished downloading \"%s\"", pricingURL)
  966. if !aws.SpotRefreshEnabled() {
  967. return nil
  968. }
  969. // Always run spot pricing refresh when performing download
  970. aws.refreshSpotPricing(true)
  971. // Only start a single refresh goroutine
  972. if !aws.SpotRefreshRunning {
  973. aws.SpotRefreshRunning = true
  974. go func() {
  975. defer errs.HandlePanic()
  976. for {
  977. log.Infof("Spot Pricing Refresh scheduled in %.2f minutes.", SpotRefreshDuration.Minutes())
  978. time.Sleep(SpotRefreshDuration)
  979. // Reoccurring refresh checks update times
  980. aws.refreshSpotPricing(false)
  981. }
  982. }()
  983. }
  984. return nil
  985. }
  986. func (aws *AWS) refreshSpotPricing(force bool) {
  987. aws.SpotPricingLock.Lock()
  988. defer aws.SpotPricingLock.Unlock()
  989. now := time.Now().UTC()
  990. updateTime := now.Add(-SpotRefreshDuration)
  991. // Return if there was an update time set and an hour hasn't elapsed
  992. if !force && aws.SpotPricingUpdatedAt != nil && aws.SpotPricingUpdatedAt.After(updateTime) {
  993. return
  994. }
  995. sp, err := aws.parseSpotData(aws.SpotDataBucket, aws.SpotDataPrefix, aws.ProjectID, aws.SpotDataRegion)
  996. if err != nil {
  997. log.Warnf("Skipping AWS spot data download: %s", err.Error())
  998. aws.SpotPricingError = err
  999. return
  1000. }
  1001. aws.SpotPricingError = nil
  1002. // update time last updated
  1003. aws.SpotPricingUpdatedAt = &now
  1004. aws.SpotPricingByInstanceID = sp
  1005. }
  1006. // Stubbed NetworkPricing for AWS. Pull directly from aws.json for now
  1007. func (aws *AWS) NetworkPricing() (*Network, error) {
  1008. cpricing, err := aws.Config.GetCustomPricingData()
  1009. if err != nil {
  1010. return nil, err
  1011. }
  1012. znec, err := strconv.ParseFloat(cpricing.ZoneNetworkEgress, 64)
  1013. if err != nil {
  1014. return nil, err
  1015. }
  1016. rnec, err := strconv.ParseFloat(cpricing.RegionNetworkEgress, 64)
  1017. if err != nil {
  1018. return nil, err
  1019. }
  1020. inec, err := strconv.ParseFloat(cpricing.InternetNetworkEgress, 64)
  1021. if err != nil {
  1022. return nil, err
  1023. }
  1024. return &Network{
  1025. ZoneNetworkEgressCost: znec,
  1026. RegionNetworkEgressCost: rnec,
  1027. InternetNetworkEgressCost: inec,
  1028. }, nil
  1029. }
  1030. func (aws *AWS) LoadBalancerPricing() (*LoadBalancer, error) {
  1031. fffrc := 0.025
  1032. afrc := 0.010
  1033. lbidc := 0.008
  1034. numForwardingRules := 1.0
  1035. dataIngressGB := 0.0
  1036. var totalCost float64
  1037. if numForwardingRules < 5 {
  1038. totalCost = fffrc*numForwardingRules + lbidc*dataIngressGB
  1039. } else {
  1040. totalCost = fffrc*5 + afrc*(numForwardingRules-5) + lbidc*dataIngressGB
  1041. }
  1042. return &LoadBalancer{
  1043. Cost: totalCost,
  1044. }, nil
  1045. }
  1046. // AllNodePricing returns all the billing data fetched.
  1047. func (aws *AWS) AllNodePricing() (interface{}, error) {
  1048. aws.DownloadPricingDataLock.RLock()
  1049. defer aws.DownloadPricingDataLock.RUnlock()
  1050. return aws.Pricing, nil
  1051. }
  1052. func (aws *AWS) spotPricing(instanceID string) (*spotInfo, bool) {
  1053. aws.SpotPricingLock.RLock()
  1054. defer aws.SpotPricingLock.RUnlock()
  1055. info, ok := aws.SpotPricingByInstanceID[instanceID]
  1056. return info, ok
  1057. }
  1058. func (aws *AWS) reservedInstancePricing(instanceID string) (*RIData, bool) {
  1059. aws.RIDataLock.RLock()
  1060. defer aws.RIDataLock.RUnlock()
  1061. data, ok := aws.RIPricingByInstanceID[instanceID]
  1062. return data, ok
  1063. }
  1064. func (aws *AWS) savingsPlanPricing(instanceID string) (*SavingsPlanData, bool) {
  1065. aws.SavingsPlanDataLock.RLock()
  1066. defer aws.SavingsPlanDataLock.RUnlock()
  1067. data, ok := aws.SavingsPlanDataByInstanceID[instanceID]
  1068. return data, ok
  1069. }
  1070. func (aws *AWS) createNode(terms *AWSProductTerms, usageType string, k Key) (*Node, error) {
  1071. key := k.Features()
  1072. if spotInfo, ok := aws.spotPricing(k.ID()); ok {
  1073. var spotcost string
  1074. log.DedupedInfof(5, "Looking up spot data from feed for node %s", k.ID())
  1075. arr := strings.Split(spotInfo.Charge, " ")
  1076. if len(arr) == 2 {
  1077. spotcost = arr[0]
  1078. } else {
  1079. log.Infof("Spot data for node %s is missing", k.ID())
  1080. }
  1081. return &Node{
  1082. Cost: spotcost,
  1083. VCPU: terms.VCpu,
  1084. RAM: terms.Memory,
  1085. GPU: terms.GPU,
  1086. Storage: terms.Storage,
  1087. BaseCPUPrice: aws.BaseCPUPrice,
  1088. BaseRAMPrice: aws.BaseRAMPrice,
  1089. BaseGPUPrice: aws.BaseGPUPrice,
  1090. UsageType: PreemptibleType,
  1091. }, nil
  1092. } else if aws.isPreemptible(key) { // Preemptible but we don't have any data in the pricing report.
  1093. log.DedupedWarningf(5, "Node %s marked preemptible but we have no data in spot feed", k.ID())
  1094. return &Node{
  1095. VCPU: terms.VCpu,
  1096. VCPUCost: aws.BaseSpotCPUPrice,
  1097. RAM: terms.Memory,
  1098. GPU: terms.GPU,
  1099. Storage: terms.Storage,
  1100. BaseCPUPrice: aws.BaseCPUPrice,
  1101. BaseRAMPrice: aws.BaseRAMPrice,
  1102. BaseGPUPrice: aws.BaseGPUPrice,
  1103. UsageType: PreemptibleType,
  1104. }, nil
  1105. } else if sp, ok := aws.savingsPlanPricing(k.ID()); ok {
  1106. strCost := fmt.Sprintf("%f", sp.EffectiveCost)
  1107. return &Node{
  1108. Cost: strCost,
  1109. VCPU: terms.VCpu,
  1110. RAM: terms.Memory,
  1111. GPU: terms.GPU,
  1112. Storage: terms.Storage,
  1113. BaseCPUPrice: aws.BaseCPUPrice,
  1114. BaseRAMPrice: aws.BaseRAMPrice,
  1115. BaseGPUPrice: aws.BaseGPUPrice,
  1116. UsageType: usageType,
  1117. }, nil
  1118. } else if ri, ok := aws.reservedInstancePricing(k.ID()); ok {
  1119. strCost := fmt.Sprintf("%f", ri.EffectiveCost)
  1120. return &Node{
  1121. Cost: strCost,
  1122. VCPU: terms.VCpu,
  1123. RAM: terms.Memory,
  1124. GPU: terms.GPU,
  1125. Storage: terms.Storage,
  1126. BaseCPUPrice: aws.BaseCPUPrice,
  1127. BaseRAMPrice: aws.BaseRAMPrice,
  1128. BaseGPUPrice: aws.BaseGPUPrice,
  1129. UsageType: usageType,
  1130. }, nil
  1131. }
  1132. var cost string
  1133. c, ok := terms.OnDemand.PriceDimensions[terms.Sku+OnDemandRateCode+HourlyRateCode]
  1134. if ok {
  1135. cost = c.PricePerUnit.USD
  1136. } else {
  1137. // Check for Chinese pricing before throwing error
  1138. c, ok = terms.OnDemand.PriceDimensions[terms.Sku+OnDemandRateCodeCn+HourlyRateCodeCn]
  1139. if ok {
  1140. cost = c.PricePerUnit.CNY
  1141. } else {
  1142. return nil, fmt.Errorf("Could not fetch data for \"%s\"", k.ID())
  1143. }
  1144. }
  1145. return &Node{
  1146. Cost: cost,
  1147. VCPU: terms.VCpu,
  1148. RAM: terms.Memory,
  1149. GPU: terms.GPU,
  1150. Storage: terms.Storage,
  1151. BaseCPUPrice: aws.BaseCPUPrice,
  1152. BaseRAMPrice: aws.BaseRAMPrice,
  1153. BaseGPUPrice: aws.BaseGPUPrice,
  1154. UsageType: usageType,
  1155. }, nil
  1156. }
  1157. // NodePricing takes in a key from GetKey and returns a Node object for use in building the cost model.
  1158. func (aws *AWS) NodePricing(k Key) (*Node, error) {
  1159. aws.DownloadPricingDataLock.RLock()
  1160. defer aws.DownloadPricingDataLock.RUnlock()
  1161. key := k.Features()
  1162. usageType := "ondemand"
  1163. if aws.isPreemptible(key) {
  1164. usageType = PreemptibleType
  1165. }
  1166. terms, ok := aws.Pricing[key]
  1167. if ok {
  1168. return aws.createNode(terms, usageType, k)
  1169. } else if _, ok := aws.ValidPricingKeys[key]; ok {
  1170. aws.DownloadPricingDataLock.RUnlock()
  1171. err := aws.DownloadPricingData()
  1172. aws.DownloadPricingDataLock.RLock()
  1173. if err != nil {
  1174. return &Node{
  1175. Cost: aws.BaseCPUPrice,
  1176. BaseCPUPrice: aws.BaseCPUPrice,
  1177. BaseRAMPrice: aws.BaseRAMPrice,
  1178. BaseGPUPrice: aws.BaseGPUPrice,
  1179. UsageType: usageType,
  1180. UsesBaseCPUPrice: true,
  1181. }, err
  1182. }
  1183. terms, termsOk := aws.Pricing[key]
  1184. if !termsOk {
  1185. return &Node{
  1186. Cost: aws.BaseCPUPrice,
  1187. BaseCPUPrice: aws.BaseCPUPrice,
  1188. BaseRAMPrice: aws.BaseRAMPrice,
  1189. BaseGPUPrice: aws.BaseGPUPrice,
  1190. UsageType: usageType,
  1191. UsesBaseCPUPrice: true,
  1192. }, fmt.Errorf("Unable to find any Pricing data for \"%s\"", key)
  1193. }
  1194. return aws.createNode(terms, usageType, k)
  1195. } else { // Fall back to base pricing if we can't find the key. Base pricing is handled at the costmodel level.
  1196. return nil, fmt.Errorf("Invalid Pricing Key \"%s\"", key)
  1197. }
  1198. }
  1199. // ClusterInfo returns an object that represents the cluster. TODO: actually return the name of the cluster. Blocked on cluster federation.
  1200. func (awsProvider *AWS) ClusterInfo() (map[string]string, error) {
  1201. defaultClusterName := "AWS Cluster #1"
  1202. c, err := awsProvider.GetConfig()
  1203. if err != nil {
  1204. return nil, err
  1205. }
  1206. remoteEnabled := env.IsRemoteEnabled()
  1207. makeStructure := func(clusterName string) (map[string]string, error) {
  1208. m := make(map[string]string)
  1209. m["name"] = clusterName
  1210. m["provider"] = kubecost.AWSProvider
  1211. m["account"] = c.AthenaProjectID // this value requires configuration but is unavailable else where
  1212. m["region"] = awsProvider.clusterRegion
  1213. m["id"] = env.GetClusterID()
  1214. m["remoteReadEnabled"] = strconv.FormatBool(remoteEnabled)
  1215. m["provisioner"] = awsProvider.clusterProvisioner
  1216. return m, nil
  1217. }
  1218. if c.ClusterName != "" {
  1219. return makeStructure(c.ClusterName)
  1220. }
  1221. maybeClusterId := env.GetAWSClusterID()
  1222. if len(maybeClusterId) != 0 {
  1223. log.Infof("Returning \"%s\" as ClusterName", maybeClusterId)
  1224. return makeStructure(maybeClusterId)
  1225. }
  1226. log.Infof("Unable to sniff out cluster ID, perhaps set $%s to force one", env.AWSClusterIDEnvVar)
  1227. return makeStructure(defaultClusterName)
  1228. }
  1229. // updates the authentication to the latest values (via config or secret)
  1230. func (aws *AWS) ConfigureAuth() error {
  1231. c, err := aws.Config.GetCustomPricingData()
  1232. if err != nil {
  1233. log.Errorf("Error downloading default pricing data: %s", err.Error())
  1234. }
  1235. return aws.ConfigureAuthWith(c)
  1236. }
  1237. // updates the authentication to the latest values (via config or secret)
  1238. func (aws *AWS) ConfigureAuthWith(config *CustomPricing) error {
  1239. accessKeyID, accessKeySecret := aws.getAWSAuth(false, config)
  1240. if accessKeyID != "" && accessKeySecret != "" { // credentials may exist on the actual AWS node-- if so, use those. If not, override with the service key
  1241. err := env.Set(env.AWSAccessKeyIDEnvVar, accessKeyID)
  1242. if err != nil {
  1243. return err
  1244. }
  1245. err = env.Set(env.AWSAccessKeySecretEnvVar, accessKeySecret)
  1246. if err != nil {
  1247. return err
  1248. }
  1249. }
  1250. return nil
  1251. }
  1252. // Gets the aws key id and secret
  1253. func (aws *AWS) getAWSAuth(forceReload bool, cp *CustomPricing) (string, string) {
  1254. // 1. Check config values first (set from frontend UI)
  1255. if cp.ServiceKeyName != "" && cp.ServiceKeySecret != "" {
  1256. aws.serviceAccountChecks.set("hasKey", &ServiceAccountCheck{
  1257. Message: "AWS ServiceKey exists",
  1258. Status: true,
  1259. })
  1260. return cp.ServiceKeyName, cp.ServiceKeySecret
  1261. }
  1262. // 2. Check for secret
  1263. s, _ := aws.loadAWSAuthSecret(forceReload)
  1264. if s != nil && s.AccessKeyID != "" && s.SecretAccessKey != "" {
  1265. aws.serviceAccountChecks.set("hasKey", &ServiceAccountCheck{
  1266. Message: "AWS ServiceKey exists",
  1267. Status: true,
  1268. })
  1269. return s.AccessKeyID, s.SecretAccessKey
  1270. }
  1271. // 3. Fall back to env vars
  1272. if env.GetAWSAccessKeyID() == "" || env.GetAWSAccessKeyID() == "" {
  1273. aws.serviceAccountChecks.set("hasKey", &ServiceAccountCheck{
  1274. Message: "AWS ServiceKey exists",
  1275. Status: false,
  1276. })
  1277. } else {
  1278. aws.serviceAccountChecks.set("hasKey", &ServiceAccountCheck{
  1279. Message: "AWS ServiceKey exists",
  1280. Status: true,
  1281. })
  1282. }
  1283. return env.GetAWSAccessKeyID(), env.GetAWSAccessKeySecret()
  1284. }
  1285. // Load once and cache the result (even on failure). This is an install time secret, so
  1286. // we don't expect the secret to change. If it does, however, we can force reload using
  1287. // the input parameter.
  1288. func (aws *AWS) loadAWSAuthSecret(force bool) (*AWSAccessKey, error) {
  1289. if !force && loadedAWSSecret {
  1290. return awsSecret, nil
  1291. }
  1292. loadedAWSSecret = true
  1293. exists, err := fileutil.FileExists(authSecretPath)
  1294. if !exists || err != nil {
  1295. return nil, fmt.Errorf("Failed to locate service account file: %s", authSecretPath)
  1296. }
  1297. result, err := os.ReadFile(authSecretPath)
  1298. if err != nil {
  1299. return nil, err
  1300. }
  1301. var ak AWSAccessKey
  1302. err = json.Unmarshal(result, &ak)
  1303. if err != nil {
  1304. return nil, err
  1305. }
  1306. awsSecret = &ak
  1307. return awsSecret, nil
  1308. }
  1309. func (aws *AWS) getAddressesForRegion(ctx context.Context, region string) (*ec2.DescribeAddressesOutput, error) {
  1310. aak, err := aws.GetAWSAccessKey()
  1311. if err != nil {
  1312. return nil, err
  1313. }
  1314. cfg, err := aak.CreateConfig(region)
  1315. if err != nil {
  1316. return nil, err
  1317. }
  1318. cli := ec2.NewFromConfig(cfg)
  1319. return cli.DescribeAddresses(ctx, &ec2.DescribeAddressesInput{})
  1320. }
  1321. func (aws *AWS) getAllAddresses() ([]*ec2Types.Address, error) {
  1322. aws.ConfigureAuth() // load authentication data into env vars
  1323. addressCh := make(chan *ec2.DescribeAddressesOutput, len(awsRegions))
  1324. errorCh := make(chan error, len(awsRegions))
  1325. var wg sync.WaitGroup
  1326. wg.Add(len(awsRegions))
  1327. // Get volumes from each AWS region
  1328. for _, r := range awsRegions {
  1329. // Fetch IP address response and send results and errors to their
  1330. // respective channels
  1331. go func(region string) {
  1332. defer wg.Done()
  1333. defer errs.HandlePanic()
  1334. // Query for first page of volume results
  1335. resp, err := aws.getAddressesForRegion(context.TODO(), region)
  1336. if err != nil {
  1337. errorCh <- err
  1338. return
  1339. }
  1340. addressCh <- resp
  1341. }(r)
  1342. }
  1343. // Close the result channels after everything has been sent
  1344. go func() {
  1345. defer errs.HandlePanic()
  1346. wg.Wait()
  1347. close(errorCh)
  1348. close(addressCh)
  1349. }()
  1350. var addresses []*ec2Types.Address
  1351. for adds := range addressCh {
  1352. for _, add := range adds.Addresses {
  1353. a := add // duplicate to avoid pointer to iterator
  1354. addresses = append(addresses, &a)
  1355. }
  1356. }
  1357. var errs []error
  1358. for err := range errorCh {
  1359. log.DedupedWarningf(5, "unable to get addresses: %s", err)
  1360. errs = append(errs, err)
  1361. }
  1362. // Return error if no addresses are returned
  1363. if len(errs) > 0 && len(addresses) == 0 {
  1364. return nil, fmt.Errorf("%d error(s) retrieving addresses: %v", len(errs), errs)
  1365. }
  1366. return addresses, nil
  1367. }
  1368. // GetAddresses retrieves EC2 addresses
  1369. func (aws *AWS) GetAddresses() ([]byte, error) {
  1370. addresses, err := aws.getAllAddresses()
  1371. if err != nil {
  1372. return nil, err
  1373. }
  1374. // Format the response this way to match the JSON-encoded formatting of a single response
  1375. // from DescribeAddresss, so that consumers can always expect AWS disk responses to have
  1376. // a "Addresss" key at the top level.
  1377. return json.Marshal(map[string][]*ec2Types.Address{
  1378. "Addresses": addresses,
  1379. })
  1380. }
  1381. func (aws *AWS) isAddressOrphaned(address *ec2Types.Address) bool {
  1382. if address.AssociationId != nil {
  1383. return false
  1384. }
  1385. return true
  1386. }
  1387. func (aws *AWS) getDisksForRegion(ctx context.Context, region string, maxResults int32, nextToken *string) (*ec2.DescribeVolumesOutput, error) {
  1388. aak, err := aws.GetAWSAccessKey()
  1389. if err != nil {
  1390. return nil, err
  1391. }
  1392. cfg, err := aak.CreateConfig(region)
  1393. if err != nil {
  1394. return nil, err
  1395. }
  1396. cli := ec2.NewFromConfig(cfg)
  1397. return cli.DescribeVolumes(ctx, &ec2.DescribeVolumesInput{
  1398. MaxResults: &maxResults,
  1399. NextToken: nextToken,
  1400. })
  1401. }
  1402. func (aws *AWS) getAllDisks() ([]*ec2Types.Volume, error) {
  1403. aws.ConfigureAuth() // load authentication data into env vars
  1404. volumeCh := make(chan *ec2.DescribeVolumesOutput, len(awsRegions))
  1405. errorCh := make(chan error, len(awsRegions))
  1406. var wg sync.WaitGroup
  1407. wg.Add(len(awsRegions))
  1408. // Get volumes from each AWS region
  1409. for _, r := range awsRegions {
  1410. // Fetch volume response and send results and errors to their
  1411. // respective channels
  1412. go func(region string) {
  1413. defer wg.Done()
  1414. defer errs.HandlePanic()
  1415. // Query for first page of volume results
  1416. resp, err := aws.getDisksForRegion(context.TODO(), region, 1000, nil)
  1417. if err != nil {
  1418. errorCh <- err
  1419. return
  1420. }
  1421. volumeCh <- resp
  1422. // A NextToken indicates more pages of results. Keep querying
  1423. // until all pages are retrieved.
  1424. for resp.NextToken != nil {
  1425. resp, err = aws.getDisksForRegion(context.TODO(), region, 100, resp.NextToken)
  1426. if err != nil {
  1427. errorCh <- err
  1428. return
  1429. }
  1430. volumeCh <- resp
  1431. }
  1432. }(r)
  1433. }
  1434. // Close the result channels after everything has been sent
  1435. go func() {
  1436. defer errs.HandlePanic()
  1437. wg.Wait()
  1438. close(errorCh)
  1439. close(volumeCh)
  1440. }()
  1441. var volumes []*ec2Types.Volume
  1442. for vols := range volumeCh {
  1443. for _, vol := range vols.Volumes {
  1444. v := vol // duplicate to avoid pointer to iterator
  1445. volumes = append(volumes, &v)
  1446. }
  1447. }
  1448. var errs []error
  1449. for err := range errorCh {
  1450. log.DedupedWarningf(5, "unable to get disks: %s", err)
  1451. errs = append(errs, err)
  1452. }
  1453. // Return error if no volumes are returned
  1454. if len(errs) > 0 && len(volumes) == 0 {
  1455. return nil, fmt.Errorf("%d error(s) retrieving volumes: %v", len(errs), errs)
  1456. }
  1457. return volumes, nil
  1458. }
  1459. // GetDisks returns the AWS disks backing PVs. Useful because sometimes k8s will not clean up PVs correctly. Requires a json config in /var/configs with key region.
  1460. func (aws *AWS) GetDisks() ([]byte, error) {
  1461. volumes, err := aws.getAllDisks()
  1462. if err != nil {
  1463. return nil, err
  1464. }
  1465. // Format the response this way to match the JSON-encoded formatting of a single response
  1466. // from DescribeVolumes, so that consumers can always expect AWS disk responses to have
  1467. // a "Volumes" key at the top level.
  1468. return json.Marshal(map[string][]*ec2Types.Volume{
  1469. "Volumes": volumes,
  1470. })
  1471. }
  1472. func (aws *AWS) isDiskOrphaned(vol *ec2Types.Volume) bool {
  1473. // Do not consider volume orphaned if in use
  1474. if vol.State == InUseState {
  1475. return false
  1476. }
  1477. // Do not consider volume orphaned if volume is attached to any attachments
  1478. if len(vol.Attachments) != 0 {
  1479. for _, attachment := range vol.Attachments {
  1480. if attachment.State == AttachedState {
  1481. return false
  1482. }
  1483. }
  1484. }
  1485. return true
  1486. }
  1487. func (aws *AWS) GetOrphanedResources() ([]OrphanedResource, error) {
  1488. volumes, err := aws.getAllDisks()
  1489. if err != nil {
  1490. return nil, err
  1491. }
  1492. addresses, err := aws.getAllAddresses()
  1493. if err != nil {
  1494. return nil, err
  1495. }
  1496. var orphanedResources []OrphanedResource
  1497. for _, volume := range volumes {
  1498. if aws.isDiskOrphaned(volume) {
  1499. cost, err := aws.findCostForDisk(volume)
  1500. if err != nil {
  1501. return nil, err
  1502. }
  1503. var volumeSize int64
  1504. if volume.Size != nil {
  1505. volumeSize = int64(*volume.Size)
  1506. }
  1507. // This is turning us-east-1a into us-east-1
  1508. var zone string
  1509. if volume.AvailabilityZone != nil {
  1510. zone = *volume.AvailabilityZone
  1511. }
  1512. var region, url string
  1513. region = regionRx.FindString(zone)
  1514. if region != "" {
  1515. url = "https://console.aws.amazon.com/ec2/home?region=" + region + "#Volumes:sort=desc:createTime"
  1516. } else {
  1517. url = "https://console.aws.amazon.com/ec2/home?#Volumes:sort=desc:createTime"
  1518. }
  1519. or := OrphanedResource{
  1520. Kind: "disk",
  1521. Region: zone,
  1522. Size: &volumeSize,
  1523. DiskName: *volume.VolumeId,
  1524. Url: url,
  1525. MonthlyCost: cost,
  1526. }
  1527. orphanedResources = append(orphanedResources, or)
  1528. }
  1529. }
  1530. for _, address := range addresses {
  1531. if aws.isAddressOrphaned(address) {
  1532. cost := AWSHourlyPublicIPCost * timeutil.HoursPerMonth
  1533. desc := map[string]string{}
  1534. for _, tag := range address.Tags {
  1535. if tag.Key == nil {
  1536. continue
  1537. }
  1538. if tag.Value == nil {
  1539. desc[*tag.Key] = ""
  1540. } else {
  1541. desc[*tag.Key] = *tag.Value
  1542. }
  1543. }
  1544. or := OrphanedResource{
  1545. Kind: "address",
  1546. Address: *address.PublicIp,
  1547. Description: desc,
  1548. Url: "http://console.aws.amazon.com/ec2/home?#Addresses",
  1549. MonthlyCost: &cost,
  1550. }
  1551. orphanedResources = append(orphanedResources, or)
  1552. }
  1553. }
  1554. return orphanedResources, nil
  1555. }
  1556. func (aws *AWS) findCostForDisk(disk *ec2Types.Volume) (*float64, error) {
  1557. //todo: use AWS pricing from all regions
  1558. if disk.AvailabilityZone == nil {
  1559. return nil, fmt.Errorf("nil region")
  1560. }
  1561. if disk.Size == nil {
  1562. return nil, fmt.Errorf("nil disk size")
  1563. }
  1564. class := volTypes[string(disk.VolumeType)]
  1565. key := "us-east-2" + "," + class
  1566. priceStr := aws.Pricing[key].PV.Cost
  1567. price, err := strconv.ParseFloat(priceStr, 64)
  1568. if err != nil {
  1569. return nil, err
  1570. }
  1571. cost := price * timeutil.HoursPerMonth * float64(*disk.Size)
  1572. return &cost, nil
  1573. }
  1574. // QueryAthenaPaginated executes athena query and processes results.
  1575. func (aws *AWS) QueryAthenaPaginated(ctx context.Context, query string, fn func(*athena.GetQueryResultsOutput) bool) error {
  1576. awsAthenaInfo, err := aws.GetAWSAthenaInfo()
  1577. if err != nil {
  1578. return err
  1579. }
  1580. if awsAthenaInfo.AthenaDatabase == "" || awsAthenaInfo.AthenaTable == "" || awsAthenaInfo.AthenaRegion == "" ||
  1581. awsAthenaInfo.AthenaBucketName == "" || awsAthenaInfo.AccountID == "" {
  1582. return fmt.Errorf("QueryAthenaPaginated: athena configuration incomplete")
  1583. }
  1584. queryExecutionCtx := &athenaTypes.QueryExecutionContext{
  1585. Database: awsSDK.String(awsAthenaInfo.AthenaDatabase),
  1586. }
  1587. resultConfiguration := &athenaTypes.ResultConfiguration{
  1588. OutputLocation: awsSDK.String(awsAthenaInfo.AthenaBucketName),
  1589. }
  1590. startQueryExecutionInput := &athena.StartQueryExecutionInput{
  1591. QueryString: awsSDK.String(query),
  1592. QueryExecutionContext: queryExecutionCtx,
  1593. ResultConfiguration: resultConfiguration,
  1594. }
  1595. // Only set if there is a value, the default input is nil which defaults to the 'primary' workgroup
  1596. if awsAthenaInfo.AthenaWorkgroup != "" {
  1597. startQueryExecutionInput.WorkGroup = awsSDK.String(awsAthenaInfo.AthenaWorkgroup)
  1598. }
  1599. // Create Athena Client
  1600. cfg, err := awsAthenaInfo.CreateConfig()
  1601. if err != nil {
  1602. log.Errorf("Could not retrieve Athena Configuration: %s", err.Error())
  1603. }
  1604. cli := athena.NewFromConfig(cfg)
  1605. // Query Athena
  1606. startQueryExecutionOutput, err := cli.StartQueryExecution(ctx, startQueryExecutionInput)
  1607. if err != nil {
  1608. return fmt.Errorf("QueryAthenaPaginated: start query error: %s", err.Error())
  1609. }
  1610. err = waitForQueryToComplete(ctx, cli, startQueryExecutionOutput.QueryExecutionId)
  1611. if err != nil {
  1612. return fmt.Errorf("QueryAthenaPaginated: query execution error: %s", err.Error())
  1613. }
  1614. queryResultsInput := &athena.GetQueryResultsInput{
  1615. QueryExecutionId: startQueryExecutionOutput.QueryExecutionId,
  1616. }
  1617. getQueryResultsPaginator := athena.NewGetQueryResultsPaginator(cli, queryResultsInput)
  1618. for getQueryResultsPaginator.HasMorePages() {
  1619. pg, err := getQueryResultsPaginator.NextPage(ctx)
  1620. if err != nil {
  1621. log.Errorf("QueryAthenaPaginated: NextPage error: %s", err.Error())
  1622. continue
  1623. }
  1624. fn(pg)
  1625. }
  1626. return nil
  1627. }
  1628. func waitForQueryToComplete(ctx context.Context, client *athena.Client, queryExecutionID *string) error {
  1629. inp := &athena.GetQueryExecutionInput{
  1630. QueryExecutionId: queryExecutionID,
  1631. }
  1632. isQueryStillRunning := true
  1633. for isQueryStillRunning {
  1634. qe, err := client.GetQueryExecution(ctx, inp)
  1635. if err != nil {
  1636. return err
  1637. }
  1638. if qe.QueryExecution.Status.State == "SUCCEEDED" {
  1639. isQueryStillRunning = false
  1640. continue
  1641. }
  1642. if qe.QueryExecution.Status.State != "RUNNING" && qe.QueryExecution.Status.State != "QUEUED" {
  1643. return fmt.Errorf("no query results available for query %s", *queryExecutionID)
  1644. }
  1645. time.Sleep(2 * time.Second)
  1646. }
  1647. return nil
  1648. }
// SavingsPlanData holds one savings-plan usage row as read from Athena by
// GetSavingsPlanDataFromAthena.
type SavingsPlanData struct {
	// ResourceID is the row's line_item_resource_id value.
	ResourceID string
	// EffectiveCost is the row's savings_plan_savings_plan_rate value parsed
	// as a float.
	EffectiveCost float64
	// SavingsPlanARN is the row's savings_plan_savings_plan_a_r_n value.
	SavingsPlanARN string
	// MostRecentDate is the row's line_item_usage_start_date value.
	MostRecentDate string
}
  1655. func (aws *AWS) GetSavingsPlanDataFromAthena() error {
  1656. cfg, err := aws.GetConfig()
  1657. if err != nil {
  1658. aws.RIPricingError = err
  1659. return err
  1660. }
  1661. if cfg.AthenaBucketName == "" {
  1662. err = fmt.Errorf("No Athena Bucket configured")
  1663. aws.RIPricingError = err
  1664. return err
  1665. }
  1666. if aws.SavingsPlanDataByInstanceID == nil {
  1667. aws.SavingsPlanDataByInstanceID = make(map[string]*SavingsPlanData)
  1668. }
  1669. tNow := time.Now()
  1670. tOneDayAgo := tNow.Add(time.Duration(-25) * time.Hour) // Also get files from one day ago to avoid boundary conditions
  1671. start := tOneDayAgo.Format("2006-01-02")
  1672. end := tNow.Format("2006-01-02")
  1673. // Use Savings Plan Effective Rate as an estimation for cost, assuming the 1h most recent period got a fully loaded savings plan.
  1674. //
  1675. q := `SELECT
  1676. line_item_usage_start_date,
  1677. savings_plan_savings_plan_a_r_n,
  1678. line_item_resource_id,
  1679. savings_plan_savings_plan_rate
  1680. FROM %s as cost_data
  1681. WHERE line_item_usage_start_date BETWEEN date '%s' AND date '%s'
  1682. AND line_item_line_item_type = 'SavingsPlanCoveredUsage' ORDER BY
  1683. line_item_usage_start_date DESC`
  1684. page := 0
  1685. processResults := func(op *athena.GetQueryResultsOutput) bool {
  1686. if op == nil {
  1687. log.Errorf("GetSavingsPlanDataFromAthena: Athena page is nil")
  1688. return false
  1689. } else if op.ResultSet == nil {
  1690. log.Errorf("GetSavingsPlanDataFromAthena: Athena page.ResultSet is nil")
  1691. return false
  1692. }
  1693. aws.SavingsPlanDataLock.Lock()
  1694. aws.SavingsPlanDataByInstanceID = make(map[string]*SavingsPlanData) // Clean out the old data and only report a savingsplan price if its in the most recent run.
  1695. mostRecentDate := ""
  1696. iter := op.ResultSet.Rows
  1697. if page == 0 && len(iter) > 0 {
  1698. iter = op.ResultSet.Rows[1:len(op.ResultSet.Rows)]
  1699. }
  1700. page++
  1701. for _, r := range iter {
  1702. d := *r.Data[0].VarCharValue
  1703. if mostRecentDate == "" {
  1704. mostRecentDate = d
  1705. } else if mostRecentDate != d { // Get all most recent assignments
  1706. break
  1707. }
  1708. cost, err := strconv.ParseFloat(*r.Data[3].VarCharValue, 64)
  1709. if err != nil {
  1710. log.Infof("Error converting `%s` from float ", *r.Data[3].VarCharValue)
  1711. }
  1712. r := &SavingsPlanData{
  1713. ResourceID: *r.Data[2].VarCharValue,
  1714. EffectiveCost: cost,
  1715. SavingsPlanARN: *r.Data[1].VarCharValue,
  1716. MostRecentDate: d,
  1717. }
  1718. aws.SavingsPlanDataByInstanceID[r.ResourceID] = r
  1719. }
  1720. log.Debugf("Found %d savings plan applied instances", len(aws.SavingsPlanDataByInstanceID))
  1721. for k, r := range aws.SavingsPlanDataByInstanceID {
  1722. log.DedupedInfof(5, "Savings Plan Instance Data found for node %s : %f at time %s", k, r.EffectiveCost, r.MostRecentDate)
  1723. }
  1724. aws.SavingsPlanDataLock.Unlock()
  1725. return true
  1726. }
  1727. query := fmt.Sprintf(q, cfg.AthenaTable, start, end)
  1728. log.Debugf("Running Query: %s", query)
  1729. err = aws.QueryAthenaPaginated(context.TODO(), query, processResults)
  1730. if err != nil {
  1731. aws.RIPricingError = err
  1732. return fmt.Errorf("Error fetching Savings Plan Data: %s", err)
  1733. }
  1734. return nil
  1735. }
// RIData holds one reserved-instance usage row as read from Athena by
// GetReservationDataFromAthena.
type RIData struct {
	// ResourceID is the row's line_item_resource_id value.
	ResourceID string
	// EffectiveCost is the row's reservation_effective_cost value parsed as
	// a float.
	EffectiveCost float64
	// ReservationARN is the row's reservation_reservation_a_r_n value.
	ReservationARN string
	// MostRecentDate is the row's line_item_usage_start_date value.
	MostRecentDate string
}
  1742. func (aws *AWS) GetReservationDataFromAthena() error {
  1743. cfg, err := aws.GetConfig()
  1744. if err != nil {
  1745. aws.RIPricingError = err
  1746. return err
  1747. }
  1748. if cfg.AthenaBucketName == "" {
  1749. err = fmt.Errorf("No Athena Bucket configured")
  1750. aws.RIPricingError = err
  1751. return err
  1752. }
  1753. // Query for all column names in advance in order to validate configured
  1754. // label columns
  1755. columns, _ := aws.fetchColumns()
  1756. if !columns["reservation_reservation_a_r_n"] || !columns["reservation_effective_cost"] {
  1757. err = fmt.Errorf("no reservation data available in Athena")
  1758. aws.RIPricingError = err
  1759. return err
  1760. }
  1761. if aws.RIPricingByInstanceID == nil {
  1762. aws.RIPricingByInstanceID = make(map[string]*RIData)
  1763. }
  1764. tNow := time.Now()
  1765. tOneDayAgo := tNow.Add(time.Duration(-25) * time.Hour) // Also get files from one day ago to avoid boundary conditions
  1766. start := tOneDayAgo.Format("2006-01-02")
  1767. end := tNow.Format("2006-01-02")
  1768. q := `SELECT
  1769. line_item_usage_start_date,
  1770. reservation_reservation_a_r_n,
  1771. line_item_resource_id,
  1772. reservation_effective_cost
  1773. FROM %s as cost_data
  1774. WHERE line_item_usage_start_date BETWEEN date '%s' AND date '%s'
  1775. AND reservation_reservation_a_r_n <> '' ORDER BY
  1776. line_item_usage_start_date DESC`
  1777. page := 0
  1778. processResults := func(op *athena.GetQueryResultsOutput) bool {
  1779. if op == nil {
  1780. log.Errorf("GetReservationDataFromAthena: Athena page is nil")
  1781. return false
  1782. } else if op.ResultSet == nil {
  1783. log.Errorf("GetReservationDataFromAthena: Athena page.ResultSet is nil")
  1784. return false
  1785. }
  1786. aws.RIDataLock.Lock()
  1787. aws.RIPricingByInstanceID = make(map[string]*RIData) // Clean out the old data and only report a RI price if its in the most recent run.
  1788. mostRecentDate := ""
  1789. iter := op.ResultSet.Rows
  1790. if page == 0 && len(iter) > 0 {
  1791. iter = op.ResultSet.Rows[1:len(op.ResultSet.Rows)]
  1792. }
  1793. page++
  1794. for _, r := range iter {
  1795. d := *r.Data[0].VarCharValue
  1796. if mostRecentDate == "" {
  1797. mostRecentDate = d
  1798. } else if mostRecentDate != d { // Get all most recent assignments
  1799. break
  1800. }
  1801. cost, err := strconv.ParseFloat(*r.Data[3].VarCharValue, 64)
  1802. if err != nil {
  1803. log.Infof("Error converting `%s` from float ", *r.Data[3].VarCharValue)
  1804. }
  1805. r := &RIData{
  1806. ResourceID: *r.Data[2].VarCharValue,
  1807. EffectiveCost: cost,
  1808. ReservationARN: *r.Data[1].VarCharValue,
  1809. MostRecentDate: d,
  1810. }
  1811. aws.RIPricingByInstanceID[r.ResourceID] = r
  1812. }
  1813. log.Debugf("Found %d reserved instances", len(aws.RIPricingByInstanceID))
  1814. for k, r := range aws.RIPricingByInstanceID {
  1815. log.DedupedInfof(5, "Reserved Instance Data found for node %s : %f at time %s", k, r.EffectiveCost, r.MostRecentDate)
  1816. }
  1817. aws.RIDataLock.Unlock()
  1818. return true
  1819. }
  1820. query := fmt.Sprintf(q, cfg.AthenaTable, start, end)
  1821. log.Debugf("Running Query: %s", query)
  1822. err = aws.QueryAthenaPaginated(context.TODO(), query, processResults)
  1823. if err != nil {
  1824. aws.RIPricingError = err
  1825. return fmt.Errorf("Error fetching Reserved Instance Data: %s", err)
  1826. }
  1827. aws.RIPricingError = nil
  1828. return nil
  1829. }
  1830. // fetchColumns returns a list of the names of all columns in the configured
  1831. // Athena tables
  1832. func (aws *AWS) fetchColumns() (map[string]bool, error) {
  1833. columnSet := map[string]bool{}
  1834. awsAthenaInfo, err := aws.GetAWSAthenaInfo()
  1835. if err != nil {
  1836. return nil, err
  1837. }
  1838. // This Query is supported by Athena tables and views
  1839. q := `SELECT column_name FROM information_schema.columns WHERE table_schema = '%s' AND table_name = '%s'`
  1840. query := fmt.Sprintf(q, awsAthenaInfo.AthenaDatabase, awsAthenaInfo.AthenaTable)
  1841. pageNum := 0
  1842. athenaErr := aws.QueryAthenaPaginated(context.TODO(), query, func(page *athena.GetQueryResultsOutput) bool {
  1843. if page == nil {
  1844. log.Errorf("fetchColumns: Athena page is nil")
  1845. return false
  1846. } else if page.ResultSet == nil {
  1847. log.Errorf("fetchColumns: Athena page.ResultSet is nil")
  1848. return false
  1849. }
  1850. // remove header row 'column_name'
  1851. rows := page.ResultSet.Rows[1:]
  1852. for _, row := range rows {
  1853. columnSet[*row.Data[0].VarCharValue] = true
  1854. }
  1855. pageNum++
  1856. return true
  1857. })
  1858. if athenaErr != nil {
  1859. return columnSet, athenaErr
  1860. }
  1861. if len(columnSet) == 0 {
  1862. log.Infof("No columns retrieved from Athena")
  1863. }
  1864. return columnSet, nil
  1865. }
// spotInfo is one record of a spot data feed file as decoded by
// parseSpotData. The csv tags give the column name each field is decoded
// from; all values are kept as the raw strings found in the file.
type spotInfo struct {
	Timestamp   string `csv:"Timestamp"`
	UsageType   string `csv:"UsageType"`
	Operation   string `csv:"Operation"`
	InstanceID  string `csv:"InstanceID"` // used by parseSpotData as the key of its result map
	MyBidID     string `csv:"MyBidID"`
	MyMaxPrice  string `csv:"MyMaxPrice"`
	MarketPrice string `csv:"MarketPrice"`
	Charge      string `csv:"Charge"`
	Version     string `csv:"Version"`
}
  1877. func (aws *AWS) parseSpotData(bucket string, prefix string, projectID string, region string) (map[string]*spotInfo, error) {
  1878. aws.ConfigureAuth() // configure aws api authentication by setting env vars
  1879. s3Prefix := projectID
  1880. if len(prefix) != 0 {
  1881. s3Prefix = prefix + "/" + s3Prefix
  1882. }
  1883. aak, err := aws.GetAWSAccessKey()
  1884. if err != nil {
  1885. return nil, err
  1886. }
  1887. cfg, err := aak.CreateConfig(region)
  1888. if err != nil {
  1889. return nil, err
  1890. }
  1891. cli := s3.NewFromConfig(cfg)
  1892. downloader := manager.NewDownloader(cli)
  1893. tNow := time.Now()
  1894. tOneDayAgo := tNow.Add(time.Duration(-24) * time.Hour) // Also get files from one day ago to avoid boundary conditions
  1895. ls := &s3.ListObjectsInput{
  1896. Bucket: awsSDK.String(bucket),
  1897. Prefix: awsSDK.String(s3Prefix + "." + tOneDayAgo.Format("2006-01-02")),
  1898. }
  1899. ls2 := &s3.ListObjectsInput{
  1900. Bucket: awsSDK.String(bucket),
  1901. Prefix: awsSDK.String(s3Prefix + "." + tNow.Format("2006-01-02")),
  1902. }
  1903. lso, err := cli.ListObjects(context.TODO(), ls)
  1904. if err != nil {
  1905. aws.serviceAccountChecks.set("bucketList", &ServiceAccountCheck{
  1906. Message: "Bucket List Permissions Available",
  1907. Status: false,
  1908. AdditionalInfo: err.Error(),
  1909. })
  1910. return nil, err
  1911. } else {
  1912. aws.serviceAccountChecks.set("bucketList", &ServiceAccountCheck{
  1913. Message: "Bucket List Permissions Available",
  1914. Status: true,
  1915. })
  1916. }
  1917. lsoLen := len(lso.Contents)
  1918. log.Debugf("Found %d spot data files from yesterday", lsoLen)
  1919. if lsoLen == 0 {
  1920. log.Debugf("ListObjects \"s3://%s/%s\" produced no keys", *ls.Bucket, *ls.Prefix)
  1921. }
  1922. lso2, err := cli.ListObjects(context.TODO(), ls2)
  1923. if err != nil {
  1924. return nil, err
  1925. }
  1926. lso2Len := len(lso2.Contents)
  1927. log.Debugf("Found %d spot data files from today", lso2Len)
  1928. if lso2Len == 0 {
  1929. log.Debugf("ListObjects \"s3://%s/%s\" produced no keys", *ls2.Bucket, *ls2.Prefix)
  1930. }
  1931. // TODO: Worth it to use LastModifiedDate to determine if we should reparse the spot data?
  1932. var keys []*string
  1933. for _, obj := range lso.Contents {
  1934. keys = append(keys, obj.Key)
  1935. }
  1936. for _, obj := range lso2.Contents {
  1937. keys = append(keys, obj.Key)
  1938. }
  1939. header, err := csvutil.Header(spotInfo{}, "csv")
  1940. if err != nil {
  1941. return nil, err
  1942. }
  1943. fieldsPerRecord := len(header)
  1944. spots := make(map[string]*spotInfo)
  1945. for _, key := range keys {
  1946. getObj := &s3.GetObjectInput{
  1947. Bucket: awsSDK.String(bucket),
  1948. Key: key,
  1949. }
  1950. buf := manager.NewWriteAtBuffer([]byte{})
  1951. _, err := downloader.Download(context.TODO(), buf, getObj)
  1952. if err != nil {
  1953. aws.serviceAccountChecks.set("objectList", &ServiceAccountCheck{
  1954. Message: "Object Get Permissions Available",
  1955. Status: false,
  1956. AdditionalInfo: err.Error(),
  1957. })
  1958. return nil, err
  1959. } else {
  1960. aws.serviceAccountChecks.set("objectList", &ServiceAccountCheck{
  1961. Message: "Object Get Permissions Available",
  1962. Status: true,
  1963. })
  1964. }
  1965. r := bytes.NewReader(buf.Bytes())
  1966. gr, err := gzip.NewReader(r)
  1967. if err != nil {
  1968. return nil, err
  1969. }
  1970. csvReader := csv.NewReader(gr)
  1971. csvReader.Comma = '\t'
  1972. csvReader.FieldsPerRecord = fieldsPerRecord
  1973. dec, err := csvutil.NewDecoder(csvReader, header...)
  1974. if err != nil {
  1975. return nil, err
  1976. }
  1977. var foundVersion string
  1978. for {
  1979. spot := spotInfo{}
  1980. err := dec.Decode(&spot)
  1981. csvParseErr, isCsvParseErr := err.(*csv.ParseError)
  1982. if err == io.EOF {
  1983. break
  1984. } else if err == csvutil.ErrFieldCount || (isCsvParseErr && csvParseErr.Err == csv.ErrFieldCount) {
  1985. rec := dec.Record()
  1986. // the first two "Record()" will be the comment lines
  1987. // and they show up as len() == 1
  1988. // the first of which is "#Version"
  1989. // the second of which is "#Fields: "
  1990. if len(rec) != 1 {
  1991. log.Infof("Expected %d spot info fields but received %d: %s", fieldsPerRecord, len(rec), rec)
  1992. continue
  1993. }
  1994. if len(foundVersion) == 0 {
  1995. spotFeedVersion := rec[0]
  1996. log.Debugf("Spot feed version is \"%s\"", spotFeedVersion)
  1997. matches := versionRx.FindStringSubmatch(spotFeedVersion)
  1998. if matches != nil {
  1999. foundVersion = matches[1]
  2000. if foundVersion != supportedSpotFeedVersion {
  2001. log.Infof("Unsupported spot info feed version: wanted \"%s\" got \"%s\"", supportedSpotFeedVersion, foundVersion)
  2002. break
  2003. }
  2004. }
  2005. continue
  2006. } else if strings.Index(rec[0], "#") == 0 {
  2007. continue
  2008. } else {
  2009. log.Infof("skipping non-TSV line: %s", rec)
  2010. continue
  2011. }
  2012. } else if err != nil {
  2013. log.Warnf("Error during spot info decode: %+v", err)
  2014. continue
  2015. }
  2016. log.DedupedInfof(5, "Found spot info for: %s", spot.InstanceID)
  2017. spots[spot.InstanceID] = &spot
  2018. }
  2019. gr.Close()
  2020. }
  2021. return spots, nil
  2022. }
// ApplyReservedInstancePricing is currently a no-op: the body is empty, so
// nodes is left untouched.
// TODO: implement.
func (aws *AWS) ApplyReservedInstancePricing(nodes map[string]*Node) {
}
  2026. func (aws *AWS) ServiceAccountStatus() *ServiceAccountStatus {
  2027. return aws.serviceAccountChecks.getStatus()
  2028. }
  2029. func (aws *AWS) CombinedDiscountForNode(instanceType string, isPreemptible bool, defaultDiscount, negotiatedDiscount float64) float64 {
  2030. return 1.0 - ((1.0 - defaultDiscount) * (1.0 - negotiatedDiscount))
  2031. }
  2032. // Regions returns a predefined list of AWS regions
  2033. func (aws *AWS) Regions() []string {
  2034. return awsRegions
  2035. }