awsprovider.go 39 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320
  1. package cloud
  2. import (
  3. "bytes"
  4. "compress/gzip"
  5. "encoding/csv"
  6. "encoding/json"
  7. "fmt"
  8. "io"
  9. "io/ioutil"
  10. "net/http"
  11. "net/url"
  12. "os"
  13. "regexp"
  14. "strconv"
  15. "strings"
  16. "sync"
  17. "time"
  18. "k8s.io/klog"
  19. "github.com/aws/aws-sdk-go/aws"
  20. "github.com/aws/aws-sdk-go/aws/awserr"
  21. "github.com/aws/aws-sdk-go/aws/session"
  22. "github.com/aws/aws-sdk-go/service/athena"
  23. "github.com/aws/aws-sdk-go/service/ec2"
  24. "github.com/aws/aws-sdk-go/service/s3"
  25. "github.com/aws/aws-sdk-go/service/s3/s3manager"
  26. "github.com/jszwec/csvutil"
  27. v1 "k8s.io/api/core/v1"
  28. metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
  29. "k8s.io/client-go/kubernetes"
  30. )
// awsAccessKeyIDEnvVar and awsAccessKeySecretEnvVar name the environment
// variables this file sets (see GetDisks) to hand AWS credentials to the SDK.
const awsAccessKeyIDEnvVar = "AWS_ACCESS_KEY_ID"
const awsAccessKeySecretEnvVar = "AWS_SECRET_ACCESS_KEY"

// supportedSpotFeedVersion is not referenced in the visible part of this file;
// presumably the spot data feed version the parser accepts — TODO confirm.
const supportedSpotFeedVersion = "1"

// SpotInfoUpdateType is the UpdateConfig updateType whose payload is an AwsSpotFeedInfo.
const SpotInfoUpdateType = "spotinfo"

// AthenaInfoUpdateType is the UpdateConfig updateType whose payload is an AwsAthenaInfo.
const AthenaInfoUpdateType = "athenainfo"
// AWS represents an Amazon Provider.
// It holds the pricing tables built by DownloadPricingData together with the
// settings that DownloadPricingData copies from the aws.json pricing config.
type AWS struct {
	// Pricing maps a feature key to its product terms. Node keys have the form
	// "region,instanceType,os" (optionally suffixed with ",preemptible");
	// EBS volume keys have the form "region,usageType".
	Pricing map[string]*AWSProductTerms
	// SpotPricingByInstanceID is filled from parseSpotData and is looked up
	// by Key.ID() in createNode.
	SpotPricingByInstanceID map[string]*spotInfo
	// ValidPricingKeys records every node/volume key derived from the price
	// list, whether or not a cluster node currently uses it.
	ValidPricingKeys map[string]bool
	// Clientset is used to list nodes, persistent volumes and storage classes.
	Clientset *kubernetes.Clientset
	// The string settings below are copied from the pricing config on every
	// DownloadPricingData call.
	BaseCPUPrice string
	BaseRAMPrice string
	BaseGPUPrice string
	BaseSpotCPUPrice string
	BaseSpotRAMPrice string
	SpotLabelName string
	SpotLabelValue string
	ServiceKeyName string
	ServiceKeySecret string
	SpotDataRegion string
	SpotDataBucket string
	SpotDataPrefix string
	ProjectID string
	// DownloadPricingDataLock is write-locked by DownloadPricingData and
	// read-locked by AllNodePricing and NodePricing.
	DownloadPricingDataLock sync.RWMutex
	*CustomProvider
}
// AWSPricing mirrors the top level of the AWS price list JSON document:
// a "products" object and a "terms" object.
type AWSPricing struct {
	Products map[string]*AWSProduct `json:"products"`
	Terms AWSPricingTerms `json:"terms"`
}
// AWSProduct represents a purchased SKU: one entry of the price list's
// "products" object, carrying the SKU and its descriptive attributes.
type AWSProduct struct {
	Sku string `json:"sku"`
	Attributes AWSProductAttributes `json:"attributes"`
}
// AWSProductAttributes represents metadata about the product used to map to a node.
// DownloadPricingData reads Location, InstanceType, OperatingSystem, UsageType
// and PreInstalledSw to build pricing keys; the remaining fields are copied
// into AWSProductTerms. All values are kept as the strings found in the JSON.
type AWSProductAttributes struct {
	Location string `json:"location"`
	InstanceType string `json:"instanceType"`
	Memory string `json:"memory"`
	Storage string `json:"storage"`
	VCpu string `json:"vcpu"`
	UsageType string `json:"usagetype"`
	OperatingSystem string `json:"operatingSystem"`
	PreInstalledSw string `json:"preInstalledSw"`
	InstanceFamily string `json:"instanceFamily"`
	GPU string `json:"gpu"` // GPU represents the number of GPU on the instance
}
// AWSPricingTerms are how you pay for the node: OnDemand, Reserved, or (TODO) Spot.
// Each map is a two-level lookup of offer terms.
// NOTE(review): DownloadPricingData's token walk treats the outer key as the
// SKU and the inner key as SKU plus rate code — confirm against the price list.
type AWSPricingTerms struct {
	OnDemand map[string]map[string]*AWSOfferTerm `json:"OnDemand"`
	Reserved map[string]map[string]*AWSOfferTerm `json:"Reserved"`
}
// AWSOfferTerm is a sku extension used to pay for the node.
// PriceDimensions is keyed by rate code; this file looks entries up with
// sku + OnDemandRateCode + HourlyRateCode.
type AWSOfferTerm struct {
	Sku string `json:"sku"`
	PriceDimensions map[string]*AWSRateCode `json:"priceDimensions"`
}
// AWSRateCode encodes data about the price of a product: the unit the price
// applies to and the price per unit.
type AWSRateCode struct {
	Unit string `json:"unit"`
	PricePerUnit AWSCurrencyCode `json:"pricePerUnit"`
}
// AWSCurrencyCode is the localized currency. (TODO: support non-USD)
// The amount is kept as the string found in the JSON, not parsed to a number.
type AWSCurrencyCode struct {
	USD string `json:"USD"`
}
// AWSProductTerms represents the full terms of the product.
// It is the value type of AWS.Pricing: instance entries carry the
// Memory/Storage/VCpu/GPU attributes, EBS volume entries carry PV instead.
// OnDemand is attached later, when the price list's "terms" section is parsed.
type AWSProductTerms struct {
	Sku string `json:"sku"`
	OnDemand *AWSOfferTerm `json:"OnDemand"`
	Reserved *AWSOfferTerm `json:"Reserved"`
	Memory string `json:"memory"`
	Storage string `json:"storage"`
	VCpu string `json:"vcpu"`
	GPU string `json:"gpu"` // GPU represents the number of GPU on the instance
	PV *PV `json:"pv"`
}
// ClusterIdEnvVar is the environment variable in which one can manually set the ClusterId.
// When it is non-empty, ClusterInfo returns its value as the cluster name.
const ClusterIdEnvVar = "AWS_CLUSTER_ID"

// OnDemandRateCode is appended to a node SKU to form the on-demand offer term code.
const OnDemandRateCode = ".JRTCKXETXF"

// ReservedRateCode is appended to a node SKU.
// It is not referenced in the visible part of this file.
const ReservedRateCode = ".38NPMPTW36"

// HourlyRateCode is appended to a node SKU (after OnDemandRateCode) to form
// the key used to look up an entry in AWSOfferTerm.PriceDimensions.
const HourlyRateCode = ".6YS6EN2CT7"
// volTypes are used to map between AWS UsageTypes and
// EBS volume types, as they would appear in K8s storage class
// name and the EC2 API.
//
// The table is bidirectional: the first group maps a usage type to a volume
// type, the second maps a volume type back to a usage type. Two usage types
// map to "io1", while "io1" maps back only to "EBS:VolumeUsage.piops".
var volTypes = map[string]string{
	"EBS:VolumeUsage.gp2": "gp2",
	"EBS:VolumeUsage": "standard",
	"EBS:VolumeUsage.sc1": "sc1",
	"EBS:VolumeP-IOPS.piops": "io1",
	"EBS:VolumeUsage.st1": "st1",
	"EBS:VolumeUsage.piops": "io1",
	"gp2": "EBS:VolumeUsage.gp2",
	"standard": "EBS:VolumeUsage",
	"sc1": "EBS:VolumeUsage.sc1",
	"io1": "EBS:VolumeUsage.piops",
	"st1": "EBS:VolumeUsage.st1",
}
// locationToRegion maps AWS region names (as they come from Billing)
// to actual region identifiers.
// A location that is missing from this table yields the empty string when
// looked up, so keys built from it start with a bare comma.
var locationToRegion = map[string]string{
	"US East (Ohio)": "us-east-2",
	"US East (N. Virginia)": "us-east-1",
	"US West (N. California)": "us-west-1",
	"US West (Oregon)": "us-west-2",
	"Asia Pacific (Hong Kong)": "ap-east-1",
	"Asia Pacific (Mumbai)": "ap-south-1",
	"Asia Pacific (Osaka-Local)": "ap-northeast-3",
	"Asia Pacific (Seoul)": "ap-northeast-2",
	"Asia Pacific (Singapore)": "ap-southeast-1",
	"Asia Pacific (Sydney)": "ap-southeast-2",
	"Asia Pacific (Tokyo)": "ap-northeast-1",
	"Canada (Central)": "ca-central-1",
	"China (Beijing)": "cn-north-1",
	"China (Ningxia)": "cn-northwest-1",
	"EU (Frankfurt)": "eu-central-1",
	"EU (Ireland)": "eu-west-1",
	"EU (London)": "eu-west-2",
	"EU (Paris)": "eu-west-3",
	"EU (Stockholm)": "eu-north-1",
	"South America (Sao Paulo)": "sa-east-1",
	"AWS GovCloud (US-East)": "us-gov-east-1",
	"AWS GovCloud (US)": "us-gov-west-1",
}
// regionToBillingRegionCode maps a region identifier to a short region code.
// It is not referenced in the visible part of this file.
// NOTE(review): presumably these are the prefixes AWS billing puts in front of
// usage types (us-east-1 and the China regions having none) — confirm.
var regionToBillingRegionCode = map[string]string{
	"us-east-2": "USE2",
	"us-east-1": "",
	"us-west-1": "USW1",
	"us-west-2": "USW2",
	"ap-east-1": "APE1",
	"ap-south-1": "APS3",
	"ap-northeast-3": "APN3",
	"ap-northeast-2": "APN2",
	"ap-southeast-1": "APS1",
	"ap-southeast-2": "APS2",
	"ap-northeast-1": "APN1",
	"ca-central-1": "CAN1",
	"cn-north-1": "",
	"cn-northwest-1": "",
	"eu-central-1": "EUC1",
	"eu-west-1": "EU",
	"eu-west-2": "EUW2",
	"eu-west-3": "EUW3",
	"eu-north-1": "EUN1",
	"sa-east-1": "SAE1",
	"us-gov-east-1": "UGE1",
	"us-gov-west-1": "UGW1",
}
// GetLocalStorageQuery always returns an empty query string and a nil error;
// this provider supplies no local-storage query.
func (aws *AWS) GetLocalStorageQuery() (string, error) {
	return "", nil
}
  188. // KubeAttrConversion maps the k8s labels for region to an aws region
  189. func (aws *AWS) KubeAttrConversion(location, instanceType, operatingSystem string) string {
  190. operatingSystem = strings.ToLower(operatingSystem)
  191. region := locationToRegion[location]
  192. return region + "," + instanceType + "," + operatingSystem
  193. }
// AwsSpotFeedInfo is the JSON payload UpdateConfig decodes for the
// SpotInfoUpdateType update; its fields are copied onto the stored pricing
// configuration. Note that AccountID travels under the JSON name "projectID".
type AwsSpotFeedInfo struct {
	BucketName string `json:"bucketName"`
	Prefix string `json:"prefix"`
	Region string `json:"region"`
	AccountID string `json:"projectID"`
	ServiceKeyName string `json:"serviceKeyName"`
	ServiceKeySecret string `json:"serviceKeySecret"`
	SpotLabel string `json:"spotLabel"`
	SpotLabelValue string `json:"spotLabelValue"`
}
// AwsAthenaInfo is the JSON payload UpdateConfig decodes for the
// AthenaInfoUpdateType update; its fields are copied onto the stored pricing
// configuration. Note that AccountID travels under the JSON name "projectID".
type AwsAthenaInfo struct {
	AthenaBucketName string `json:"athenaBucketName"`
	AthenaRegion string `json:"athenaRegion"`
	AthenaDatabase string `json:"athenaDatabase"`
	AthenaTable string `json:"athenaTable"`
	ServiceKeyName string `json:"serviceKeyName"`
	ServiceKeySecret string `json:"serviceKeySecret"`
	AccountID string `json:"projectID"`
}
  213. func (aws *AWS) GetManagementPlatform() (string, error) {
  214. nodes, err := aws.Clientset.CoreV1().Nodes().List(metav1.ListOptions{})
  215. if err != nil {
  216. return "", err
  217. }
  218. if len(nodes.Items) > 0 {
  219. n := nodes.Items[0]
  220. version := n.Status.NodeInfo.KubeletVersion
  221. if strings.Contains(version, "eks") {
  222. return "eks", nil
  223. }
  224. if _, ok := n.Labels["kops.k8s.io/instancegroup"]; ok {
  225. return "kops", nil
  226. }
  227. }
  228. return "", nil
  229. }
  230. func (aws *AWS) GetConfig() (*CustomPricing, error) {
  231. c, err := GetDefaultPricingData("aws.json")
  232. if c.Discount == "" {
  233. c.Discount = "0%"
  234. }
  235. if err != nil {
  236. return nil, err
  237. }
  238. return c, nil
  239. }
  240. func (aws *AWS) UpdateConfig(r io.Reader, updateType string) (*CustomPricing, error) {
  241. c, err := GetDefaultPricingData("aws.json")
  242. if err != nil {
  243. return nil, err
  244. }
  245. if updateType == SpotInfoUpdateType {
  246. a := AwsSpotFeedInfo{}
  247. err := json.NewDecoder(r).Decode(&a)
  248. if err != nil {
  249. return nil, err
  250. }
  251. if err != nil {
  252. return nil, err
  253. }
  254. c.ServiceKeyName = a.ServiceKeyName
  255. c.ServiceKeySecret = a.ServiceKeySecret
  256. c.SpotDataPrefix = a.Prefix
  257. c.SpotDataBucket = a.BucketName
  258. c.ProjectID = a.AccountID
  259. c.SpotDataRegion = a.Region
  260. c.SpotLabel = a.SpotLabel
  261. c.SpotLabelValue = a.SpotLabelValue
  262. } else if updateType == AthenaInfoUpdateType {
  263. a := AwsAthenaInfo{}
  264. err := json.NewDecoder(r).Decode(&a)
  265. if err != nil {
  266. return nil, err
  267. }
  268. c.AthenaBucketName = a.AthenaBucketName
  269. c.AthenaRegion = a.AthenaRegion
  270. c.AthenaDatabase = a.AthenaDatabase
  271. c.AthenaTable = a.AthenaTable
  272. c.ServiceKeyName = a.ServiceKeyName
  273. c.ServiceKeySecret = a.ServiceKeySecret
  274. c.ProjectID = a.AccountID
  275. } else {
  276. a := make(map[string]string)
  277. err = json.NewDecoder(r).Decode(&a)
  278. if err != nil {
  279. return nil, err
  280. }
  281. for k, v := range a {
  282. kUpper := strings.Title(k) // Just so we consistently supply / receive the same values, uppercase the first letter.
  283. err := SetCustomPricingField(c, kUpper, v)
  284. if err != nil {
  285. return nil, err
  286. }
  287. }
  288. }
  289. cj, err := json.Marshal(c)
  290. if err != nil {
  291. return nil, err
  292. }
  293. path := os.Getenv("CONFIG_PATH")
  294. if path == "" {
  295. path = "/models/"
  296. }
  297. path += "aws.json"
  298. err = ioutil.WriteFile(path, cj, 0644)
  299. if err != nil {
  300. return nil, err
  301. }
  302. return c, nil
  303. }
// awsKey is the Key built by AWS.GetKey for a node. It carries the node's
// labels plus the configured spot label name/value that Features uses to
// decide whether the node is preemptible.
type awsKey struct {
	SpotLabelName string
	SpotLabelValue string
	Labels map[string]string
	// ProviderID is expected in the form aws:///us-east-2a/i-0fea4fd46592d050b.
	ProviderID string
}
// GPUType always returns the empty string for AWS node keys.
func (k *awsKey) GPUType() string {
	return ""
}
  313. func (k *awsKey) ID() string {
  314. provIdRx := regexp.MustCompile("aws:///([^/]+)/([^/]+)") // It's of the form aws:///us-east-2a/i-0fea4fd46592d050b and we want i-0fea4fd46592d050b, if it exists
  315. for matchNum, group := range provIdRx.FindStringSubmatch(k.ProviderID) {
  316. if matchNum == 2 {
  317. return group
  318. }
  319. }
  320. klog.V(3).Infof("Could not find instance ID in \"%s\"", k.ProviderID)
  321. return ""
  322. }
  323. func (k *awsKey) Features() string {
  324. instanceType := k.Labels[v1.LabelInstanceType]
  325. var operatingSystem string
  326. operatingSystem, ok := k.Labels[v1.LabelOSStable]
  327. if !ok {
  328. operatingSystem = k.Labels["beta.kubernetes.io/os"]
  329. }
  330. region := k.Labels[v1.LabelZoneRegion]
  331. key := region + "," + instanceType + "," + operatingSystem
  332. usageType := "preemptible"
  333. spotKey := key + "," + usageType
  334. if l, ok := k.Labels["lifecycle"]; ok && l == "EC2Spot" {
  335. return spotKey
  336. }
  337. if l, ok := k.Labels[k.SpotLabelName]; ok && l == k.SpotLabelValue {
  338. return spotKey
  339. }
  340. return key
  341. }
  342. func (aws *AWS) PVPricing(pvk PVKey) (*PV, error) {
  343. pricing, ok := aws.Pricing[pvk.Features()]
  344. if !ok {
  345. klog.V(2).Infof("Persistent Volume pricing not found for %s", pvk.Features())
  346. return &PV{}, nil
  347. }
  348. return pricing.PV, nil
  349. }
// awsPVKey is the PVKey built by AWS.GetPVKey for a persistent volume.
// Features derives the pricing key from Labels and StorageClassName.
type awsPVKey struct {
	Labels map[string]string
	StorageClassParameters map[string]string
	StorageClassName string
}
  355. func (aws *AWS) GetPVKey(pv *v1.PersistentVolume, parameters map[string]string) PVKey {
  356. return &awsPVKey{
  357. Labels: pv.Labels,
  358. StorageClassName: pv.Spec.StorageClassName,
  359. }
  360. }
  361. func (key *awsPVKey) Features() string {
  362. storageClass := key.StorageClassName
  363. if storageClass == "standard" {
  364. storageClass = "gp2"
  365. }
  366. // Storage class names are generally EBS volume types (gp2)
  367. // Keys in Pricing are based on UsageTypes (EBS:VolumeType.gp2)
  368. // Converts between the 2
  369. return key.Labels[v1.LabelZoneRegion] + "," + volTypes[storageClass]
  370. }
  371. // GetKey maps node labels to information needed to retrieve pricing data
  372. func (aws *AWS) GetKey(labels map[string]string) Key {
  373. return &awsKey{
  374. SpotLabelName: aws.SpotLabelName,
  375. SpotLabelValue: aws.SpotLabelValue,
  376. Labels: labels,
  377. ProviderID: labels["providerID"],
  378. }
  379. }
  380. func (aws *AWS) isPreemptible(key string) bool {
  381. s := strings.Split(key, ",")
  382. if len(s) == 4 && s[3] == "preemptible" {
  383. return true
  384. }
  385. return false
  386. }
  387. // DownloadPricingData fetches data from the AWS Pricing API
  388. func (aws *AWS) DownloadPricingData() error {
  389. aws.DownloadPricingDataLock.Lock()
  390. defer aws.DownloadPricingDataLock.Unlock()
  391. c, err := GetDefaultPricingData("aws.json")
  392. if err != nil {
  393. klog.V(1).Infof("Error downloading default pricing data: %s", err.Error())
  394. }
  395. aws.BaseCPUPrice = c.CPU
  396. aws.BaseRAMPrice = c.RAM
  397. aws.BaseGPUPrice = c.GPU
  398. aws.BaseSpotCPUPrice = c.SpotCPU
  399. aws.BaseSpotRAMPrice = c.SpotRAM
  400. aws.SpotLabelName = c.SpotLabel
  401. aws.SpotLabelValue = c.SpotLabelValue
  402. aws.SpotDataBucket = c.SpotDataBucket
  403. aws.SpotDataPrefix = c.SpotDataPrefix
  404. aws.ProjectID = c.ProjectID
  405. aws.SpotDataRegion = c.SpotDataRegion
  406. aws.ServiceKeyName = c.ServiceKeyName
  407. aws.ServiceKeySecret = c.ServiceKeySecret
  408. if len(aws.SpotDataBucket) != 0 && len(aws.ProjectID) == 0 {
  409. klog.V(1).Infof("using SpotDataBucket \"%s\" without ProjectID will not end well", aws.SpotDataBucket)
  410. }
  411. nodeList, err := aws.Clientset.CoreV1().Nodes().List(metav1.ListOptions{})
  412. if err != nil {
  413. return err
  414. }
  415. inputkeys := make(map[string]bool)
  416. for _, n := range nodeList.Items {
  417. labels := n.GetObjectMeta().GetLabels()
  418. key := aws.GetKey(labels)
  419. inputkeys[key.Features()] = true
  420. }
  421. pvList, err := aws.Clientset.CoreV1().PersistentVolumes().List(metav1.ListOptions{})
  422. if err != nil {
  423. return err
  424. }
  425. storageClasses, err := aws.Clientset.StorageV1().StorageClasses().List(metav1.ListOptions{})
  426. storageClassMap := make(map[string]map[string]string)
  427. for _, storageClass := range storageClasses.Items {
  428. params := storageClass.Parameters
  429. storageClassMap[storageClass.ObjectMeta.Name] = params
  430. }
  431. pvkeys := make(map[string]PVKey)
  432. for _, pv := range pvList.Items {
  433. params, ok := storageClassMap[pv.Spec.StorageClassName]
  434. if !ok {
  435. klog.V(2).Infof("Unable to find params for storageClassName %s, falling back to default pricing", pv.Name)
  436. continue
  437. }
  438. key := aws.GetPVKey(&pv, params)
  439. pvkeys[key.Features()] = key
  440. }
  441. aws.Pricing = make(map[string]*AWSProductTerms)
  442. aws.ValidPricingKeys = make(map[string]bool)
  443. skusToKeys := make(map[string]string)
  444. pricingURL := "https://pricing.us-east-1.amazonaws.com/offers/v1.0/aws/AmazonEC2/current/index.json"
  445. klog.V(2).Infof("starting download of \"%s\", which is quite large ...", pricingURL)
  446. resp, err := http.Get(pricingURL)
  447. if err != nil {
  448. klog.V(2).Infof("Bogus fetch of \"%s\": %v", pricingURL, err)
  449. return err
  450. }
  451. klog.V(2).Infof("Finished downloading \"%s\"", pricingURL)
  452. dec := json.NewDecoder(resp.Body)
  453. for {
  454. t, err := dec.Token()
  455. if err == io.EOF {
  456. klog.V(2).Infof("done loading \"%s\"\n", pricingURL)
  457. break
  458. }
  459. if t == "products" {
  460. _, err := dec.Token() // this should parse the opening "{""
  461. if err != nil {
  462. return err
  463. }
  464. for dec.More() {
  465. _, err := dec.Token() // the sku token
  466. if err != nil {
  467. return err
  468. }
  469. product := &AWSProduct{}
  470. err = dec.Decode(&product)
  471. if err != nil {
  472. klog.V(1).Infof("Error parsing response from \"%s\": %v", pricingURL, err.Error())
  473. break
  474. }
  475. if product.Attributes.PreInstalledSw == "NA" &&
  476. (strings.HasPrefix(product.Attributes.UsageType, "BoxUsage") || strings.Contains(product.Attributes.UsageType, "-BoxUsage")) {
  477. key := aws.KubeAttrConversion(product.Attributes.Location, product.Attributes.InstanceType, product.Attributes.OperatingSystem)
  478. spotKey := key + ",preemptible"
  479. if inputkeys[key] || inputkeys[spotKey] { // Just grab the sku even if spot, and change the price later.
  480. productTerms := &AWSProductTerms{
  481. Sku: product.Sku,
  482. Memory: product.Attributes.Memory,
  483. Storage: product.Attributes.Storage,
  484. VCpu: product.Attributes.VCpu,
  485. GPU: product.Attributes.GPU,
  486. }
  487. aws.Pricing[key] = productTerms
  488. aws.Pricing[spotKey] = productTerms
  489. skusToKeys[product.Sku] = key
  490. }
  491. aws.ValidPricingKeys[key] = true
  492. aws.ValidPricingKeys[spotKey] = true
  493. } else if strings.Contains(product.Attributes.UsageType, "EBS:Volume") {
  494. // UsageTypes may be prefixed with a region code - we're removing this when using
  495. // volTypes to keep lookups generic
  496. usageTypeRegx := regexp.MustCompile(".*(-|^)(EBS.+)")
  497. usageTypeMatch := usageTypeRegx.FindStringSubmatch(product.Attributes.UsageType)
  498. usageTypeNoRegion := usageTypeMatch[len(usageTypeMatch)-1]
  499. key := locationToRegion[product.Attributes.Location] + "," + usageTypeNoRegion
  500. spotKey := key + ",preemptible"
  501. pv := &PV{
  502. Class: volTypes[usageTypeNoRegion],
  503. Region: locationToRegion[product.Attributes.Location],
  504. }
  505. productTerms := &AWSProductTerms{
  506. Sku: product.Sku,
  507. PV: pv,
  508. }
  509. aws.Pricing[key] = productTerms
  510. aws.Pricing[spotKey] = productTerms
  511. skusToKeys[product.Sku] = key
  512. aws.ValidPricingKeys[key] = true
  513. aws.ValidPricingKeys[spotKey] = true
  514. }
  515. }
  516. }
  517. if t == "terms" {
  518. _, err := dec.Token() // this should parse the opening "{""
  519. if err != nil {
  520. return err
  521. }
  522. termType, err := dec.Token()
  523. if err != nil {
  524. return err
  525. }
  526. if termType == "OnDemand" {
  527. _, err := dec.Token()
  528. if err != nil { // again, should parse an opening "{"
  529. return err
  530. }
  531. for dec.More() {
  532. sku, err := dec.Token()
  533. if err != nil {
  534. return err
  535. }
  536. _, err = dec.Token() // another opening "{"
  537. if err != nil {
  538. return err
  539. }
  540. skuOnDemand, err := dec.Token()
  541. if err != nil {
  542. return err
  543. }
  544. offerTerm := &AWSOfferTerm{}
  545. err = dec.Decode(&offerTerm)
  546. if err != nil {
  547. klog.V(1).Infof("Error decoding AWS Offer Term: " + err.Error())
  548. }
  549. if sku.(string)+OnDemandRateCode == skuOnDemand {
  550. key, ok := skusToKeys[sku.(string)]
  551. spotKey := key + ",preemptible"
  552. if ok {
  553. aws.Pricing[key].OnDemand = offerTerm
  554. aws.Pricing[spotKey].OnDemand = offerTerm
  555. if strings.Contains(key, "EBS:VolumeP-IOPS.piops") {
  556. // If the specific UsageType is the per IO cost used on io1 volumes
  557. // we need to add the per IO cost to the io1 PV cost
  558. cost := offerTerm.PriceDimensions[sku.(string)+OnDemandRateCode+HourlyRateCode].PricePerUnit.USD
  559. // Add the per IO cost to the PV object for the io1 volume type
  560. aws.Pricing[key].PV.CostPerIO = cost
  561. } else if strings.Contains(key, "EBS:Volume") {
  562. // If volume, we need to get hourly cost and add it to the PV object
  563. cost := offerTerm.PriceDimensions[sku.(string)+OnDemandRateCode+HourlyRateCode].PricePerUnit.USD
  564. costFloat, _ := strconv.ParseFloat(cost, 64)
  565. hourlyPrice := costFloat / 730
  566. aws.Pricing[key].PV.Cost = strconv.FormatFloat(hourlyPrice, 'f', -1, 64)
  567. }
  568. }
  569. }
  570. _, err = dec.Token()
  571. if err != nil {
  572. return err
  573. }
  574. }
  575. _, err = dec.Token()
  576. if err != nil {
  577. return err
  578. }
  579. }
  580. }
  581. }
  582. sp, err := parseSpotData(aws.SpotDataBucket, aws.SpotDataPrefix, aws.ProjectID, aws.SpotDataRegion, aws.ServiceKeyName, aws.ServiceKeySecret)
  583. if err != nil {
  584. klog.V(1).Infof("Skipping AWS spot data download: %s", err.Error())
  585. } else {
  586. aws.SpotPricingByInstanceID = sp
  587. }
  588. return nil
  589. }
// AllNodePricing returns all the billing data fetched.
// The Pricing map itself is returned (not a copy) after the read lock is
// released; the returned error is always nil.
func (aws *AWS) AllNodePricing() (interface{}, error) {
	aws.DownloadPricingDataLock.RLock()
	defer aws.DownloadPricingDataLock.RUnlock()
	return aws.Pricing, nil
}
  596. func (aws *AWS) createNode(terms *AWSProductTerms, usageType string, k Key) (*Node, error) {
  597. key := k.Features()
  598. if aws.isPreemptible(key) {
  599. if spotInfo, ok := aws.SpotPricingByInstanceID[k.ID()]; ok { // try and match directly to an ID for pricing. We'll still need the features
  600. var spotcost string
  601. arr := strings.Split(spotInfo.Charge, " ")
  602. if len(arr) == 2 {
  603. spotcost = arr[0]
  604. } else {
  605. klog.V(2).Infof("Spot data for node %s is missing", k.ID())
  606. }
  607. klog.V(1).Infof("SPOT COST FOR %s: %s", k.Features, spotcost)
  608. return &Node{
  609. Cost: spotcost,
  610. VCPU: terms.VCpu,
  611. RAM: terms.Memory,
  612. GPU: terms.GPU,
  613. Storage: terms.Storage,
  614. BaseCPUPrice: aws.BaseCPUPrice,
  615. BaseRAMPrice: aws.BaseRAMPrice,
  616. BaseGPUPrice: aws.BaseGPUPrice,
  617. UsageType: usageType,
  618. }, nil
  619. }
  620. return &Node{
  621. VCPU: terms.VCpu,
  622. VCPUCost: aws.BaseSpotCPUPrice,
  623. RAM: terms.Memory,
  624. GPU: terms.GPU,
  625. RAMCost: aws.BaseSpotRAMPrice,
  626. Storage: terms.Storage,
  627. BaseCPUPrice: aws.BaseCPUPrice,
  628. BaseRAMPrice: aws.BaseRAMPrice,
  629. BaseGPUPrice: aws.BaseGPUPrice,
  630. UsageType: usageType,
  631. }, nil
  632. }
  633. c, ok := terms.OnDemand.PriceDimensions[terms.Sku+OnDemandRateCode+HourlyRateCode]
  634. if !ok {
  635. return nil, fmt.Errorf("Could not fetch data for \"%s\"", k.ID())
  636. }
  637. cost := c.PricePerUnit.USD
  638. return &Node{
  639. Cost: cost,
  640. VCPU: terms.VCpu,
  641. RAM: terms.Memory,
  642. GPU: terms.GPU,
  643. Storage: terms.Storage,
  644. BaseCPUPrice: aws.BaseCPUPrice,
  645. BaseRAMPrice: aws.BaseRAMPrice,
  646. BaseGPUPrice: aws.BaseGPUPrice,
  647. UsageType: usageType,
  648. }, nil
  649. }
  650. // NodePricing takes in a key from GetKey and returns a Node object for use in building the cost model.
  651. func (aws *AWS) NodePricing(k Key) (*Node, error) {
  652. aws.DownloadPricingDataLock.RLock()
  653. defer aws.DownloadPricingDataLock.RUnlock()
  654. key := k.Features()
  655. usageType := "ondemand"
  656. if aws.isPreemptible(key) {
  657. usageType = "preemptible"
  658. }
  659. terms, ok := aws.Pricing[key]
  660. if ok {
  661. return aws.createNode(terms, usageType, k)
  662. } else if _, ok := aws.ValidPricingKeys[key]; ok {
  663. aws.DownloadPricingDataLock.RUnlock()
  664. err := aws.DownloadPricingData()
  665. aws.DownloadPricingDataLock.RLock()
  666. if err != nil {
  667. return nil, err
  668. }
  669. terms, termsOk := aws.Pricing[key]
  670. if !termsOk {
  671. return nil, fmt.Errorf("Unable to find any Pricing data for \"%s\"", key)
  672. }
  673. return aws.createNode(terms, usageType, k)
  674. } else { // Fall back to base pricing if we can't find the key.
  675. klog.V(1).Infof("Invalid Pricing Key \"%s\"", key)
  676. return &Node{
  677. Cost: aws.BaseCPUPrice,
  678. BaseCPUPrice: aws.BaseCPUPrice,
  679. BaseRAMPrice: aws.BaseRAMPrice,
  680. BaseGPUPrice: aws.BaseGPUPrice,
  681. UsageType: usageType,
  682. UsesBaseCPUPrice: true,
  683. }, nil
  684. }
  685. }
  686. // ClusterInfo returns an object that represents the cluster. TODO: actually return the name of the cluster. Blocked on cluster federation.
  687. func (awsProvider *AWS) ClusterInfo() (map[string]string, error) {
  688. defaultClusterName := "AWS Cluster #1"
  689. makeStructure := func(clusterName string) (map[string]string, error) {
  690. klog.V(2).Infof("Returning \"%s\" as ClusterName", clusterName)
  691. m := make(map[string]string)
  692. m["name"] = clusterName
  693. m["provider"] = "AWS"
  694. return m, nil
  695. }
  696. maybeClusterId := os.Getenv(ClusterIdEnvVar)
  697. if len(maybeClusterId) != 0 {
  698. return makeStructure(maybeClusterId)
  699. }
  700. provIdRx := regexp.MustCompile("aws:///([^/]+)/([^/]+)")
  701. clusterIdRx := regexp.MustCompile("^kubernetes\\.io/cluster/([^/]+)")
  702. nodeList, err := awsProvider.Clientset.CoreV1().Nodes().List(metav1.ListOptions{})
  703. if err != nil {
  704. return nil, err
  705. }
  706. for _, n := range nodeList.Items {
  707. region := ""
  708. instanceId := ""
  709. providerId := n.Spec.ProviderID
  710. for matchNum, group := range provIdRx.FindStringSubmatch(providerId) {
  711. if matchNum == 1 {
  712. region = group
  713. } else if matchNum == 2 {
  714. instanceId = group
  715. }
  716. }
  717. if len(instanceId) == 0 {
  718. klog.V(2).Infof("Unable to decode Node.ProviderID \"%s\", skipping it", providerId)
  719. continue
  720. }
  721. c := &aws.Config{
  722. Region: aws.String(region),
  723. }
  724. s := session.Must(session.NewSession(c))
  725. ec2Svc := ec2.New(s)
  726. di, diErr := ec2Svc.DescribeInstances(&ec2.DescribeInstancesInput{
  727. InstanceIds: []*string{
  728. aws.String(instanceId),
  729. },
  730. })
  731. if diErr != nil {
  732. // maybe log this?
  733. continue
  734. }
  735. if len(di.Reservations) != 1 {
  736. klog.V(2).Infof("Expected 1 Reservation back from DescribeInstances(%s), received %d", instanceId, len(di.Reservations))
  737. continue
  738. }
  739. res := di.Reservations[0]
  740. if len(res.Instances) != 1 {
  741. klog.V(2).Infof("Expected 1 Instance back from DescribeInstances(%s), received %d", instanceId, len(res.Instances))
  742. continue
  743. }
  744. inst := res.Instances[0]
  745. for _, tag := range inst.Tags {
  746. tagKey := *tag.Key
  747. for matchNum, group := range clusterIdRx.FindStringSubmatch(tagKey) {
  748. if matchNum != 1 {
  749. continue
  750. }
  751. return makeStructure(group)
  752. }
  753. }
  754. }
  755. klog.V(2).Infof("Unable to sniff out cluster ID, perhaps set $%s to force one", ClusterIdEnvVar)
  756. return makeStructure(defaultClusterName)
  757. }
  758. // AddServiceKey adds an AWS service key, useful for pulling down out-of-cluster costs. Optional-- the container this runs in can be directly authorized.
  759. func (*AWS) AddServiceKey(formValues url.Values) error {
  760. keyID := formValues.Get("access_key_ID")
  761. key := formValues.Get("secret_access_key")
  762. m := make(map[string]string)
  763. m["access_key_ID"] = keyID
  764. m["secret_access_key"] = key
  765. result, err := json.Marshal(m)
  766. if err != nil {
  767. return err
  768. }
  769. return ioutil.WriteFile("/var/configs/key.json", result, 0644)
  770. }
  771. // GetDisks returns the AWS disks backing PVs. Useful because sometimes k8s will not clean up PVs correctly. Requires a json config in /var/configs with key region.
  772. func (*AWS) GetDisks() ([]byte, error) {
  773. jsonFile, err := os.Open("/var/configs/key.json")
  774. if err == nil {
  775. byteValue, _ := ioutil.ReadAll(jsonFile)
  776. var result map[string]string
  777. err := json.Unmarshal([]byte(byteValue), &result)
  778. if err != nil {
  779. return nil, err
  780. }
  781. err = os.Setenv(awsAccessKeyIDEnvVar, result["access_key_ID"])
  782. if err != nil {
  783. return nil, err
  784. }
  785. err = os.Setenv(awsAccessKeySecretEnvVar, result["secret_access_key"])
  786. if err != nil {
  787. return nil, err
  788. }
  789. } else if os.IsNotExist(err) {
  790. klog.V(2).Infof("Using Default Credentials")
  791. } else {
  792. return nil, err
  793. }
  794. defer jsonFile.Close()
  795. clusterConfig, err := os.Open("/var/configs/cluster.json")
  796. if err != nil {
  797. return nil, err
  798. }
  799. defer clusterConfig.Close()
  800. b, err := ioutil.ReadAll(clusterConfig)
  801. if err != nil {
  802. return nil, err
  803. }
  804. var clusterConf map[string]string
  805. err = json.Unmarshal([]byte(b), &clusterConf)
  806. if err != nil {
  807. return nil, err
  808. }
  809. region := aws.String(clusterConf["region"])
  810. c := &aws.Config{
  811. Region: region,
  812. }
  813. s := session.Must(session.NewSession(c))
  814. ec2Svc := ec2.New(s)
  815. input := &ec2.DescribeVolumesInput{}
  816. volumeResult, err := ec2Svc.DescribeVolumes(input)
  817. if err != nil {
  818. if aerr, ok := err.(awserr.Error); ok {
  819. switch aerr.Code() {
  820. default:
  821. return nil, aerr
  822. }
  823. } else {
  824. return nil, err
  825. }
  826. }
  827. return json.Marshal(volumeResult)
  828. }
  829. // ConvertToGlueColumnFormat takes a string and runs through various regex
  830. // and string replacement statements to convert it to a format compatible
  831. // with AWS Glue and Athena column names.
  832. // Following guidance from AWS provided here ('Column Names' section):
  833. // https://docs.aws.amazon.com/awsaccountbilling/latest/aboutv2/run-athena-sql.html
  834. // It returns a string containing the column name in proper column name format and length.
  835. func ConvertToGlueColumnFormat(column_name string) string {
  836. klog.V(5).Infof("Converting string \"%s\" to proper AWS Glue column name.", column_name)
  837. // An underscore is added in front of uppercase letters
  838. capital_underscore := regexp.MustCompile(`[A-Z]`)
  839. final := capital_underscore.ReplaceAllString(column_name, `_$0`)
  840. // Any non-alphanumeric characters are replaced with an underscore
  841. no_space_punc := regexp.MustCompile(`[\s]{1,}|[^A-Za-z0-9]`)
  842. final = no_space_punc.ReplaceAllString(final, "_")
  843. // Duplicate underscores are removed
  844. no_dup_underscore := regexp.MustCompile(`_{2,}`)
  845. final = no_dup_underscore.ReplaceAllString(final, "_")
  846. // Any leading and trailing underscores are removed
  847. no_front_end_underscore := regexp.MustCompile(`(^\_|\_$)`)
  848. final = no_front_end_underscore.ReplaceAllString(final, "")
  849. // Uppercase to lowercase
  850. final = strings.ToLower(final)
  851. // Longer column name than expected - remove _ left to right
  852. allowed_col_len := 128
  853. undersc_to_remove := len(final) - allowed_col_len
  854. if undersc_to_remove > 0 {
  855. final = strings.Replace(final, "_", "", undersc_to_remove)
  856. }
  857. // If removing all of the underscores still didn't
  858. // make the column name < 128 characters, trim it!
  859. if len(final) > allowed_col_len {
  860. final = final[:allowed_col_len]
  861. }
  862. klog.V(5).Infof("Column name being returned: \"%s\". Length: \"%d\".", final, len(final))
  863. return final
  864. }
  865. // ExternalAllocations represents tagged assets outside the scope of kubernetes.
  866. // "start" and "end" are dates of the format YYYY-MM-DD
  867. // "aggregator" is the tag used to determine how to allocate those assets, ie namespace, pod, etc.
  868. func (a *AWS) ExternalAllocations(start string, end string, aggregator string) ([]*OutOfClusterAllocation, error) {
  869. customPricing, err := a.GetConfig()
  870. if err != nil {
  871. return nil, err
  872. }
  873. aggregator_column_name := "resource_tags_user_kubernetes_" + aggregator
  874. aggregator_column_name = ConvertToGlueColumnFormat(aggregator_column_name)
  875. query := fmt.Sprintf(`SELECT
  876. CAST(line_item_usage_start_date AS DATE) as start_date,
  877. %s,
  878. line_item_product_code,
  879. SUM(line_item_blended_cost) as blended_cost
  880. FROM %s as cost_data
  881. WHERE line_item_usage_start_date BETWEEN date '%s' AND date '%s'
  882. GROUP BY 1,2,3`, aggregator_column_name, customPricing.AthenaTable, start, end)
  883. if customPricing.ServiceKeyName != "" {
  884. err = os.Setenv(awsAccessKeyIDEnvVar, customPricing.ServiceKeyName)
  885. if err != nil {
  886. return nil, err
  887. }
  888. err = os.Setenv(awsAccessKeySecretEnvVar, customPricing.ServiceKeySecret)
  889. if err != nil {
  890. return nil, err
  891. }
  892. }
  893. region := aws.String(customPricing.AthenaRegion)
  894. resultsBucket := customPricing.AthenaBucketName
  895. database := customPricing.AthenaDatabase
  896. c := &aws.Config{
  897. Region: region,
  898. }
  899. s := session.Must(session.NewSession(c))
  900. svc := athena.New(s)
  901. var e athena.StartQueryExecutionInput
  902. var r athena.ResultConfiguration
  903. r.SetOutputLocation(resultsBucket)
  904. e.SetResultConfiguration(&r)
  905. e.SetQueryString(query)
  906. var q athena.QueryExecutionContext
  907. q.SetDatabase(database)
  908. e.SetQueryExecutionContext(&q)
  909. res, err := svc.StartQueryExecution(&e)
  910. if err != nil {
  911. return nil, err
  912. }
  913. klog.V(2).Infof("StartQueryExecution result:")
  914. klog.V(2).Infof(res.GoString())
  915. var qri athena.GetQueryExecutionInput
  916. qri.SetQueryExecutionId(*res.QueryExecutionId)
  917. var qrop *athena.GetQueryExecutionOutput
  918. duration := time.Duration(2) * time.Second // Pause for 2 seconds
  919. for {
  920. qrop, err = svc.GetQueryExecution(&qri)
  921. if err != nil {
  922. return nil, err
  923. }
  924. if *qrop.QueryExecution.Status.State != "RUNNING" {
  925. break
  926. }
  927. time.Sleep(duration)
  928. }
  929. var oocAllocs []*OutOfClusterAllocation
  930. if *qrop.QueryExecution.Status.State == "SUCCEEDED" {
  931. var ip athena.GetQueryResultsInput
  932. ip.SetQueryExecutionId(*res.QueryExecutionId)
  933. op, err := svc.GetQueryResults(&ip)
  934. if err != nil {
  935. return nil, err
  936. }
  937. for _, r := range op.ResultSet.Rows[1:(len(op.ResultSet.Rows) - 1)] {
  938. cost, err := strconv.ParseFloat(*r.Data[3].VarCharValue, 64)
  939. if err != nil {
  940. return nil, err
  941. }
  942. ooc := &OutOfClusterAllocation{
  943. Aggregator: aggregator,
  944. Environment: *r.Data[1].VarCharValue,
  945. Service: *r.Data[2].VarCharValue,
  946. Cost: cost,
  947. }
  948. oocAllocs = append(oocAllocs, ooc)
  949. }
  950. }
  951. return oocAllocs, nil // TODO: transform the QuerySQL lines into the new OutOfClusterAllocation Struct
  952. }
  953. // QuerySQL can query a properly configured Athena database.
  954. // Used to fetch billing data.
  955. // Requires a json config in /var/configs with key region, output, and database.
  956. func (a *AWS) QuerySQL(query string) ([]byte, error) {
  957. customPricing, err := a.GetConfig()
  958. if err != nil {
  959. return nil, err
  960. }
  961. if customPricing.ServiceKeyName != "" {
  962. err = os.Setenv(awsAccessKeyIDEnvVar, customPricing.ServiceKeyName)
  963. if err != nil {
  964. return nil, err
  965. }
  966. err = os.Setenv(awsAccessKeySecretEnvVar, customPricing.ServiceKeySecret)
  967. if err != nil {
  968. return nil, err
  969. }
  970. }
  971. athenaConfigs, err := os.Open("/var/configs/athena.json")
  972. if err != nil {
  973. return nil, err
  974. }
  975. defer athenaConfigs.Close()
  976. b, err := ioutil.ReadAll(athenaConfigs)
  977. if err != nil {
  978. return nil, err
  979. }
  980. var athenaConf map[string]string
  981. json.Unmarshal([]byte(b), &athenaConf)
  982. region := aws.String(customPricing.AthenaRegion)
  983. resultsBucket := customPricing.AthenaBucketName
  984. database := customPricing.AthenaDatabase
  985. c := &aws.Config{
  986. Region: region,
  987. }
  988. s := session.Must(session.NewSession(c))
  989. svc := athena.New(s)
  990. var e athena.StartQueryExecutionInput
  991. var r athena.ResultConfiguration
  992. r.SetOutputLocation(resultsBucket)
  993. e.SetResultConfiguration(&r)
  994. e.SetQueryString(query)
  995. var q athena.QueryExecutionContext
  996. q.SetDatabase(database)
  997. e.SetQueryExecutionContext(&q)
  998. res, err := svc.StartQueryExecution(&e)
  999. if err != nil {
  1000. return nil, err
  1001. }
  1002. klog.V(2).Infof("StartQueryExecution result:")
  1003. klog.V(2).Infof(res.GoString())
  1004. var qri athena.GetQueryExecutionInput
  1005. qri.SetQueryExecutionId(*res.QueryExecutionId)
  1006. var qrop *athena.GetQueryExecutionOutput
  1007. duration := time.Duration(2) * time.Second // Pause for 2 seconds
  1008. for {
  1009. qrop, err = svc.GetQueryExecution(&qri)
  1010. if err != nil {
  1011. return nil, err
  1012. }
  1013. if *qrop.QueryExecution.Status.State != "RUNNING" {
  1014. break
  1015. }
  1016. time.Sleep(duration)
  1017. }
  1018. if *qrop.QueryExecution.Status.State == "SUCCEEDED" {
  1019. var ip athena.GetQueryResultsInput
  1020. ip.SetQueryExecutionId(*res.QueryExecutionId)
  1021. op, err := svc.GetQueryResults(&ip)
  1022. if err != nil {
  1023. return nil, err
  1024. }
  1025. b, err := json.Marshal(op.ResultSet)
  1026. if err != nil {
  1027. return nil, err
  1028. }
  1029. return b, nil
  1030. }
  1031. return nil, fmt.Errorf("Error getting query results : %s", *qrop.QueryExecution.Status.State)
  1032. }
  1033. type spotInfo struct {
  1034. Timestamp string `csv:"Timestamp"`
  1035. UsageType string `csv:"UsageType"`
  1036. Operation string `csv:"Operation"`
  1037. InstanceID string `csv:"InstanceID"`
  1038. MyBidID string `csv:"MyBidID"`
  1039. MyMaxPrice string `csv:"MyMaxPrice"`
  1040. MarketPrice string `csv:"MarketPrice"`
  1041. Charge string `csv:"Charge"`
  1042. Version string `csv:"Version"`
  1043. }
  1044. type fnames []*string
  1045. func (f fnames) Len() int {
  1046. return len(f)
  1047. }
  1048. func (f fnames) Swap(i, j int) {
  1049. f[i], f[j] = f[j], f[i]
  1050. }
  1051. func (f fnames) Less(i, j int) bool {
  1052. key1 := strings.Split(*f[i], ".")
  1053. key2 := strings.Split(*f[j], ".")
  1054. t1, err := time.Parse("2006-01-02-15", key1[1])
  1055. if err != nil {
  1056. klog.V(1).Info("Unable to parse timestamp" + key1[1])
  1057. return false
  1058. }
  1059. t2, err := time.Parse("2006-01-02-15", key2[1])
  1060. if err != nil {
  1061. klog.V(1).Info("Unable to parse timestamp" + key2[1])
  1062. return false
  1063. }
  1064. return t1.Before(t2)
  1065. }
  1066. func parseSpotData(bucket string, prefix string, projectID string, region string, accessKeyID string, accessKeySecret string) (map[string]*spotInfo, error) {
  1067. if accessKeyID != "" && accessKeySecret != "" { // credentials may exist on the actual AWS node-- if so, use those. If not, override with the service key
  1068. err := os.Setenv(awsAccessKeyIDEnvVar, accessKeyID)
  1069. if err != nil {
  1070. return nil, err
  1071. }
  1072. err = os.Setenv(awsAccessKeySecretEnvVar, accessKeySecret)
  1073. if err != nil {
  1074. return nil, err
  1075. }
  1076. }
  1077. s3Prefix := projectID
  1078. if len(prefix) != 0 {
  1079. s3Prefix = prefix + "/" + s3Prefix
  1080. }
  1081. c := aws.NewConfig().WithRegion(region)
  1082. s := session.Must(session.NewSession(c))
  1083. s3Svc := s3.New(s)
  1084. downloader := s3manager.NewDownloaderWithClient(s3Svc)
  1085. tNow := time.Now()
  1086. tOneDayAgo := tNow.Add(time.Duration(-24) * time.Hour) // Also get files from one day ago to avoid boundary conditions
  1087. ls := &s3.ListObjectsInput{
  1088. Bucket: aws.String(bucket),
  1089. Prefix: aws.String(s3Prefix + "." + tOneDayAgo.Format("2006-01-02")),
  1090. }
  1091. ls2 := &s3.ListObjectsInput{
  1092. Bucket: aws.String(bucket),
  1093. Prefix: aws.String(s3Prefix + "." + tNow.Format("2006-01-02")),
  1094. }
  1095. lso, err := s3Svc.ListObjects(ls)
  1096. if err != nil {
  1097. return nil, err
  1098. }
  1099. lsoLen := len(lso.Contents)
  1100. klog.V(2).Infof("Found %d spot data files from yesterday", lsoLen)
  1101. if lsoLen == 0 {
  1102. klog.V(5).Infof("ListObjects \"s3://%s/%s\" produced no keys", *ls.Bucket, *ls.Prefix)
  1103. }
  1104. lso2, err := s3Svc.ListObjects(ls2)
  1105. if err != nil {
  1106. return nil, err
  1107. }
  1108. lso2Len := len(lso2.Contents)
  1109. klog.V(2).Infof("Found %d spot data files from today", lso2Len)
  1110. if lso2Len == 0 {
  1111. klog.V(5).Infof("ListObjects \"s3://%s/%s\" produced no keys", *ls2.Bucket, *ls2.Prefix)
  1112. }
  1113. var keys []*string
  1114. for _, obj := range lso.Contents {
  1115. keys = append(keys, obj.Key)
  1116. }
  1117. for _, obj := range lso2.Contents {
  1118. keys = append(keys, obj.Key)
  1119. }
  1120. versionRx := regexp.MustCompile("^#Version: (\\d+)\\.\\d+$")
  1121. header, err := csvutil.Header(spotInfo{}, "csv")
  1122. if err != nil {
  1123. return nil, err
  1124. }
  1125. fieldsPerRecord := len(header)
  1126. spots := make(map[string]*spotInfo)
  1127. for _, key := range keys {
  1128. getObj := &s3.GetObjectInput{
  1129. Bucket: aws.String(bucket),
  1130. Key: key,
  1131. }
  1132. buf := aws.NewWriteAtBuffer([]byte{})
  1133. _, err := downloader.Download(buf, getObj)
  1134. if err != nil {
  1135. return nil, err
  1136. }
  1137. r := bytes.NewReader(buf.Bytes())
  1138. gr, err := gzip.NewReader(r)
  1139. if err != nil {
  1140. return nil, err
  1141. }
  1142. csvReader := csv.NewReader(gr)
  1143. csvReader.Comma = '\t'
  1144. csvReader.FieldsPerRecord = fieldsPerRecord
  1145. dec, err := csvutil.NewDecoder(csvReader, header...)
  1146. if err != nil {
  1147. return nil, err
  1148. }
  1149. var foundVersion string
  1150. for {
  1151. spot := spotInfo{}
  1152. err := dec.Decode(&spot)
  1153. csvParseErr, isCsvParseErr := err.(*csv.ParseError)
  1154. if err == io.EOF {
  1155. break
  1156. } else if err == csvutil.ErrFieldCount || (isCsvParseErr && csvParseErr.Err == csv.ErrFieldCount) {
  1157. rec := dec.Record()
  1158. // the first two "Record()" will be the comment lines
  1159. // and they show up as len() == 1
  1160. // the first of which is "#Version"
  1161. // the second of which is "#Fields: "
  1162. if len(rec) != 1 {
  1163. klog.V(2).Infof("Expected %d spot info fields but received %d: %s", fieldsPerRecord, len(rec), rec)
  1164. continue
  1165. }
  1166. if len(foundVersion) == 0 {
  1167. spotFeedVersion := rec[0]
  1168. klog.V(3).Infof("Spot feed version is \"%s\"", spotFeedVersion)
  1169. matches := versionRx.FindStringSubmatch(spotFeedVersion)
  1170. if matches != nil {
  1171. foundVersion = matches[1]
  1172. if foundVersion != supportedSpotFeedVersion {
  1173. klog.V(2).Infof("Unsupported spot info feed version: wanted \"%s\" got \"%s\"", supportedSpotFeedVersion, foundVersion)
  1174. break
  1175. }
  1176. }
  1177. continue
  1178. } else if strings.Index(rec[0], "#") == 0 {
  1179. continue
  1180. } else {
  1181. klog.V(3).Infof("skipping non-TSV line: %s", rec)
  1182. continue
  1183. }
  1184. } else if err != nil {
  1185. klog.V(2).Infof("Error during spot info decode: %+v", err)
  1186. continue
  1187. }
  1188. klog.V(3).Infof("Found spot info %+v", spot)
  1189. spots[spot.InstanceID] = &spot
  1190. }
  1191. gr.Close()
  1192. }
  1193. return spots, nil
  1194. }