Skip to content

Commit

Permalink
add: Scaleway Cloud Provider for k8s CA
Browse files Browse the repository at this point in the history
  • Loading branch information
louisportay committed Jul 29, 2022
1 parent 7eec219 commit 5323047
Show file tree
Hide file tree
Showing 10 changed files with 1,502 additions and 2 deletions.
1 change: 1 addition & 0 deletions cluster-autoscaler/README.md
Original file line number Diff line number Diff line change
Expand Up @@ -32,6 +32,7 @@ You should also take a look at the notes and "gotchas" for your specific cloud p
* [BizflyCloud](./cloudprovider/bizflycloud/README.md)
* [Vultr](./cloudprovider/vultr/README.md)
* [TencentCloud](./cloudprovider/tencentcloud/README.md)
* [Scaleway](./cloudprovider/scaleway/README.md)

# Releases

Expand Down
8 changes: 6 additions & 2 deletions cluster-autoscaler/cloudprovider/builder/builder_all.go
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
//go:build !gce && !aws && !azure && !kubemark && !alicloud && !magnum && !digitalocean && !clusterapi && !huaweicloud && !ionoscloud && !linode && !hetzner && !bizflycloud && !brightbox && !packet && !oci && !vultr && !tencentcloud && !externalgrpc
// +build !gce,!aws,!azure,!kubemark,!alicloud,!magnum,!digitalocean,!clusterapi,!huaweicloud,!ionoscloud,!linode,!hetzner,!bizflycloud,!brightbox,!packet,!oci,!vultr,!tencentcloud,!externalgrpc
//go:build !gce && !aws && !azure && !kubemark && !alicloud && !magnum && !digitalocean && !clusterapi && !huaweicloud && !ionoscloud && !linode && !hetzner && !bizflycloud && !brightbox && !packet && !oci && !vultr && !tencentcloud && !scaleway && !externalgrpc
// +build !gce,!aws,!azure,!kubemark,!alicloud,!magnum,!digitalocean,!clusterapi,!huaweicloud,!ionoscloud,!linode,!hetzner,!bizflycloud,!brightbox,!packet,!oci,!vultr,!tencentcloud,!scaleway,!externalgrpc

/*
Copyright 2018 The Kubernetes Authors.
Expand Down Expand Up @@ -42,6 +42,7 @@ import (
"k8s.io/autoscaler/cluster-autoscaler/cloudprovider/oci"
"k8s.io/autoscaler/cluster-autoscaler/cloudprovider/ovhcloud"
"k8s.io/autoscaler/cluster-autoscaler/cloudprovider/packet"
"k8s.io/autoscaler/cluster-autoscaler/cloudprovider/scaleway"
"k8s.io/autoscaler/cluster-autoscaler/cloudprovider/tencentcloud"
"k8s.io/autoscaler/cluster-autoscaler/cloudprovider/vultr"
"k8s.io/autoscaler/cluster-autoscaler/config"
Expand Down Expand Up @@ -72,6 +73,7 @@ var AvailableCloudProviders = []string{
cloudprovider.PacketProviderName,
cloudprovider.VultrProviderName,
cloudprovider.TencentcloudProviderName,
cloudprovider.ScalewayProviderName,
}

// DefaultCloudProvider is GCE.
Expand Down Expand Up @@ -125,6 +127,8 @@ func buildCloudProvider(opts config.AutoscalingOptions, do cloudprovider.NodeGro
return vultr.BuildVultr(opts, do, rl)
case cloudprovider.TencentcloudProviderName:
return tencentcloud.BuildTencentcloud(opts, do, rl)
case cloudprovider.ScalewayProviderName:
return scaleway.BuildScaleway(opts, do, rl)
}
return nil
}
43 changes: 43 additions & 0 deletions cluster-autoscaler/cloudprovider/builder/builder_scaleway.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,43 @@
//go:build scaleway
// +build scaleway

/*
Copyright 2022 The Kubernetes Authors.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/

package builder

import (
"k8s.io/autoscaler/cluster-autoscaler/cloudprovider"
"k8s.io/autoscaler/cluster-autoscaler/cloudprovider/scaleway"
"k8s.io/autoscaler/cluster-autoscaler/config"
)

// AvailableCloudProviders supported by the scaleway cloud provider builder.
var AvailableCloudProviders = []string{
cloudprovider.ScalewayProviderName,
}

// DefaultCloudProvider for do-only build is Scaleway.
const DefaultCloudProvider = cloudprovider.ScalewayProviderName

func buildCloudProvider(opts config.AutoscalingOptions, do cloudprovider.NodeGroupDiscoveryOptions, rl *cloudprovider.ResourceLimiter) cloudprovider.CloudProvider {
switch opts.CloudProviderName {
case cloudprovider.ScalewayProviderName:
return scaleway.BuildScaleway(opts, do, rl)
}

return nil
}
2 changes: 2 additions & 0 deletions cluster-autoscaler/cloudprovider/cloud_provider.go
Original file line number Diff line number Diff line change
Expand Up @@ -68,6 +68,8 @@ const (
OVHcloudProviderName = "ovhcloud"
// LinodeProviderName gets the provider name of linode
LinodeProviderName = "linode"
// ScalewayProviderName gets the provider name of scaleway
ScalewayProviderName = "scaleway"
// VultrProviderName gets the provider name of vultr
VultrProviderName = "vultr"
// PacketProviderName gets the provider name of packet
Expand Down
29 changes: 29 additions & 0 deletions cluster-autoscaler/cloudprovider/scaleway/README.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,29 @@
# Cluster Autoscaler for Scaleway

The Scaleway Cloud Provider implementation scales nodes on different pools
attached to a Kapsule cluster. It can be configured from Scaleway Kapsule API.
The cluster pools need to have the option `Autoscaling` set to true to be managed by the autoscaler.

## Configuration

Cluster Autoscaler can be configured with 2 options
### Config file
a config file can be passed with the `--cloud-config` flag.
here is the corresponding JSON schema:
* `cluster_id`: Kapsule Cluster Id
* `secret_key`: Secret Key used to manage associated Kapsule resources
* `region`: Region where the control-plane is runnning
* `api_url`: URL to contact Scaleway, defaults to `api.scaleway.com`

### Env variables

The values expected by the autoscaler are the same as above

- `CLUSTER_ID`
- `SCW_SECRET_KEY`
- `SCW_REGION`
- `SCW_API_URL`

## Notes

k8s nodes are identified through `node.Spec.ProviderId`, the scaleway node name or id MUST NOT be used.
265 changes: 265 additions & 0 deletions cluster-autoscaler/cloudprovider/scaleway/scaleway_cloud_provider.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,265 @@
/*
Copyright 2022 The Kubernetes Authors.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/

package scaleway

import (
"context"
"encoding/json"
"fmt"
"io"
"io/ioutil"
"math"
"os"
"time"

apiv1 "k8s.io/api/core/v1"
"k8s.io/apimachinery/pkg/api/resource"
"k8s.io/autoscaler/cluster-autoscaler/cloudprovider"
"k8s.io/autoscaler/cluster-autoscaler/cloudprovider/scaleway/scalewaygo"
"k8s.io/autoscaler/cluster-autoscaler/config"
ca_errors "k8s.io/autoscaler/cluster-autoscaler/utils/errors"
"k8s.io/klog/v2"
)

const (
// GPULabel is the label added to GPU nodes
GPULabel = "k8s.scaleway.com/gpu"
)

type scalewayCloudProvider struct {
// client talks to Kapsule API
client scalewaygo.Client
// ClusterID is the cluster id where the Autoscaler is running.
clusterID string
// nodeGroups is an abstraction around the Pool object returned by the API
nodeGroups []*NodeGroup

resourceLimiter *cloudprovider.ResourceLimiter
}

func readConf(config *scalewaygo.Config, configFile io.Reader) error {
body, err := ioutil.ReadAll(configFile)
if err != nil {
return err
}
err = json.Unmarshal(body, config)
return err
}

func newScalewayCloudProvider(configFile io.Reader, defaultUserAgent string, rl *cloudprovider.ResourceLimiter) *scalewayCloudProvider {
getenvOr := func(key, defaultValue string) string {
value := os.Getenv(key)
if value != "" {
return value
}
return defaultValue
}

// Config file passed with `cloud-config` flag
cfg := scalewaygo.Config{}
if configFile != nil {
err := readConf(&cfg, configFile)
if err != nil {
klog.Errorf("failed to read/parse scaleway config file: %s", err)
}
}

// env takes precedence over config passed by command-line
cfg.ClusterID = getenvOr("CLUSTER_ID", cfg.ClusterID)
cfg.SecretKey = getenvOr("SCW_SECRET_KEY", cfg.SecretKey)
cfg.Region = getenvOr("SCW_REGION", cfg.Region)
cfg.ApiUrl = getenvOr("SCW_API_URL", cfg.ApiUrl)

cfg.UserAgent = defaultUserAgent

client, err := scalewaygo.NewClient(cfg)
if err != nil {
klog.Fatalf("failed to create scaleway cloud provider: %v", err)
}

klog.V(4).Infof("Scaleway Cloud Provider built; ClusterId=%s,SecretKey=%s-***,Region=%s,ApiURL=%s", cfg.ClusterID, client.Token()[:8], client.Region(), client.ApiURL())

return &scalewayCloudProvider{
client: client,
clusterID: cfg.ClusterID,
resourceLimiter: rl,
}
}

func BuildScaleway(
opts config.AutoscalingOptions,
do cloudprovider.NodeGroupDiscoveryOptions,
rl *cloudprovider.ResourceLimiter,
) cloudprovider.CloudProvider {
var configFile io.Reader

if opts.CloudConfig != "" {
configFile, err := os.Open(opts.CloudConfig)

if err != nil {
klog.Errorf("could not open scaleway configuration %s: %s", opts.CloudConfig, err)
} else {
defer func() {
err = configFile.Close()
if err != nil {
klog.Errorf("failed to close scaleway config file: %s", err)
}
}()
}
}
return newScalewayCloudProvider(configFile, opts.UserAgent, rl)
}

// Name returns 'scaleway'
func (*scalewayCloudProvider) Name() string {
return cloudprovider.ScalewayProviderName
}

// NodeGroups returns all node groups configured for this cluster.
// critical endpoint, make it fast
func (scw *scalewayCloudProvider) NodeGroups() []cloudprovider.NodeGroup {

klog.V(4).Info("NodeGroups,ClusterID=", scw.clusterID)

nodeGroups := make([]cloudprovider.NodeGroup, len(scw.nodeGroups))
for i, ng := range scw.nodeGroups {
nodeGroups[i] = ng
}
return nodeGroups
}

func (scw *scalewayCloudProvider) nodeGroupForNode(node *apiv1.Node) (*NodeGroup, error) {
for _, ng := range scw.nodeGroups {
if _, ok := ng.nodes[node.Spec.ProviderID]; ok {
return ng, nil
}
}
return nil, nil
}

// NodeGroupForNode returns the node group for the given node, nil if the node
// should not be processed by cluster autoscaler, or non-nil error if such
// occurred.
// critical endpoint, make it fast
func (scw *scalewayCloudProvider) NodeGroupForNode(node *apiv1.Node) (cloudprovider.NodeGroup, error) {
klog.V(4).Infof("NodeGroupForNode,NodeSpecProviderID=%s", node.Spec.ProviderID)

return scw.nodeGroupForNode(node)
}

func (scw *scalewayCloudProvider) NodePrice(node *apiv1.Node, startTime time.Time, endTime time.Time) (float64, error) {
ng, err := scw.nodeGroupForNode(node)
if err != nil {
return 0.0, err
}

d := endTime.Sub(startTime)
hours := math.Ceil(d.Hours())

return hours * float64(ng.specs.NodePricePerHour), nil
}

func (scw *scalewayCloudProvider) PodPrice(pod *apiv1.Pod, startTime time.Time, endTime time.Time) (float64, error) {
return 0.0, nil
}

// Pricing return pricing model for scaleway.
func (scw *scalewayCloudProvider) Pricing() (cloudprovider.PricingModel, ca_errors.AutoscalerError) {
klog.V(4).Info("Pricing,called")
return scw, nil
}

// GetAvailableMachineTypes get all machine types that can be requested from scaleway.
// Not implemented
func (scw *scalewayCloudProvider) GetAvailableMachineTypes() ([]string, error) {
return []string{}, nil
}

func (scw *scalewayCloudProvider) NewNodeGroup(
machineType string,
labels map[string]string,
systemLabels map[string]string,
taints []apiv1.Taint,
extraResources map[string]resource.Quantity,
) (cloudprovider.NodeGroup, error) {
klog.V(4).Info("NewNodeGroup,called")
return nil, cloudprovider.ErrNotImplemented
}

// GetResourceLimiter returns struct containing limits (max, min) for resources (cores, memory etc.).
func (scw *scalewayCloudProvider) GetResourceLimiter() (*cloudprovider.ResourceLimiter, error) {
klog.V(4).Info("GetResourceLimiter,called")
return scw.resourceLimiter, nil
}

// GPULabel returns the label added to nodes with GPU resource.
func (scw *scalewayCloudProvider) GPULabel() string {
klog.V(6).Info("GPULabel,called")
return GPULabel
}

// GetAvailableGPUTypes return all available GPU types cloud provider supports.
// not yet implemented.
func (scw *scalewayCloudProvider) GetAvailableGPUTypes() map[string]struct{} {
klog.V(4).Info("GetAvailableGPUTypes,called")
return nil
}

// Cleanup cleans up open resources before the cloud provider is destroyed, i.e. go routines etc.
func (scw *scalewayCloudProvider) Cleanup() error {
klog.V(4).Info("Cleanup,called")
return nil
}

// Refresh is called before every main loop and can be used to dynamically update cloud provider state.
// In particular the list of node groups returned by NodeGroups can change as a result of CloudProvider.Refresh().
func (scw *scalewayCloudProvider) Refresh() error {
klog.V(4).Info("Refresh,ClusterID=", scw.clusterID)

ctx := context.Background()
resp, err := scw.client.ListPools(ctx, &scalewaygo.ListPoolsRequest{ClusterID: scw.clusterID})

if err != nil {
klog.Errorf("Refresh,failed to list pools for cluster %s: %s", scw.clusterID, err)
return err
}

var ng []*NodeGroup

for _, p := range resp.Pools {

if p.Pool.Autoscaling == false {
continue
}

nodes, err := nodesFromPool(scw.client, p.Pool)
if err != nil {
return fmt.Errorf("Refresh,failed to list nodes for pool %s: %w", p.Pool.ID, err)
}
ng = append(ng, &NodeGroup{
Client: scw.client,
nodes: nodes,
specs: &p.Specs,
p: p.Pool,
})
}
klog.V(4).Infof("Refresh,ClusterID=%s,%d pools found", scw.clusterID, len(ng))

scw.nodeGroups = ng

return nil
}
Loading

0 comments on commit 5323047

Please sign in to comment.