-
Notifications
You must be signed in to change notification settings - Fork 4k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge pull request #5062 from louisportay/lportay/master
add: Scaleway Cloud Provider for k8s CA
- Loading branch information
Showing
11 changed files
with
1,576 additions
and
2 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
43 changes: 43 additions & 0 deletions
43
cluster-autoscaler/cloudprovider/builder/builder_scaleway.go
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,43 @@ | ||
//go:build scaleway | ||
// +build scaleway | ||
|
||
/* | ||
Copyright 2022 The Kubernetes Authors. | ||
Licensed under the Apache License, Version 2.0 (the "License"); | ||
you may not use this file except in compliance with the License. | ||
You may obtain a copy of the License at | ||
http://www.apache.org/licenses/LICENSE-2.0 | ||
Unless required by applicable law or agreed to in writing, software | ||
distributed under the License is distributed on an "AS IS" BASIS, | ||
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
See the License for the specific language governing permissions and | ||
limitations under the License. | ||
*/ | ||
|
||
package builder | ||
|
||
import ( | ||
"k8s.io/autoscaler/cluster-autoscaler/cloudprovider" | ||
"k8s.io/autoscaler/cluster-autoscaler/cloudprovider/scaleway" | ||
"k8s.io/autoscaler/cluster-autoscaler/config" | ||
) | ||
|
||
// AvailableCloudProviders supported by the scaleway cloud provider builder. | ||
var AvailableCloudProviders = []string{ | ||
cloudprovider.ScalewayProviderName, | ||
} | ||
|
||
// DefaultCloudProvider for do-only build is Scaleway. | ||
const DefaultCloudProvider = cloudprovider.ScalewayProviderName | ||
|
||
func buildCloudProvider(opts config.AutoscalingOptions, do cloudprovider.NodeGroupDiscoveryOptions, rl *cloudprovider.ResourceLimiter) cloudprovider.CloudProvider { | ||
switch opts.CloudProviderName { | ||
case cloudprovider.ScalewayProviderName: | ||
return scaleway.BuildScaleway(opts, do, rl) | ||
} | ||
|
||
return nil | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,6 @@ | ||
#approvers: | ||
#- louisportay | ||
#- jtherin | ||
reviewers: | ||
- remyleone | ||
- Sh4d1 |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,29 @@ | ||
# Cluster Autoscaler for Scaleway | ||
|
||
The Scaleway Cloud Provider implementation scales nodes on different pools | ||
attached to a Kapsule cluster. It can be configured from Scaleway Kapsule API. | ||
The cluster pools need to have the option `Autoscaling` set to true to be managed by the autoscaler. | ||
|
||
## Configuration | ||
|
||
Cluster Autoscaler can be configured with 2 options | ||
### Config file | ||
a config file can be passed with the `--cloud-config` flag. | ||
here is the corresponding JSON schema: | ||
* `cluster_id`: Kapsule Cluster Id | ||
* `secret_key`: Secret Key used to manage associated Kapsule resources | ||
* `region`: Region where the control-plane is runnning | ||
* `api_url`: URL to contact Scaleway, defaults to `api.scaleway.com` | ||
|
||
### Env variables | ||
|
||
The values expected by the autoscaler are the same as above | ||
|
||
- `CLUSTER_ID` | ||
- `SCW_SECRET_KEY` | ||
- `SCW_REGION` | ||
- `SCW_API_URL` | ||
|
||
## Notes | ||
|
||
k8s nodes are identified through `node.Spec.ProviderId`, the scaleway node name or id MUST NOT be used. |
266 changes: 266 additions & 0 deletions
266
cluster-autoscaler/cloudprovider/scaleway/scaleway_cloud_provider.go
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,266 @@ | ||
/* | ||
Copyright 2022 The Kubernetes Authors. | ||
Licensed under the Apache License, Version 2.0 (the "License"); | ||
you may not use this file except in compliance with the License. | ||
You may obtain a copy of the License at | ||
http://www.apache.org/licenses/LICENSE-2.0 | ||
Unless required by applicable law or agreed to in writing, software | ||
distributed under the License is distributed on an "AS IS" BASIS, | ||
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
See the License for the specific language governing permissions and | ||
limitations under the License. | ||
*/ | ||
|
||
package scaleway | ||
|
||
import ( | ||
"context" | ||
"encoding/json" | ||
"fmt" | ||
"io" | ||
"io/ioutil" | ||
"math" | ||
"os" | ||
"time" | ||
|
||
apiv1 "k8s.io/api/core/v1" | ||
"k8s.io/apimachinery/pkg/api/resource" | ||
"k8s.io/autoscaler/cluster-autoscaler/cloudprovider" | ||
"k8s.io/autoscaler/cluster-autoscaler/cloudprovider/scaleway/scalewaygo" | ||
"k8s.io/autoscaler/cluster-autoscaler/config" | ||
ca_errors "k8s.io/autoscaler/cluster-autoscaler/utils/errors" | ||
"k8s.io/klog/v2" | ||
) | ||
|
||
const ( | ||
// GPULabel is the label added to GPU nodes | ||
GPULabel = "k8s.scaleway.com/gpu" | ||
) | ||
|
||
type scalewayCloudProvider struct { | ||
// client talks to Kapsule API | ||
client scalewaygo.Client | ||
// ClusterID is the cluster id where the Autoscaler is running. | ||
clusterID string | ||
// nodeGroups is an abstraction around the Pool object returned by the API | ||
nodeGroups []*NodeGroup | ||
|
||
resourceLimiter *cloudprovider.ResourceLimiter | ||
} | ||
|
||
func readConf(config *scalewaygo.Config, configFile io.Reader) error { | ||
body, err := ioutil.ReadAll(configFile) | ||
if err != nil { | ||
return err | ||
} | ||
err = json.Unmarshal(body, config) | ||
return err | ||
} | ||
|
||
func newScalewayCloudProvider(configFile io.Reader, defaultUserAgent string, rl *cloudprovider.ResourceLimiter) *scalewayCloudProvider { | ||
getenvOr := func(key, defaultValue string) string { | ||
value := os.Getenv(key) | ||
if value != "" { | ||
return value | ||
} | ||
return defaultValue | ||
} | ||
|
||
// Config file passed with `cloud-config` flag | ||
cfg := scalewaygo.Config{} | ||
if configFile != nil { | ||
err := readConf(&cfg, configFile) | ||
if err != nil { | ||
klog.Errorf("failed to read/parse scaleway config file: %s", err) | ||
} | ||
} | ||
|
||
// env takes precedence over config passed by command-line | ||
cfg.ClusterID = getenvOr("CLUSTER_ID", cfg.ClusterID) | ||
cfg.SecretKey = getenvOr("SCW_SECRET_KEY", cfg.SecretKey) | ||
cfg.Region = getenvOr("SCW_REGION", cfg.Region) | ||
cfg.ApiUrl = getenvOr("SCW_API_URL", cfg.ApiUrl) | ||
|
||
cfg.UserAgent = defaultUserAgent | ||
|
||
client, err := scalewaygo.NewClient(cfg) | ||
if err != nil { | ||
klog.Fatalf("failed to create scaleway cloud provider: %v", err) | ||
} | ||
|
||
klog.V(4).Infof("Scaleway Cloud Provider built; ClusterId=%s,SecretKey=%s-***,Region=%s,ApiURL=%s", cfg.ClusterID, client.Token()[:8], client.Region(), client.ApiURL()) | ||
|
||
return &scalewayCloudProvider{ | ||
client: client, | ||
clusterID: cfg.ClusterID, | ||
resourceLimiter: rl, | ||
} | ||
} | ||
|
||
// BuildScaleway returns CloudProvider implementation for Scaleway. | ||
func BuildScaleway( | ||
opts config.AutoscalingOptions, | ||
do cloudprovider.NodeGroupDiscoveryOptions, | ||
rl *cloudprovider.ResourceLimiter, | ||
) cloudprovider.CloudProvider { | ||
var configFile io.Reader | ||
|
||
if opts.CloudConfig != "" { | ||
configFile, err := os.Open(opts.CloudConfig) | ||
|
||
if err != nil { | ||
klog.Errorf("could not open scaleway configuration %s: %s", opts.CloudConfig, err) | ||
} else { | ||
defer func() { | ||
err = configFile.Close() | ||
if err != nil { | ||
klog.Errorf("failed to close scaleway config file: %s", err) | ||
} | ||
}() | ||
} | ||
} | ||
return newScalewayCloudProvider(configFile, opts.UserAgent, rl) | ||
} | ||
|
||
// Name returns 'scaleway' | ||
func (*scalewayCloudProvider) Name() string { | ||
return cloudprovider.ScalewayProviderName | ||
} | ||
|
||
// NodeGroups returns all node groups configured for this cluster. | ||
// critical endpoint, make it fast | ||
func (scw *scalewayCloudProvider) NodeGroups() []cloudprovider.NodeGroup { | ||
|
||
klog.V(4).Info("NodeGroups,ClusterID=", scw.clusterID) | ||
|
||
nodeGroups := make([]cloudprovider.NodeGroup, len(scw.nodeGroups)) | ||
for i, ng := range scw.nodeGroups { | ||
nodeGroups[i] = ng | ||
} | ||
return nodeGroups | ||
} | ||
|
||
func (scw *scalewayCloudProvider) nodeGroupForNode(node *apiv1.Node) (*NodeGroup, error) { | ||
for _, ng := range scw.nodeGroups { | ||
if _, ok := ng.nodes[node.Spec.ProviderID]; ok { | ||
return ng, nil | ||
} | ||
} | ||
return nil, nil | ||
} | ||
|
||
// NodeGroupForNode returns the node group for the given node, nil if the node | ||
// should not be processed by cluster autoscaler, or non-nil error if such | ||
// occurred. | ||
// critical endpoint, make it fast | ||
func (scw *scalewayCloudProvider) NodeGroupForNode(node *apiv1.Node) (cloudprovider.NodeGroup, error) { | ||
klog.V(4).Infof("NodeGroupForNode,NodeSpecProviderID=%s", node.Spec.ProviderID) | ||
|
||
return scw.nodeGroupForNode(node) | ||
} | ||
|
||
func (scw *scalewayCloudProvider) NodePrice(node *apiv1.Node, startTime time.Time, endTime time.Time) (float64, error) { | ||
ng, err := scw.nodeGroupForNode(node) | ||
if err != nil { | ||
return 0.0, err | ||
} | ||
|
||
d := endTime.Sub(startTime) | ||
hours := math.Ceil(d.Hours()) | ||
|
||
return hours * float64(ng.specs.NodePricePerHour), nil | ||
} | ||
|
||
func (scw *scalewayCloudProvider) PodPrice(pod *apiv1.Pod, startTime time.Time, endTime time.Time) (float64, error) { | ||
return 0.0, nil | ||
} | ||
|
||
// Pricing return pricing model for scaleway. | ||
func (scw *scalewayCloudProvider) Pricing() (cloudprovider.PricingModel, ca_errors.AutoscalerError) { | ||
klog.V(4).Info("Pricing,called") | ||
return scw, nil | ||
} | ||
|
||
// GetAvailableMachineTypes get all machine types that can be requested from scaleway. | ||
// Not implemented | ||
func (scw *scalewayCloudProvider) GetAvailableMachineTypes() ([]string, error) { | ||
return []string{}, nil | ||
} | ||
|
||
func (scw *scalewayCloudProvider) NewNodeGroup( | ||
machineType string, | ||
labels map[string]string, | ||
systemLabels map[string]string, | ||
taints []apiv1.Taint, | ||
extraResources map[string]resource.Quantity, | ||
) (cloudprovider.NodeGroup, error) { | ||
klog.V(4).Info("NewNodeGroup,called") | ||
return nil, cloudprovider.ErrNotImplemented | ||
} | ||
|
||
// GetResourceLimiter returns struct containing limits (max, min) for resources (cores, memory etc.). | ||
func (scw *scalewayCloudProvider) GetResourceLimiter() (*cloudprovider.ResourceLimiter, error) { | ||
klog.V(4).Info("GetResourceLimiter,called") | ||
return scw.resourceLimiter, nil | ||
} | ||
|
||
// GPULabel returns the label added to nodes with GPU resource. | ||
func (scw *scalewayCloudProvider) GPULabel() string { | ||
klog.V(6).Info("GPULabel,called") | ||
return GPULabel | ||
} | ||
|
||
// GetAvailableGPUTypes return all available GPU types cloud provider supports. | ||
// not yet implemented. | ||
func (scw *scalewayCloudProvider) GetAvailableGPUTypes() map[string]struct{} { | ||
klog.V(4).Info("GetAvailableGPUTypes,called") | ||
return nil | ||
} | ||
|
||
// Cleanup cleans up open resources before the cloud provider is destroyed, i.e. go routines etc. | ||
func (scw *scalewayCloudProvider) Cleanup() error { | ||
klog.V(4).Info("Cleanup,called") | ||
return nil | ||
} | ||
|
||
// Refresh is called before every main loop and can be used to dynamically update cloud provider state. | ||
// In particular the list of node groups returned by NodeGroups can change as a result of CloudProvider.Refresh(). | ||
func (scw *scalewayCloudProvider) Refresh() error { | ||
klog.V(4).Info("Refresh,ClusterID=", scw.clusterID) | ||
|
||
ctx := context.Background() | ||
resp, err := scw.client.ListPools(ctx, &scalewaygo.ListPoolsRequest{ClusterID: scw.clusterID}) | ||
|
||
if err != nil { | ||
klog.Errorf("Refresh,failed to list pools for cluster %s: %s", scw.clusterID, err) | ||
return err | ||
} | ||
|
||
var ng []*NodeGroup | ||
|
||
for _, p := range resp.Pools { | ||
|
||
if p.Pool.Autoscaling == false { | ||
continue | ||
} | ||
|
||
nodes, err := nodesFromPool(scw.client, p.Pool) | ||
if err != nil { | ||
return fmt.Errorf("Refresh,failed to list nodes for pool %s: %w", p.Pool.ID, err) | ||
} | ||
ng = append(ng, &NodeGroup{ | ||
Client: scw.client, | ||
nodes: nodes, | ||
specs: &p.Specs, | ||
p: p.Pool, | ||
}) | ||
} | ||
klog.V(4).Infof("Refresh,ClusterID=%s,%d pools found", scw.clusterID, len(ng)) | ||
|
||
scw.nodeGroups = ng | ||
|
||
return nil | ||
} |
Oops, something went wrong.