Skip to content

Commit

Permalink
Prioritize node/machine linkage using ProviderID
Browse files Browse the repository at this point in the history
This is a merge openshift#100
  • Loading branch information
frobware committed Jun 3, 2019
1 parent a3e2049 commit 8b32581
Show file tree
Hide file tree
Showing 3 changed files with 300 additions and 49 deletions.
111 changes: 86 additions & 25 deletions cluster-autoscaler/cloudprovider/clusterapi/clusterapi_controller.go
Original file line number Diff line number Diff line change
Expand Up @@ -33,7 +33,8 @@ import (
)

const (
nodeProviderIDIndex = "clusterapi-nodeProviderIDIndex"
machineProviderIDIndex = "clusterapi-machineProviderIDIndex"
nodeProviderIDIndex = "clusterapi-nodeProviderIDIndex"
)

// machineController watches for Nodes, Machines, MachineSets and
Expand All @@ -52,9 +53,22 @@ type machineController struct {

type machineSetFilterFunc func(machineSet *v1alpha1.MachineSet) error

func indexNodeByNodeProviderID(obj interface{}) ([]string, error) {
func indexMachineByProviderID(obj interface{}) ([]string, error) {
if machine, ok := obj.(*v1alpha1.Machine); ok {
if machine.Spec.ProviderID != nil && *machine.Spec.ProviderID != "" {
return []string{*machine.Spec.ProviderID}, nil
}
return []string{}, nil
}
return []string{}, nil
}

func indexNodeByProviderID(obj interface{}) ([]string, error) {
if node, ok := obj.(*corev1.Node); ok {
return []string{node.Spec.ProviderID}, nil
if node.Spec.ProviderID != "" {
return []string{node.Spec.ProviderID}, nil
}
return []string{}, nil
}
return []string{}, nil
}
Expand Down Expand Up @@ -143,36 +157,43 @@ func (c *machineController) run(stopCh <-chan struct{}) error {
return nil
}

// findMachineByNodeProviderID find associated machine using
// node.Spec.ProviderID as the key. Returns nil if either the Node by
// node.Spec.ProviderID cannot be found or if the node has no machine
// annotation. A DeepCopy() of the object is returned on success.
func (c *machineController) findMachineByNodeProviderID(node *corev1.Node) (*v1alpha1.Machine, error) {
objs, err := c.nodeInformer.GetIndexer().ByIndex(nodeProviderIDIndex, node.Spec.ProviderID)
// findMachineByProviderID finds machine matching providerID. A
// DeepCopy() of the object is returned on success.
func (c *machineController) findMachineByProviderID(providerID string) (*v1alpha1.Machine, error) {
objs, err := c.machineInformer.Informer().GetIndexer().ByIndex(machineProviderIDIndex, providerID)
if err != nil {
return nil, err
}

switch n := len(objs); {
case n == 0:
return nil, nil
case n > 1:
return nil, fmt.Errorf("internal error; expected len==1, got %v", n)
case n == 1:
machine, ok := objs[0].(*v1alpha1.Machine)
if !ok {
return nil, fmt.Errorf("internal error; unexpected type %T", machine)
}
if machine != nil {
return machine.DeepCopy(), nil
}
}

node, ok := objs[0].(*corev1.Node)
if !ok {
return nil, fmt.Errorf("internal error; unexpected type %T", node)
// If the machine object has no providerID--maybe actuator
// does not set this value (e.g., OpenStack)--then first
// lookup the node using ProviderID. If that is successful
// then the machine can be found using the annotation (should
// it exist).
node, err := c.findNodeByProviderID(providerID)
if err != nil {
return nil, err
}

if machineName, found := node.Annotations[machineAnnotationKey]; found {
return c.findMachine(machineName)
if node == nil {
return nil, nil
}

return nil, nil
return c.findMachine(node.Annotations[machineAnnotationKey])
}

// findNodeByNodeName find the Node object keyed by node.Name. Returns
// findNodeByNodeName finds the Node object keyed by name.. Returns
// nil if it cannot be found. A DeepCopy() of the object is returned
// on success.
func (c *machineController) findNodeByNodeName(name string) (*corev1.Node, error) {
Expand Down Expand Up @@ -235,12 +256,16 @@ func newMachineController(
nodeInformer := kubeInformerFactory.Core().V1().Nodes().Informer()
nodeInformer.AddEventHandler(cache.ResourceEventHandlerFuncs{})

indexerFuncs := cache.Indexers{
nodeProviderIDIndex: indexNodeByNodeProviderID,
if err := machineInformer.Informer().GetIndexer().AddIndexers(cache.Indexers{
machineProviderIDIndex: indexMachineByProviderID,
}); err != nil {
return nil, fmt.Errorf("cannot add machine indexer: %v", err)
}

if err := nodeInformer.GetIndexer().AddIndexers(indexerFuncs); err != nil {
return nil, fmt.Errorf("cannot add indexers: %v", err)
if err := nodeInformer.GetIndexer().AddIndexers(cache.Indexers{
nodeProviderIDIndex: indexNodeByProviderID,
}); err != nil {
return nil, fmt.Errorf("cannot add node indexer: %v", err)
}

return &machineController{
Expand All @@ -263,6 +288,18 @@ func (c *machineController) machineSetNodeNames(machineSet *v1alpha1.MachineSet)
var nodes []string

for _, machine := range machines {
if machine.Spec.ProviderID != nil && *machine.Spec.ProviderID != "" {
// Prefer machine<=>node mapping using ProviderID
node, err := c.findNodeByProviderID(*machine.Spec.ProviderID)
if err != nil {
return nil, err
}
if node != nil {
nodes = append(nodes, node.Spec.ProviderID)
continue
}
}

if machine.Status.NodeRef == nil {
klog.V(4).Infof("Status.NodeRef of machine %q is currently nil", machine.Name)
continue
Expand Down Expand Up @@ -362,7 +399,7 @@ func (c *machineController) nodeGroups() ([]*nodegroup, error) {
}

func (c *machineController) nodeGroupForNode(node *corev1.Node) (*nodegroup, error) {
machine, err := c.findMachineByNodeProviderID(node)
machine, err := c.findMachineByProviderID(node.Spec.ProviderID)
if err != nil {
return nil, err
}
Expand Down Expand Up @@ -415,3 +452,27 @@ func (c *machineController) nodeGroupForNode(node *corev1.Node) (*nodegroup, err
klog.V(4).Infof("node %q is in nodegroup %q", node.Name, machineSet.Name)
return nodegroup, nil
}

// findNodeByProviderID find the Node object keyed by provideID.
// Returns nil if it cannot be found. A DeepCopy() of the object is
// returned on success.
func (c *machineController) findNodeByProviderID(providerID string) (*corev1.Node, error) {
objs, err := c.nodeInformer.GetIndexer().ByIndex(nodeProviderIDIndex, providerID)
if err != nil {
return nil, err
}

switch n := len(objs); {
case n == 0:
return nil, nil
case n > 1:
return nil, fmt.Errorf("internal error; expected len==1, got %v", n)
}

node, ok := objs[0].(*corev1.Node)
if !ok {
return nil, fmt.Errorf("internal error; unexpected type %T", node)
}

return node.DeepCopy(), nil
}
Loading

0 comments on commit 8b32581

Please sign in to comment.