Skip to content
This repository has been archived by the owner on Sep 30, 2020. It is now read-only.

Create etcd and workers in private subnets, controllers in public subnet #169

Merged
merged 20 commits into from
Jan 24, 2017
Merged
Show file tree
Hide file tree
Changes from 7 commits
Commits
Show all changes
20 commits
Select commit Hold shift + click to select a range
d04a698
first pass at public private network topology
icereval Dec 27, 2016
7d93778
use function for logical name and refs
icereval Dec 27, 2016
57f57a0
define subnets in cluster, code review updates
icereval Dec 28, 2016
3137b09
simplify route tables, add node pool private logic
icereval Dec 29, 2016
e8fab45
workers private subnet and controller elb subnet selection
neoandroid Dec 29, 2016
096bd5c
fix tests
neoandroid Dec 29, 2016
3e8d431
fix go format
neoandroid Dec 30, 2016
fb99a1f
create nat gateways when workers are private yet somehow etcd & contr…
neoandroid Dec 31, 2016
e4db361
private worker efs mount targets
icereval Dec 31, 2016
6c5f04f
Merge pull request #2 from icereval/feature/private-worker-efs
neoandroid Dec 31, 2016
ce9f075
fix parameter comment
neoandroid Jan 3, 2017
34024ed
Merge branch 'master' into masters-private-subnet
neoandroid Jan 10, 2017
83dc882
remove duplicated code introduced by private subnets from cfn templates
neoandroid Jan 10, 2017
03d19fe
remove AvailabilityZones property from cfn template because its redun…
neoandroid Jan 11, 2017
a601020
Merge branch 'master' into masters-private-subnet
neoandroid Jan 11, 2017
70d791c
fix wrong variable type
neoandroid Jan 17, 2017
08a45e7
Merge branch 'master' into masters-private-subnet
neoandroid Jan 17, 2017
6dce8c8
Merge branch 'master' into masters-private-subnet
neoandroid Jan 19, 2017
0c0060b
fix format
neoandroid Jan 19, 2017
b379650
refactor private subnet support to improve stability and maintainability
neoandroid Jan 20, 2017
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion cmd/nodepool/up.go
Original file line number Diff line number Diff line change
Expand Up @@ -42,7 +42,7 @@ func runCmdUp(cmd *cobra.Command, args []string) error {
return fmt.Errorf("Failed to validate user data: %v", err)
}

data, err := conf.RenderStackTemplate(stackTemplateOptions(), upOpts.export)
data, err := conf.RenderStackTemplate(stackTemplateOptions(), upOpts.prettyPrint)
if err != nil {
return fmt.Errorf("Failed to render stack template: %v", err)
}
Expand Down
147 changes: 79 additions & 68 deletions config/config.go
Original file line number Diff line number Diff line change
Expand Up @@ -75,7 +75,8 @@ func NewDefaultCluster() *Cluster {
AWSCliImageRepo: "quay.io/coreos/awscli",
AWSCliTag: "master",
ContainerRuntime: "docker",
Subnets: []*Subnet{},
Subnets: []*model.Subnet{},
EIPAllocationIDs: []string{},
MapPublicIPs: true,
Experimental: experimental,
},
Expand Down Expand Up @@ -170,7 +171,7 @@ func ClusterFromBytes(data []byte) (*Cluster, error) {

// For backward-compatibility
if len(c.Subnets) == 0 {
c.Subnets = []*Subnet{
c.Subnets = []*model.Subnet{
{
AvailabilityZone: c.AvailabilityZone,
InstanceCIDR: c.InstanceCIDR,
Expand Down Expand Up @@ -209,14 +210,15 @@ type ComputedDeploymentSettings struct {
// Though it is highly configurable, it's basically users' responsibility to provide `correct` values if they're going beyond the defaults.
type DeploymentSettings struct {
ComputedDeploymentSettings
ClusterName string `yaml:"clusterName,omitempty"`
KeyName string `yaml:"keyName,omitempty"`
Region string `yaml:"region,omitempty"`
AvailabilityZone string `yaml:"availabilityZone,omitempty"`
ReleaseChannel string `yaml:"releaseChannel,omitempty"`
AmiId string `yaml:"amiId,omitempty"`
VPCID string `yaml:"vpcId,omitempty"`
RouteTableID string `yaml:"routeTableId,omitempty"`
ClusterName string `yaml:"clusterName,omitempty"`
KeyName string `yaml:"keyName,omitempty"`
Region string `yaml:"region,omitempty"`
AvailabilityZone string `yaml:"availabilityZone,omitempty"`
ReleaseChannel string `yaml:"releaseChannel,omitempty"`
AmiId string `yaml:"amiId,omitempty"`
VPCID string `yaml:"vpcId,omitempty"`
InternetGatewayID string `yaml:"internetGatewayId,omitempty"`
RouteTableID string `yaml:"routeTableId,omitempty"`
// Required for validations like e.g. if instance cidr is contained in vpc cidr
VPCCIDR string `yaml:"vpcCIDR,omitempty"`
InstanceCIDR string `yaml:"instanceCIDR,omitempty"`
Expand All @@ -227,7 +229,8 @@ type DeploymentSettings struct {
ContainerRuntime string `yaml:"containerRuntime,omitempty"`
KMSKeyARN string `yaml:"kmsKeyArn,omitempty"`
StackTags map[string]string `yaml:"stackTags,omitempty"`
Subnets []*Subnet `yaml:"subnets,omitempty"`
Subnets []*model.Subnet `yaml:"subnets,omitempty"`
EIPAllocationIDs []string `yaml:"eipAllocationIDs,omitempty"`
MapPublicIPs bool `yaml:"mapPublicIPs,omitempty"`
ElasticFileSystemID string `yaml:"elasticFileSystemId,omitempty"`
SSHAuthorizedKeys []string `yaml:"sshAuthorizedKeys,omitempty"`
Expand All @@ -246,22 +249,25 @@ type WorkerSettings struct {
WorkerSpotPrice string `yaml:"workerSpotPrice,omitempty"`
WorkerSecurityGroupIds []string `yaml:"workerSecurityGroupIds,omitempty"`
WorkerTenancy string `yaml:"workerTenancy,omitempty"`
WorkerTopologyPrivate bool `yaml:"workerTopologyPrivate,omitempty"`
}

// Part of configuration which is specific to controller nodes
type ControllerSettings struct {
model.Controller `yaml:"controller,omitempty"`
ControllerCount int `yaml:"controllerCount,omitempty"`
ControllerCreateTimeout string `yaml:"controllerCreateTimeout,omitempty"`
ControllerInstanceType string `yaml:"controllerInstanceType,omitempty"`
ControllerRootVolumeType string `yaml:"controllerRootVolumeType,omitempty"`
ControllerRootVolumeIOPS int `yaml:"controllerRootVolumeIOPS,omitempty"`
ControllerRootVolumeSize int `yaml:"controllerRootVolumeSize,omitempty"`
ControllerTenancy string `yaml:"controllerTenancy,omitempty"`
model.Controller `yaml:"controller,omitempty"`
ControllerCount int `yaml:"controllerCount,omitempty"`
ControllerCreateTimeout string `yaml:"controllerCreateTimeout,omitempty"`
ControllerInstanceType string `yaml:"controllerInstanceType,omitempty"`
ControllerLoadBalancerPrivate string `yaml:"controllerLoadBalancerPrivate,omitempty"`
Copy link

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Should this be a bool?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

You're right. Good catch 👍

ControllerRootVolumeType string `yaml:"controllerRootVolumeType,omitempty"`
ControllerRootVolumeIOPS int `yaml:"controllerRootVolumeIOPS,omitempty"`
ControllerRootVolumeSize int `yaml:"controllerRootVolumeSize,omitempty"`
ControllerTenancy string `yaml:"controllerTenancy,omitempty"`
}

// Part of configuration which is specific to etcd nodes
type EtcdSettings struct {
model.Etcd `yaml:"etcd,omitempty"`
EtcdCount int `yaml:"etcdCount"`
EtcdInstanceType string `yaml:"etcdInstanceType,omitempty"`
EtcdRootVolumeSize int `yaml:"etcdRootVolumeSize,omitempty"`
Expand Down Expand Up @@ -296,12 +302,6 @@ type Cluster struct {
providedEncryptService EncryptService
}

type Subnet struct {
AvailabilityZone string `yaml:"availabilityZone,omitempty"`
InstanceCIDR string `yaml:"instanceCIDR,omitempty"`
lastAllocatedAddr *net.IP
}

type Experimental struct {
AuditLog AuditLog `yaml:"auditLog"`
AwsEnvironment AwsEnvironment `yaml:"awsEnvironment"`
Expand Down Expand Up @@ -385,7 +385,8 @@ type WaitSignal struct {
}

const (
vpcLogicalName = "VPC"
vpcLogicalName = "VPC"
internetGatewayLogicalName = "InternetGateway"
)

var supportedReleaseChannels = map[string]bool{
Expand Down Expand Up @@ -474,52 +475,40 @@ func (c Cluster) Config() (*Config, error) {
config.AMI = c.AmiId
}

//Set logical name constants
config.VPCLogicalName = vpcLogicalName

//Set reference strings

//Assume VPC does not exist, reference by logical name
config.VPCRef = fmt.Sprintf(`{ "Ref" : %q }`, config.VPCLogicalName)
if config.VPCID != "" {
//This means this VPC already exists, and we can reference it directly by ID
config.VPCRef = fmt.Sprintf("%q", config.VPCID)
}

config.EtcdInstances = make([]etcdInstance, config.EtcdCount)
var etcdEndpoints, etcdInitialCluster bytes.Buffer

// Reset lastAllocatedAddr or we'll end up returning different cluster config w/ inconsistent static private ips
// for each time we call this function `cluster.Config()`
for _, subnet := range config.Subnets {
subnet.lastAllocatedAddr = nil
}

var lastAllocatedAddr = make(map[model.Subneter]*net.IP)
for etcdIndex := 0; etcdIndex < config.EtcdCount; etcdIndex++ {

//Round-robbin etcd instances across all available subnets
subnetIndex := etcdIndex % len(config.Subnets)
subnet := config.Subnets[subnetIndex]
subnet := model.Subneter(config.Subnets[subnetIndex])
subnetInstanceCIDR := config.Subnets[subnetIndex].InstanceCIDR
if config.Etcd.TopologyPrivate() {
subnet = model.Subneter(config.Etcd.PrivateSubnets[subnetIndex])
subnetInstanceCIDR = config.Etcd.PrivateSubnets[subnetIndex].InstanceCIDR
}

_, subnetCIDR, err := net.ParseCIDR(subnet.InstanceCIDR)
_, subnetCIDR, err := net.ParseCIDR(subnetInstanceCIDR)
if err != nil {
return nil, fmt.Errorf("error parsing subnet instance cidr %s: %v", subnet.InstanceCIDR, err)
return nil, fmt.Errorf("error parsing subnet instance cidr %s: %v", subnetInstanceCIDR, err)
}

if subnet.lastAllocatedAddr == nil {
if lastAllocatedAddr[subnet] == nil {
ip := subnetCIDR.IP
//TODO:(chom) this is sloppy, but "soon-ish" etcd with be self-hosted so we'll leave this be
for i := 0; i < 3; i++ {
ip = netutil.IncrementIP(ip)
}
subnet.lastAllocatedAddr = &ip
lastAllocatedAddr[subnet] = &ip
}

nextAddr := netutil.IncrementIP(*subnet.lastAllocatedAddr)
subnet.lastAllocatedAddr = &nextAddr
nextAddr := netutil.IncrementIP(*lastAllocatedAddr[subnet])
lastAllocatedAddr[subnet] = &nextAddr
instance := etcdInstance{
IPAddress: *subnet.lastAllocatedAddr,
SubnetIndex: subnetIndex,
IPAddress: *lastAllocatedAddr[subnet],
Subnet: subnet,
}

//TODO(chom): validate we're not overflowing the address space
Expand Down Expand Up @@ -670,8 +659,8 @@ func (c Cluster) RenderStackTemplate(opts StackTemplateOptions, prettyPrint bool
}

type etcdInstance struct {
IPAddress net.IP
SubnetIndex int
IPAddress net.IP
Subnet model.Subneter
}

type Config struct {
Expand All @@ -683,12 +672,6 @@ type Config struct {

// Encoded TLS assets
TLSConfig *CompactTLSAssets

//Logical names of dynamic resources
VPCLogicalName string

//Reference strings for dynamic resources
VPCRef string
}

// CloudFormation stack name which is unique in an AWS account.
Expand All @@ -697,6 +680,30 @@ func (c Config) StackName() string {
return c.ClusterName
}

func (c Config) VPCLogicalName() string {
return vpcLogicalName
}

func (c Config) VPCRef() string {
if c.VPCID != "" {
return fmt.Sprintf("%q", c.VPCID)
} else {
return fmt.Sprintf(`{ "Ref" : %q }`, c.VPCLogicalName())
}
}

func (c Config) InternetGatewayLogicalName() string {
return internetGatewayLogicalName
}

func (c Config) InternetGatewayRef() string {
if c.InternetGatewayID != "" {
return fmt.Sprintf("%q", c.InternetGatewayID)
} else {
return fmt.Sprintf(`{ "Ref" : %q }`, c.InternetGatewayLogicalName())
}
}

func (c Cluster) valid() error {
if c.CreateRecordSet {
if c.HostedZone == "" && c.HostedZoneID == "" {
Expand Down Expand Up @@ -835,8 +842,8 @@ func (c DeploymentSettings) Valid() (*DeploymentValidationResult, error) {
return nil, errors.New("kmsKeyArn must be set")
}

if c.VPCID == "" && c.RouteTableID != "" {
return nil, errors.New("vpcId must be specified if routeTableId is specified")
if c.VPCID == "" && (c.RouteTableID != "" || c.InternetGatewayID != "") {
return nil, errors.New("vpcId must be specified if routeTableId or internetGatewayId are specified")
}

if c.Region == "" {
Expand Down Expand Up @@ -981,12 +988,16 @@ func (c *Cluster) AvailabilityZones() []string {
return []string{c.AvailabilityZone}
}

azs := make([]string, len(c.Subnets))
for i := range azs {
azs[i] = c.Subnets[i].AvailabilityZone
result := []string{}
seen := map[string]bool{}
for _, s := range c.Subnets {
val := s.AvailabilityZone
if _, ok := seen[val]; !ok {
result = append(result, val)
seen[val] = true
}
}

return azs
return result
}

/*
Expand Down
38 changes: 20 additions & 18 deletions config/config_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -11,6 +11,8 @@ import (
"strings"
"testing"
"text/template"

model "github.com/coreos/kube-aws/model"
)

const minimalConfigYaml = `externalDNSName: test.staging.core-os.net
Expand Down Expand Up @@ -314,7 +316,7 @@ func TestMultipleSubnets(t *testing.T) {

validConfigs := []struct {
conf string
subnets []*Subnet
subnets []*model.Subnet
}{
{
conf: `
Expand All @@ -327,7 +329,7 @@ subnets:
- availabilityZone: ap-northeast-1c
instanceCIDR: 10.4.4.0/24
`,
subnets: []*Subnet{
subnets: []*model.Subnet{
{
InstanceCIDR: "10.4.3.0/24",
AvailabilityZone: "ap-northeast-1a",
Expand All @@ -346,7 +348,7 @@ controllerIP: 10.4.3.50
availabilityZone: ap-northeast-1a
instanceCIDR: 10.4.3.0/24
`,
subnets: []*Subnet{
subnets: []*model.Subnet{
{
AvailabilityZone: "ap-northeast-1a",
InstanceCIDR: "10.4.3.0/24",
Expand All @@ -362,7 +364,7 @@ availabilityZone: ap-northeast-1a
instanceCIDR: 10.4.3.0/24
subnets: []
`,
subnets: []*Subnet{
subnets: []*model.Subnet{
{
AvailabilityZone: "ap-northeast-1a",
InstanceCIDR: "10.4.3.0/24",
Expand All @@ -375,7 +377,7 @@ subnets: []
availabilityZone: "ap-northeast-1a"
subnets: []
`,
subnets: []*Subnet{
subnets: []*model.Subnet{
{
AvailabilityZone: "ap-northeast-1a",
InstanceCIDR: "10.0.0.0/24",
Expand All @@ -387,7 +389,7 @@ subnets: []
# Missing subnets field fall-backs to the single subnet with the default az/cidr.
availabilityZone: "ap-northeast-1a"
`,
subnets: []*Subnet{
subnets: []*model.Subnet{
{
AvailabilityZone: "ap-northeast-1a",
InstanceCIDR: "10.0.0.0/24",
Expand Down Expand Up @@ -730,12 +732,12 @@ func newMinimalConfig() (*Config, error) {
cluster := NewDefaultCluster()
cluster.ExternalDNSName = "k8s.example.com"
cluster.Region = "us-west-1"
cluster.Subnets = []*Subnet{
&Subnet{
cluster.Subnets = []*model.Subnet{
&model.Subnet{
AvailabilityZone: "us-west-1a",
InstanceCIDR: "10.0.0.0/24",
},
&Subnet{
&model.Subnet{
AvailabilityZone: "us-west-1b",
InstanceCIDR: "10.0.1.0/24",
},
Expand Down Expand Up @@ -873,9 +875,9 @@ func TestValidateExistingVPC(t *testing.T) {
cluster := NewDefaultCluster()

cluster.VPCCIDR = "10.0.0.0/16"
cluster.Subnets = []*Subnet{
{"ap-northeast-1a", "10.0.1.0/24", nil},
{"ap-northeast-1a", "10.0.2.0/24", nil},
cluster.Subnets = []*model.Subnet{
{"ap-northeast-1a", "10.0.1.0/24", "", model.NatGateway{}},
{"ap-northeast-1a", "10.0.2.0/24", "", model.NatGateway{}},
}

for _, testCase := range validCases {
Expand All @@ -899,9 +901,9 @@ func TestValidateUserData(t *testing.T) {
cluster := newDefaultClusterWithDeps(&dummyEncryptService{})

cluster.Region = "us-west-1"
cluster.Subnets = []*Subnet{
{"us-west-1a", "10.0.1.0/16", nil},
{"us-west-1b", "10.0.2.0/16", nil},
cluster.Subnets = []*model.Subnet{
{"us-west-1a", "10.0.1.0/16", "", model.NatGateway{}},
{"us-west-1b", "10.0.2.0/16", "", model.NatGateway{}},
}

helper.WithDummyCredentials(func(dir string) {
Expand All @@ -923,9 +925,9 @@ func TestRenderStackTemplate(t *testing.T) {
cluster := newDefaultClusterWithDeps(&dummyEncryptService{})

cluster.Region = "us-west-1"
cluster.Subnets = []*Subnet{
{"us-west-1a", "10.0.1.0/16", nil},
{"us-west-1b", "10.0.2.0/16", nil},
cluster.Subnets = []*model.Subnet{
{"us-west-1a", "10.0.1.0/16", "", model.NatGateway{}},
{"us-west-1b", "10.0.2.0/16", "", model.NatGateway{}},
}

helper.WithDummyCredentials(func(dir string) {
Expand Down
Loading