Skip to content

Commit

Permalink
Inspect state of local containers to provide more debug information
Browse files Browse the repository at this point in the history
  • Loading branch information
Kirill Maksimov committed Nov 4, 2020
1 parent c4fddb7 commit 5a946b1
Show file tree
Hide file tree
Showing 4 changed files with 91 additions and 14 deletions.
2 changes: 1 addition & 1 deletion .version
Original file line number Diff line number Diff line change
@@ -1 +1 @@
v1.8.2
v1.9.0
7 changes: 7 additions & 0 deletions strelets/adapter/orchestrator.go
Original file line number Diff line number Diff line change
Expand Up @@ -2,6 +2,7 @@ package adapter

import (
"context"
"github.com/docker/docker/api/types"
"github.com/docker/docker/api/types/mount"
"io"
"time"
Expand Down Expand Up @@ -44,6 +45,10 @@ type ServiceConfig struct {
LogsMountPointNames map[string]string // simple name -> namespaced name
}

type ContainerDebugStatus struct {
ContainerState *types.ContainerState
}

type ContainerStatus struct {
Name string
NodeID string
Expand All @@ -52,6 +57,8 @@ type ContainerStatus struct {

Logs string

Debug ContainerDebugStatus

CreatedAt time.Time
}

Expand Down
14 changes: 12 additions & 2 deletions strelets/adapter/swarm_get_status.go
Original file line number Diff line number Diff line change
Expand Up @@ -17,14 +17,24 @@ func (d *dockerSwarmOrchestrator) GetStatus(ctx context.Context, since time.Dura
name, _ := d.getServiceName(ctx, task.ServiceID)
logs, _ := d.getLogs(ctx, task.ServiceID, since)

results = append(results, &ContainerStatus{
status := &ContainerStatus{
Name: name,
State: task.Status.Message,
Error: task.Status.Err,
NodeID: task.NodeID,
CreatedAt: task.CreatedAt,
Logs: logs,
})
}

if task.Status.ContainerStatus != nil {
containerId := task.Status.ContainerStatus.ContainerID
containerJSON, err := d.client.ContainerInspect(ctx, containerId)
if err == nil { // skipping because it only works on the same machine
status.Debug.ContainerState = containerJSON.State
}
}

results = append(results, status)
}
}

Expand Down
82 changes: 71 additions & 11 deletions strelets/adapter/swarm_get_status_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,7 @@ package adapter
import (
"context"
"github.com/docker/docker/api/types"
"github.com/docker/docker/api/types/container"
dockerSwarm "github.com/docker/docker/api/types/swarm"
dockerClient "github.com/docker/docker/client"
"github.com/orbs-network/boyarin/test/helpers"
Expand All @@ -13,13 +14,15 @@ import (
"time"
)

const DEFAULT_DOCKER_IMAGE = "busybox"

func TestDockerSwarm_GetStatusIfUnableToStart(t *testing.T) {
helpers.SkipUnlessSwarmIsEnabled(t)
helpers.WithContext(func(ctx context.Context) {
helpers.InitSwarmEnvironment(t, ctx)

serviceId := startDefunctContainer(t)
defer destroyDefunctBusybox(t, serviceId)
defer destroyDefunctContainer(t, serviceId)

swarm, err := NewDockerSwarm(OrchestratorOptions{}, log.GetLogger())
require.NoError(t, err)
Expand All @@ -28,7 +31,7 @@ func TestDockerSwarm_GetStatusIfUnableToStart(t *testing.T) {
status, err := swarm.GetStatus(context.TODO(), 5*time.Second)
require.NoError(t, err)
for _, s := range status {
if s.Name == defunctName {
if s.Name == DEFUNCT_NAME {
t.Log("polling reloadingBusybox:", "s.Error=", s.Error, "s.Logs=", s.Logs)
return strings.Contains(s.Error, "executable file not found")
}
Expand All @@ -45,7 +48,7 @@ func TestDockerSwarm_GetStatusIfExitsImmediately(t *testing.T) {
helpers.InitSwarmEnvironment(t, ctx)

serviceId := startReloadingContainer(t)
defer destroyDefunctBusybox(t, serviceId)
defer destroyDefunctContainer(t, serviceId)

swarm, err := NewDockerSwarm(OrchestratorOptions{}, log.GetLogger())
require.NoError(t, err)
Expand All @@ -54,7 +57,7 @@ func TestDockerSwarm_GetStatusIfExitsImmediately(t *testing.T) {
status, err := swarm.GetStatus(context.TODO(), 5*time.Second)
require.NoError(t, err)
for _, s := range status {
if s.Name == reloadingName {
if s.Name == RELOADING_NAME {
t.Log("polling reloadingBusybox:", "s.Error=", s.Error, "s.Logs=", s.Logs)
return strings.Contains(s.Error, "non-zero exit") && strings.Contains(s.Logs, "I can not be contained")
}
Expand All @@ -65,7 +68,36 @@ func TestDockerSwarm_GetStatusIfExitsImmediately(t *testing.T) {
})
}

const defunctName = "DefunctContainer"
func TestDockerSwarm_GetStatusOfUnhealthyContainer(t *testing.T) {
helpers.SkipUnlessSwarmIsEnabled(t)
helpers.WithContext(func(ctx context.Context) {
helpers.InitSwarmEnvironment(t, ctx)

serviceId := startUnhealthyContainer(t)
defer destroyDefunctContainer(t, serviceId)

swarm, err := NewDockerSwarm(OrchestratorOptions{}, log.GetLogger())
require.NoError(t, err)

require.True(t, helpers.Eventually(30*time.Second, func() bool {
status, err := swarm.GetStatus(context.TODO(), 5*time.Second)
require.NoError(t, err)
for _, s := range status {
if s.Name == UNHEALTHY_NAME {
t.Log("polling reloadingBusybox:", "s.Error=", s.Error, "s.Logs=", s.Logs)
if s.Debug.ContainerState != nil && len(s.Debug.ContainerState.Health.Log) > 0 {
return strings.Contains(s.Error, "task: non-zero exit (137): dockerexec: unhealthy container") &&
strings.Contains(s.Debug.ContainerState.Health.Log[0].Output, "HEALTHCHECK FAILED")
}
}
}

return false
}), "should be able to retrieve logs from constantly reloading container")
})
}

const DEFUNCT_NAME = "DefunctContainer"

func startDefunctContainer(t *testing.T) (serviceId string) {
client, err := dockerClient.NewClientWithOpts(dockerClient.WithVersion(DOCKER_API_VERSION))
Expand All @@ -74,20 +106,20 @@ func startDefunctContainer(t *testing.T) (serviceId string) {
spec := dockerSwarm.ServiceSpec{
TaskTemplate: dockerSwarm.TaskSpec{
ContainerSpec: &dockerSwarm.ContainerSpec{
Image: "alpine",
Image: DEFAULT_DOCKER_IMAGE,
Command: []string{"this-program-does-not-exist"},
},
},
}
spec.Name = defunctName
spec.Name = DEFUNCT_NAME

resp, err := client.ServiceCreate(context.Background(), spec, types.ServiceCreateOptions{})
require.NoError(t, err)

return resp.ID
}

const reloadingName = "ReloadingContainer"
const RELOADING_NAME = "ReloadingContainer"

func startReloadingContainer(t *testing.T) (serviceId string) {
client, err := dockerClient.NewClientWithOpts(dockerClient.WithVersion(DOCKER_API_VERSION))
Expand All @@ -96,20 +128,48 @@ func startReloadingContainer(t *testing.T) (serviceId string) {
spec := dockerSwarm.ServiceSpec{
TaskTemplate: dockerSwarm.TaskSpec{
ContainerSpec: &dockerSwarm.ContainerSpec{
Image: "alpine",
Image: DEFAULT_DOCKER_IMAGE,
Command: []string{"sh", "-c", "echo I can not be contained && exit 999"},
},
},
}
spec.Name = reloadingName
spec.Name = RELOADING_NAME

resp, err := client.ServiceCreate(context.Background(), spec, types.ServiceCreateOptions{})
require.NoError(t, err)

return resp.ID
}

const UNHEALTHY_NAME = "UnhealthyContainer"

func startUnhealthyContainer(t *testing.T) (serviceId string) {
client, err := dockerClient.NewClientWithOpts(dockerClient.WithVersion(DOCKER_API_VERSION))
require.NoError(t, err)

spec := dockerSwarm.ServiceSpec{
TaskTemplate: dockerSwarm.TaskSpec{
ContainerSpec: &dockerSwarm.ContainerSpec{
Image: DEFAULT_DOCKER_IMAGE,
Command: []string{"sh", "-c", "sleep 10000"},
Healthcheck: &container.HealthConfig{
Interval: 100 * time.Millisecond,
Retries: 1,
Test: []string{"CMD-SHELL",
"sh -c \"echo HEALTHCHECK FAILED; exit 1\""},
},
},
},
}
spec.Name = UNHEALTHY_NAME

resp, err := client.ServiceCreate(context.Background(), spec, types.ServiceCreateOptions{})
require.NoError(t, err)

return resp.ID
}

func destroyDefunctBusybox(t *testing.T, serviceId string) {
func destroyDefunctContainer(t *testing.T, serviceId string) {
client, err := dockerClient.NewClientWithOpts(dockerClient.WithVersion(DOCKER_API_VERSION))
require.NoError(t, err)

Expand Down

0 comments on commit 5a946b1

Please sign in to comment.