Add generic restart test.

Signed-off-by: Lantao Liu <lantaol@google.com>
2018-02-22 03:20:40 +00:00
parent 00cd5b6a0c
commit 09294fca40
2 changed files with 141 additions and 134 deletions
--- a/integration/restart_test.go
+++ b/integration/restart_test.go
@@ -17,8 +17,6 @@ limitations under the License.
 package integration
 import (
 	"os"
 	"path/filepath"
 	"testing"
 	"time"
@@ -26,47 +24,61 @@ import (
 	"github.com/stretchr/testify/assert"
 	"github.com/stretchr/testify/require"
 	"golang.org/x/net/context"
 	"golang.org/x/sys/unix"
 	runtime "k8s.io/kubernetes/pkg/kubelet/apis/cri/runtime/v1alpha2"
 )
 // Restart test must run sequentially.
 // NOTE(random-liu): The current restart test only supports standalone cri-containerd mode.
-func TestSandboxAcrossCRIContainerdRestart(t *testing.T) {
+func TestContainerdRestart(t *testing.T) {
-	if !*standaloneCRIContainerd {
+	type container struct {
-		t.Skip("Skip because cri-containerd does not run in standalone mode")
+		name  string
 		id    string
 		state runtime.ContainerState
 	}
 	type sandbox struct {
 		name       string
 		id         string
 		state      runtime.PodSandboxState
 		containers []container
 	}
 	ctx := context.Background()
-	sandboxNS := "sandbox-restart-cri-containerd"
+	sandboxNS := "restart-containerd"
-	sandboxes := []struct {
+	sandboxes := []sandbox{
 		name            string
 		id              string
 		stateBeforeExit runtime.PodSandboxState
 		actionAfterExit string
 		expectedState   runtime.PodSandboxState
 	}{
 		{
-			name:            "task-always-ready",
+			name:  "ready-sandbox",
-			stateBeforeExit: runtime.PodSandboxState_SANDBOX_READY,
+			state: runtime.PodSandboxState_SANDBOX_READY,
-			expectedState:   runtime.PodSandboxState_SANDBOX_READY,
+			containers: []container{
 				{
 					name:  "created-container",
 					state: runtime.ContainerState_CONTAINER_CREATED,
 				},
 				{
 					name:  "running-container",
 					state: runtime.ContainerState_CONTAINER_RUNNING,
 				},
 				{
 					name:  "exited-container",
 					state: runtime.ContainerState_CONTAINER_EXITED,
 				},
 			},
 		},
 		{
-			name:            "task-always-not-ready",
+			name:  "notready-sandbox",
-			stateBeforeExit: runtime.PodSandboxState_SANDBOX_NOTREADY,
+			state: runtime.PodSandboxState_SANDBOX_NOTREADY,
-			expectedState:   runtime.PodSandboxState_SANDBOX_NOTREADY,
+			containers: []container{
-		},
+				{
-		{
+					name:  "created-container",
-			name:            "task-exit-before-restart",
+					state: runtime.ContainerState_CONTAINER_CREATED,
-			stateBeforeExit: runtime.PodSandboxState_SANDBOX_READY,
+				},
-			actionAfterExit: "kill",
+				{
-			expectedState:   runtime.PodSandboxState_SANDBOX_NOTREADY,
+					name:  "running-container",
-		},
+					state: runtime.ContainerState_CONTAINER_RUNNING,
-		{
+				},
-			name:            "task-deleted-before-restart",
+				{
-			stateBeforeExit: runtime.PodSandboxState_SANDBOX_READY,
+					name:  "exited-container",
-			actionAfterExit: "delete",
+					state: runtime.ContainerState_CONTAINER_EXITED,
-			expectedState:   runtime.PodSandboxState_SANDBOX_NOTREADY,
+				},
 			},
 		},
 	}
 	t.Logf("Make sure no sandbox is running before test")
@@ -74,134 +86,97 @@ func TestSandboxAcrossCRIContainerdRestart(t *testing.T) {
 	require.NoError(t, err)
 	require.Empty(t, existingSandboxes)
-	t.Logf("Start test sandboxes")
+	t.Logf("Start test sandboxes and containers")
 	for i := range sandboxes {
 		s := &sandboxes[i]
-		cfg := PodSandboxConfig(s.name, sandboxNS)
+		sbCfg := PodSandboxConfig(s.name, sandboxNS)
-		sb, err := runtimeService.RunPodSandbox(cfg)
+		sid, err := runtimeService.RunPodSandbox(sbCfg)
 		require.NoError(t, err)
 		defer func() {
 			// Make sure the sandbox is cleaned up in any case.
-			runtimeService.StopPodSandbox(sb)
+			runtimeService.StopPodSandbox(sid)
-			runtimeService.RemovePodSandbox(sb)
+			runtimeService.RemovePodSandbox(sid)
 		}()
-		s.id = sb
+		s.id = sid
-		if s.stateBeforeExit == runtime.PodSandboxState_SANDBOX_NOTREADY {
+		for j := range s.containers {
-			require.NoError(t, runtimeService.StopPodSandbox(sb))
+			c := &s.containers[j]
 			cfg := ContainerConfig(c.name, pauseImage,
 				// Set pid namespace as per container, so that container won't die
 				// when sandbox container is killed.
 				WithPidNamespace(runtime.NamespaceMode_CONTAINER),
 			)
 			cid, err := runtimeService.CreateContainer(sid, cfg, sbCfg)
 			require.NoError(t, err)
 			// Rely on sandbox cleanup.
 			c.id = cid
 			switch c.state {
 			case runtime.ContainerState_CONTAINER_CREATED:
 			case runtime.ContainerState_CONTAINER_RUNNING:
 				require.NoError(t, runtimeService.StartContainer(cid))
 			case runtime.ContainerState_CONTAINER_EXITED:
 				require.NoError(t, runtimeService.StartContainer(cid))
 				require.NoError(t, runtimeService.StopContainer(cid, 10))
 			}
 		}
-	}
+		if s.state == runtime.PodSandboxState_SANDBOX_NOTREADY {
-
+			cntr, err := containerdClient.LoadContainer(ctx, sid)
-	t.Logf("Kill cri-containerd")
+			require.NoError(t, err)
-	require.NoError(t, KillProcess("cri-containerd"))
+			task, err := cntr.Task(ctx, nil)
-	defer func() {
+			require.NoError(t, err)
-		assert.NoError(t, Eventually(func() (bool, error) {
+			_, err = task.Delete(ctx, containerd.WithProcessKill)
 			return ConnectDaemons() == nil, nil
 		}, time.Second, 30*time.Second), "make sure cri-containerd is running before test finish")
 	}()
 	t.Logf("Change sandbox state, must finish before cri-containerd is restarted")
 	for _, s := range sandboxes {
 		if s.actionAfterExit == "" {
 			continue
 		}
 		cntr, err := containerdClient.LoadContainer(ctx, s.id)
 		require.NoError(t, err)
 		task, err := cntr.Task(ctx, nil)
 		require.NoError(t, err)
 		switch s.actionAfterExit {
 		case "kill":
 			require.NoError(t, task.Kill(ctx, unix.SIGKILL, containerd.WithKillAll))
 		case "delete":
 			_, err := task.Delete(ctx, containerd.WithProcessKill)
 			require.NoError(t, err)
 		}
 	}
-	t.Logf("Wait until cri-containerd is restarted")
+	t.Logf("Kill containerd")
 	require.NoError(t, KillProcess("containerd"))
 	defer func() {
 		assert.NoError(t, Eventually(func() (bool, error) {
 			return ConnectDaemons() == nil, nil
 		}, time.Second, 30*time.Second), "make sure containerd is running before test finish")
 	}()
 	t.Logf("Wait until containerd is killed")
 	require.NoError(t, Eventually(func() (bool, error) {
 		pid, err := PidOf("containerd")
 		if err != nil {
 			return false, err
 		}
 		return pid == 0, nil
 	}, time.Second, 30*time.Second), "wait for containerd to be killed")
 	t.Logf("Wait until containerd is restarted")
 	require.NoError(t, Eventually(func() (bool, error) {
 		return ConnectDaemons() == nil, nil
-	}, time.Second, 30*time.Second), "wait for cri-containerd to be restarted")
+	}, time.Second, 30*time.Second), "wait for containerd to be restarted")
-	t.Logf("Check sandbox state after restart")
+	t.Logf("Check sandbox and container state after restart")
 	loadedSandboxes, err := runtimeService.ListPodSandbox(&runtime.PodSandboxFilter{})
 	require.NoError(t, err)
 	assert.Len(t, loadedSandboxes, len(sandboxes))
 	loadedContainers, err := runtimeService.ListContainers(&runtime.ContainerFilter{})
 	require.NoError(t, err)
 	assert.Len(t, loadedContainers, len(sandboxes)*3)
 	for _, s := range sandboxes {
 		for _, loaded := range loadedSandboxes {
 			if s.id == loaded.Id {
-				assert.Equal(t, s.expectedState, loaded.State)
+				assert.Equal(t, s.state, loaded.State)
 				break
 			}
 		}
 		for _, c := range s.containers {
 			for _, loaded := range loadedContainers {
 				if c.id == loaded.Id {
 					assert.Equal(t, c.state, loaded.State)
 					break
 				}
 			}
 		}
 	}
 	t.Logf("Should be able to stop and remove sandbox after restart")
 	for _, s := range sandboxes {
-		// Properly stop the sandbox if it's ready before restart.
+		assert.NoError(t, runtimeService.StopPodSandbox(s.id))
 		if s.stateBeforeExit == runtime.PodSandboxState_SANDBOX_READY {
 			assert.NoError(t, runtimeService.StopPodSandbox(s.id))
 		}
 		assert.NoError(t, runtimeService.RemovePodSandbox(s.id))
 	}
 }
 // TestSandboxDeletionAcrossCRIContainerdRestart covers a sandbox whose container
 // is removed from containerd while cri-containerd is down. That is not expected
 // to happen in practice, but if it does, cri-containerd should not load the
 // sandbox after it comes back and should clean up the sandbox root directory on
 // a best-effort basis. In this situation cri-containerd no longer knows the
 // sandbox's network namespace, so it cannot tear the network down properly;
 // the test therefore uses a host network sandbox to avoid leaking resources.
 //
 // The test is skipped unless cri-containerd runs in standalone mode.
 func TestSandboxDeletionAcrossCRIContainerdRestart(t *testing.T) {
 	if standalone := *standaloneCRIContainerd; !standalone {
 		t.Skip("Skip because cri-containerd does not run in standalone mode")
 	}
 	namespace := "sandbox-delete-restart-cri-containerd"
 	ctx := context.Background()
 	// daemonsUp is the polling condition shared by both waits below: it
 	// succeeds once ConnectDaemons stops returning an error.
 	daemonsUp := func() (bool, error) {
 		return ConnectDaemons() == nil, nil
 	}
 	t.Logf("Make sure no sandbox is running before test")
 	leftovers, err := runtimeService.ListPodSandbox(&runtime.PodSandboxFilter{})
 	require.NoError(t, err)
 	require.Empty(t, leftovers)
 	t.Logf("Start test sandboxes")
 	sandboxID, err := runtimeService.RunPodSandbox(PodSandboxConfig("sandbox", namespace, WithHostNetwork))
 	require.NoError(t, err)
 	defer func() {
 		// Best-effort cleanup regardless of how the test ends; errors are
 		// intentionally ignored.
 		runtimeService.StopPodSandbox(sandboxID)
 		runtimeService.RemovePodSandbox(sandboxID)
 	}()
 	t.Logf("Kill cri-containerd")
 	require.NoError(t, KillProcess("cri-containerd"))
 	defer func() {
 		assert.NoError(t, Eventually(daemonsUp, time.Second, 30*time.Second),
 			"make sure cri-containerd is running before test finish")
 	}()
 	t.Logf("Delete sandbox container from containerd")
 	sandboxCntr, err := containerdClient.LoadContainer(ctx, sandboxID)
 	require.NoError(t, err)
 	sandboxTask, err := sandboxCntr.Task(ctx, nil)
 	require.NoError(t, err)
 	// Remove the task first, then the container together with its snapshot.
 	_, err = sandboxTask.Delete(ctx, containerd.WithProcessKill)
 	require.NoError(t, err)
 	require.NoError(t, sandboxCntr.Delete(ctx, containerd.WithSnapshotCleanup))
 	t.Logf("Wait until cri-containerd is restarted")
 	require.NoError(t, Eventually(daemonsUp, time.Second, 30*time.Second),
 		"wait for cri-containerd to be restarted")
 	t.Logf("Check sandbox state after restart")
 	remaining, err := runtimeService.ListPodSandbox(&runtime.PodSandboxFilter{})
 	require.NoError(t, err)
 	assert.Empty(t, remaining)
 	t.Logf("Make sure sandbox root is removed")
 	_, err = os.Stat(filepath.Join(*criContainerdRoot, "sandboxes", sandboxID))
 	assert.True(t, os.IsNotExist(err))
 }
--- a/integration/test_utils.go
+++ b/integration/test_utils.go
@@ -21,6 +21,8 @@ import (
 	"flag"
 	"fmt"
 	"os/exec"
 	"strconv"
 	"strings"
 	"time"
 	"github.com/containerd/containerd"
@@ -161,6 +163,23 @@ func WithCommand(c string, args ...string) ContainerOpts {
 	}
 }
 // WithPidNamespace returns a ContainerOpts that sets the pid namespace mode in
 // the container config's Linux security context. Any of the nested Linux,
 // SecurityContext and NamespaceOptions structs that are still nil are
 // allocated first; structs that already exist are kept and only their Pid
 // field is overwritten.
 func WithPidNamespace(mode runtime.NamespaceMode) ContainerOpts {
 	return func(cf *runtime.ContainerConfig) {
 		linux := cf.Linux
 		if linux == nil {
 			linux = &runtime.LinuxContainerConfig{}
 			cf.Linux = linux
 		}
 		sc := linux.SecurityContext
 		if sc == nil {
 			sc = &runtime.LinuxContainerSecurityContext{}
 			linux.SecurityContext = sc
 		}
 		if sc.NamespaceOptions == nil {
 			sc.NamespaceOptions = &runtime.NamespaceOption{}
 		}
 		sc.NamespaceOptions.Pid = mode
 	}
 }
 // ContainerConfig creates a container config given a name and image name
 // and additional container config options
 func ContainerConfig(name, image string, opts ...ContainerOpts) *runtime.ContainerConfig {
@@ -212,3 +231,16 @@ func KillProcess(name string) error {
 	}
 	return nil
 }
 // PidOf returns the pid of a process by name, as reported by the `pidof`
 // command.
 //
 // It returns (0, nil) when `pidof` fails without printing anything, which is
 // treated as "no such process". If `pidof` fails and does print output, that
 // output is returned inside the error. When several processes match, `pidof`
 // prints all of their pids separated by whitespace; the first one is returned.
 func PidOf(name string) (int, error) {
 	b, err := exec.Command("pidof", name).CombinedOutput()
 	output := strings.TrimSpace(string(b))
 	if err != nil {
 		if len(output) != 0 {
 			return 0, fmt.Errorf("failed to run pidof %q - error: %v, output: %q", name, err, output)
 		}
 		// A failure with empty output is interpreted as "process not found".
 		return 0, nil
 	}
 	return firstPid(output)
 }

 // firstPid parses the first whitespace-separated field of pidof output as a pid.
 // It returns an error when the output has no fields or the field is not a number.
 func firstPid(output string) (int, error) {
 	fields := strings.Fields(output)
 	if len(fields) == 0 {
 		return 0, fmt.Errorf("no pid found in pidof output %q", output)
 	}
 	return strconv.Atoi(fields[0])
 }