Add generic restart test.
Signed-off-by: Lantao Liu <lantaol@google.com>
This commit is contained in:
parent
00cd5b6a0c
commit
09294fca40
@ -17,8 +17,6 @@ limitations under the License.
|
|||||||
package integration
|
package integration
|
||||||
|
|
||||||
import (
|
import (
|
||||||
"os"
|
|
||||||
"path/filepath"
|
|
||||||
"testing"
|
"testing"
|
||||||
"time"
|
"time"
|
||||||
|
|
||||||
@ -26,47 +24,61 @@ import (
|
|||||||
"github.com/stretchr/testify/assert"
|
"github.com/stretchr/testify/assert"
|
||||||
"github.com/stretchr/testify/require"
|
"github.com/stretchr/testify/require"
|
||||||
"golang.org/x/net/context"
|
"golang.org/x/net/context"
|
||||||
"golang.org/x/sys/unix"
|
|
||||||
runtime "k8s.io/kubernetes/pkg/kubelet/apis/cri/runtime/v1alpha2"
|
runtime "k8s.io/kubernetes/pkg/kubelet/apis/cri/runtime/v1alpha2"
|
||||||
)
|
)
|
||||||
|
|
||||||
// Restart test must run sequentially.
|
// Restart test must run sequentially.
|
||||||
// NOTE(random-liu): The current restart test only supports standalone cri-containerd mode.
|
|
||||||
|
|
||||||
func TestSandboxAcrossCRIContainerdRestart(t *testing.T) {
|
func TestContainerdRestart(t *testing.T) {
|
||||||
if !*standaloneCRIContainerd {
|
type container struct {
|
||||||
t.Skip("Skip because cri-containerd does not run in standalone mode")
|
name string
|
||||||
|
id string
|
||||||
|
state runtime.ContainerState
|
||||||
|
}
|
||||||
|
type sandbox struct {
|
||||||
|
name string
|
||||||
|
id string
|
||||||
|
state runtime.PodSandboxState
|
||||||
|
containers []container
|
||||||
}
|
}
|
||||||
ctx := context.Background()
|
ctx := context.Background()
|
||||||
sandboxNS := "sandbox-restart-cri-containerd"
|
sandboxNS := "restart-containerd"
|
||||||
sandboxes := []struct {
|
sandboxes := []sandbox{
|
||||||
name string
|
|
||||||
id string
|
|
||||||
stateBeforeExit runtime.PodSandboxState
|
|
||||||
actionAfterExit string
|
|
||||||
expectedState runtime.PodSandboxState
|
|
||||||
}{
|
|
||||||
{
|
{
|
||||||
name: "task-always-ready",
|
name: "ready-sandbox",
|
||||||
stateBeforeExit: runtime.PodSandboxState_SANDBOX_READY,
|
state: runtime.PodSandboxState_SANDBOX_READY,
|
||||||
expectedState: runtime.PodSandboxState_SANDBOX_READY,
|
containers: []container{
|
||||||
|
{
|
||||||
|
name: "created-container",
|
||||||
|
state: runtime.ContainerState_CONTAINER_CREATED,
|
||||||
|
},
|
||||||
|
{
|
||||||
|
name: "running-container",
|
||||||
|
state: runtime.ContainerState_CONTAINER_RUNNING,
|
||||||
|
},
|
||||||
|
{
|
||||||
|
name: "exited-container",
|
||||||
|
state: runtime.ContainerState_CONTAINER_EXITED,
|
||||||
|
},
|
||||||
|
},
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
name: "task-always-not-ready",
|
name: "notready-sandbox",
|
||||||
stateBeforeExit: runtime.PodSandboxState_SANDBOX_NOTREADY,
|
state: runtime.PodSandboxState_SANDBOX_NOTREADY,
|
||||||
expectedState: runtime.PodSandboxState_SANDBOX_NOTREADY,
|
containers: []container{
|
||||||
},
|
{
|
||||||
{
|
name: "created-container",
|
||||||
name: "task-exit-before-restart",
|
state: runtime.ContainerState_CONTAINER_CREATED,
|
||||||
stateBeforeExit: runtime.PodSandboxState_SANDBOX_READY,
|
},
|
||||||
actionAfterExit: "kill",
|
{
|
||||||
expectedState: runtime.PodSandboxState_SANDBOX_NOTREADY,
|
name: "running-container",
|
||||||
},
|
state: runtime.ContainerState_CONTAINER_RUNNING,
|
||||||
{
|
},
|
||||||
name: "task-deleted-before-restart",
|
{
|
||||||
stateBeforeExit: runtime.PodSandboxState_SANDBOX_READY,
|
name: "exited-container",
|
||||||
actionAfterExit: "delete",
|
state: runtime.ContainerState_CONTAINER_EXITED,
|
||||||
expectedState: runtime.PodSandboxState_SANDBOX_NOTREADY,
|
},
|
||||||
|
},
|
||||||
},
|
},
|
||||||
}
|
}
|
||||||
t.Logf("Make sure no sandbox is running before test")
|
t.Logf("Make sure no sandbox is running before test")
|
||||||
@ -74,134 +86,97 @@ func TestSandboxAcrossCRIContainerdRestart(t *testing.T) {
|
|||||||
require.NoError(t, err)
|
require.NoError(t, err)
|
||||||
require.Empty(t, existingSandboxes)
|
require.Empty(t, existingSandboxes)
|
||||||
|
|
||||||
t.Logf("Start test sandboxes")
|
t.Logf("Start test sandboxes and containers")
|
||||||
for i := range sandboxes {
|
for i := range sandboxes {
|
||||||
s := &sandboxes[i]
|
s := &sandboxes[i]
|
||||||
cfg := PodSandboxConfig(s.name, sandboxNS)
|
sbCfg := PodSandboxConfig(s.name, sandboxNS)
|
||||||
sb, err := runtimeService.RunPodSandbox(cfg)
|
sid, err := runtimeService.RunPodSandbox(sbCfg)
|
||||||
require.NoError(t, err)
|
require.NoError(t, err)
|
||||||
defer func() {
|
defer func() {
|
||||||
// Make sure the sandbox is cleaned up in any case.
|
// Make sure the sandbox is cleaned up in any case.
|
||||||
runtimeService.StopPodSandbox(sb)
|
runtimeService.StopPodSandbox(sid)
|
||||||
runtimeService.RemovePodSandbox(sb)
|
runtimeService.RemovePodSandbox(sid)
|
||||||
}()
|
}()
|
||||||
s.id = sb
|
s.id = sid
|
||||||
if s.stateBeforeExit == runtime.PodSandboxState_SANDBOX_NOTREADY {
|
for j := range s.containers {
|
||||||
require.NoError(t, runtimeService.StopPodSandbox(sb))
|
c := &s.containers[j]
|
||||||
|
cfg := ContainerConfig(c.name, pauseImage,
|
||||||
|
// Set pid namespace as per container, so that container won't die
|
||||||
|
// when sandbox container is killed.
|
||||||
|
WithPidNamespace(runtime.NamespaceMode_CONTAINER),
|
||||||
|
)
|
||||||
|
cid, err := runtimeService.CreateContainer(sid, cfg, sbCfg)
|
||||||
|
require.NoError(t, err)
|
||||||
|
// Rely on sandbox cleanup.
|
||||||
|
c.id = cid
|
||||||
|
switch c.state {
|
||||||
|
case runtime.ContainerState_CONTAINER_CREATED:
|
||||||
|
case runtime.ContainerState_CONTAINER_RUNNING:
|
||||||
|
require.NoError(t, runtimeService.StartContainer(cid))
|
||||||
|
case runtime.ContainerState_CONTAINER_EXITED:
|
||||||
|
require.NoError(t, runtimeService.StartContainer(cid))
|
||||||
|
require.NoError(t, runtimeService.StopContainer(cid, 10))
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
if s.state == runtime.PodSandboxState_SANDBOX_NOTREADY {
|
||||||
|
cntr, err := containerdClient.LoadContainer(ctx, sid)
|
||||||
t.Logf("Kill cri-containerd")
|
require.NoError(t, err)
|
||||||
require.NoError(t, KillProcess("cri-containerd"))
|
task, err := cntr.Task(ctx, nil)
|
||||||
defer func() {
|
require.NoError(t, err)
|
||||||
assert.NoError(t, Eventually(func() (bool, error) {
|
_, err = task.Delete(ctx, containerd.WithProcessKill)
|
||||||
return ConnectDaemons() == nil, nil
|
|
||||||
}, time.Second, 30*time.Second), "make sure cri-containerd is running before test finish")
|
|
||||||
}()
|
|
||||||
|
|
||||||
t.Logf("Change sandbox state, must finish before cri-containerd is restarted")
|
|
||||||
for _, s := range sandboxes {
|
|
||||||
if s.actionAfterExit == "" {
|
|
||||||
continue
|
|
||||||
}
|
|
||||||
cntr, err := containerdClient.LoadContainer(ctx, s.id)
|
|
||||||
require.NoError(t, err)
|
|
||||||
task, err := cntr.Task(ctx, nil)
|
|
||||||
require.NoError(t, err)
|
|
||||||
switch s.actionAfterExit {
|
|
||||||
case "kill":
|
|
||||||
require.NoError(t, task.Kill(ctx, unix.SIGKILL, containerd.WithKillAll))
|
|
||||||
case "delete":
|
|
||||||
_, err := task.Delete(ctx, containerd.WithProcessKill)
|
|
||||||
require.NoError(t, err)
|
require.NoError(t, err)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
t.Logf("Wait until cri-containerd is restarted")
|
t.Logf("Kill containerd")
|
||||||
|
require.NoError(t, KillProcess("containerd"))
|
||||||
|
defer func() {
|
||||||
|
assert.NoError(t, Eventually(func() (bool, error) {
|
||||||
|
return ConnectDaemons() == nil, nil
|
||||||
|
}, time.Second, 30*time.Second), "make sure containerd is running before test finish")
|
||||||
|
}()
|
||||||
|
|
||||||
|
t.Logf("Wait until containerd is killed")
|
||||||
|
require.NoError(t, Eventually(func() (bool, error) {
|
||||||
|
pid, err := PidOf("containerd")
|
||||||
|
if err != nil {
|
||||||
|
return false, err
|
||||||
|
}
|
||||||
|
return pid == 0, nil
|
||||||
|
}, time.Second, 30*time.Second), "wait for containerd to be killed")
|
||||||
|
|
||||||
|
t.Logf("Wait until containerd is restarted")
|
||||||
require.NoError(t, Eventually(func() (bool, error) {
|
require.NoError(t, Eventually(func() (bool, error) {
|
||||||
return ConnectDaemons() == nil, nil
|
return ConnectDaemons() == nil, nil
|
||||||
}, time.Second, 30*time.Second), "wait for cri-containerd to be restarted")
|
}, time.Second, 30*time.Second), "wait for containerd to be restarted")
|
||||||
|
|
||||||
t.Logf("Check sandbox state after restart")
|
t.Logf("Check sandbox and container state after restart")
|
||||||
loadedSandboxes, err := runtimeService.ListPodSandbox(&runtime.PodSandboxFilter{})
|
loadedSandboxes, err := runtimeService.ListPodSandbox(&runtime.PodSandboxFilter{})
|
||||||
require.NoError(t, err)
|
require.NoError(t, err)
|
||||||
assert.Len(t, loadedSandboxes, len(sandboxes))
|
assert.Len(t, loadedSandboxes, len(sandboxes))
|
||||||
|
loadedContainers, err := runtimeService.ListContainers(&runtime.ContainerFilter{})
|
||||||
|
require.NoError(t, err)
|
||||||
|
assert.Len(t, loadedContainers, len(sandboxes)*3)
|
||||||
for _, s := range sandboxes {
|
for _, s := range sandboxes {
|
||||||
for _, loaded := range loadedSandboxes {
|
for _, loaded := range loadedSandboxes {
|
||||||
if s.id == loaded.Id {
|
if s.id == loaded.Id {
|
||||||
assert.Equal(t, s.expectedState, loaded.State)
|
assert.Equal(t, s.state, loaded.State)
|
||||||
break
|
break
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
for _, c := range s.containers {
|
||||||
|
for _, loaded := range loadedContainers {
|
||||||
|
if c.id == loaded.Id {
|
||||||
|
assert.Equal(t, c.state, loaded.State)
|
||||||
|
break
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
t.Logf("Should be able to stop and remove sandbox after restart")
|
t.Logf("Should be able to stop and remove sandbox after restart")
|
||||||
for _, s := range sandboxes {
|
for _, s := range sandboxes {
|
||||||
// Properly stop the sandbox if it's ready before restart.
|
assert.NoError(t, runtimeService.StopPodSandbox(s.id))
|
||||||
if s.stateBeforeExit == runtime.PodSandboxState_SANDBOX_READY {
|
|
||||||
assert.NoError(t, runtimeService.StopPodSandbox(s.id))
|
|
||||||
}
|
|
||||||
assert.NoError(t, runtimeService.RemovePodSandbox(s.id))
|
assert.NoError(t, runtimeService.RemovePodSandbox(s.id))
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// TestSandboxDeletionAcrossCRIContainerdRestart tests the case that sandbox container
|
|
||||||
// is deleted from containerd while cri-containerd is down. This should not happen.
|
|
||||||
// However, if this really happens, cri-containerd should not load such sandbox and
|
|
||||||
// should do best effort cleanup of the sandbox root directory. Note that in this case,
|
|
||||||
// cri-containerd loses the network namespace of the sandbox, so it won't be able to
|
|
||||||
// teardown the network properly.
|
|
||||||
// This test uses host network sandbox to avoid resource leakage.
|
|
||||||
func TestSandboxDeletionAcrossCRIContainerdRestart(t *testing.T) {
|
|
||||||
if !*standaloneCRIContainerd {
|
|
||||||
t.Skip("Skip because cri-containerd does not run in standalone mode")
|
|
||||||
}
|
|
||||||
ctx := context.Background()
|
|
||||||
sandboxNS := "sandbox-delete-restart-cri-containerd"
|
|
||||||
t.Logf("Make sure no sandbox is running before test")
|
|
||||||
existingSandboxes, err := runtimeService.ListPodSandbox(&runtime.PodSandboxFilter{})
|
|
||||||
require.NoError(t, err)
|
|
||||||
require.Empty(t, existingSandboxes)
|
|
||||||
|
|
||||||
t.Logf("Start test sandboxes")
|
|
||||||
cfg := PodSandboxConfig("sandbox", sandboxNS, WithHostNetwork)
|
|
||||||
sb, err := runtimeService.RunPodSandbox(cfg)
|
|
||||||
require.NoError(t, err)
|
|
||||||
defer func() {
|
|
||||||
// Make sure the sandbox is cleaned up in any case.
|
|
||||||
runtimeService.StopPodSandbox(sb)
|
|
||||||
runtimeService.RemovePodSandbox(sb)
|
|
||||||
}()
|
|
||||||
|
|
||||||
t.Logf("Kill cri-containerd")
|
|
||||||
require.NoError(t, KillProcess("cri-containerd"))
|
|
||||||
defer func() {
|
|
||||||
assert.NoError(t, Eventually(func() (bool, error) {
|
|
||||||
return ConnectDaemons() == nil, nil
|
|
||||||
}, time.Second, 30*time.Second), "make sure cri-containerd is running before test finish")
|
|
||||||
}()
|
|
||||||
|
|
||||||
t.Logf("Delete sandbox container from containerd")
|
|
||||||
cntr, err := containerdClient.LoadContainer(ctx, sb)
|
|
||||||
require.NoError(t, err)
|
|
||||||
task, err := cntr.Task(ctx, nil)
|
|
||||||
require.NoError(t, err)
|
|
||||||
_, err = task.Delete(ctx, containerd.WithProcessKill)
|
|
||||||
require.NoError(t, err)
|
|
||||||
require.NoError(t, cntr.Delete(ctx, containerd.WithSnapshotCleanup))
|
|
||||||
|
|
||||||
t.Logf("Wait until cri-containerd is restarted")
|
|
||||||
require.NoError(t, Eventually(func() (bool, error) {
|
|
||||||
return ConnectDaemons() == nil, nil
|
|
||||||
}, time.Second, 30*time.Second), "wait for cri-containerd to be restarted")
|
|
||||||
|
|
||||||
t.Logf("Check sandbox state after restart")
|
|
||||||
loadedSandboxes, err := runtimeService.ListPodSandbox(&runtime.PodSandboxFilter{})
|
|
||||||
require.NoError(t, err)
|
|
||||||
assert.Empty(t, loadedSandboxes)
|
|
||||||
|
|
||||||
t.Logf("Make sure sandbox root is removed")
|
|
||||||
sandboxRoot := filepath.Join(*criContainerdRoot, "sandboxes", sb)
|
|
||||||
_, err = os.Stat(sandboxRoot)
|
|
||||||
assert.True(t, os.IsNotExist(err))
|
|
||||||
}
|
|
||||||
|
@ -21,6 +21,8 @@ import (
|
|||||||
"flag"
|
"flag"
|
||||||
"fmt"
|
"fmt"
|
||||||
"os/exec"
|
"os/exec"
|
||||||
|
"strconv"
|
||||||
|
"strings"
|
||||||
"time"
|
"time"
|
||||||
|
|
||||||
"github.com/containerd/containerd"
|
"github.com/containerd/containerd"
|
||||||
@ -161,6 +163,23 @@ func WithCommand(c string, args ...string) ContainerOpts {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Add pid namespace mode.
|
||||||
|
func WithPidNamespace(mode runtime.NamespaceMode) ContainerOpts {
|
||||||
|
return func(cf *runtime.ContainerConfig) {
|
||||||
|
if cf.Linux == nil {
|
||||||
|
cf.Linux = &runtime.LinuxContainerConfig{}
|
||||||
|
}
|
||||||
|
if cf.Linux.SecurityContext == nil {
|
||||||
|
cf.Linux.SecurityContext = &runtime.LinuxContainerSecurityContext{}
|
||||||
|
}
|
||||||
|
if cf.Linux.SecurityContext.NamespaceOptions == nil {
|
||||||
|
cf.Linux.SecurityContext.NamespaceOptions = &runtime.NamespaceOption{}
|
||||||
|
}
|
||||||
|
cf.Linux.SecurityContext.NamespaceOptions.Pid = mode
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
// ContainerConfig creates a container config given a name and image name
|
// ContainerConfig creates a container config given a name and image name
|
||||||
// and additional container config options
|
// and additional container config options
|
||||||
func ContainerConfig(name, image string, opts ...ContainerOpts) *runtime.ContainerConfig {
|
func ContainerConfig(name, image string, opts ...ContainerOpts) *runtime.ContainerConfig {
|
||||||
@ -212,3 +231,16 @@ func KillProcess(name string) error {
|
|||||||
}
|
}
|
||||||
return nil
|
return nil
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// PidOf returns the pid of a running process with the given name, or 0 when
// no such process exists.
//
// It shells out to `pidof`. When several processes share the name, pidof
// prints all of their pids on one line; the first one listed is returned.
// An error is returned if pidof cannot be executed, fails with diagnostic
// output, or prints something that is not a pid.
func PidOf(name string) (int, error) {
	b, err := exec.Command("pidof", name).CombinedOutput()
	output := strings.TrimSpace(string(b))
	if err != nil {
		// pidof exits non-zero without printing anything when no process
		// matches; that is the "not running" answer, not a failure. Any other
		// error (e.g. the binary is missing) must not be mistaken for it.
		if _, exited := err.(*exec.ExitError); exited && len(output) == 0 {
			return 0, nil
		}
		return 0, fmt.Errorf("failed to run pidof %q - error: %v, output: %q", name, err, output)
	}
	// Multiple matches are reported space-separated on a single line.
	pids := strings.Fields(output)
	if len(pids) == 0 {
		return 0, fmt.Errorf("pidof %q succeeded but printed no pid", name)
	}
	return strconv.Atoi(pids[0])
}
|
||||||
|
Loading…
Reference in New Issue
Block a user