Skip to content

Commit bddeba8

Browse files
committed
Make TestContainerPids more resilient
ListPids may not pick up the sh subprocess yet when it is first run. To make this test more resilient, retry fetching the processes if only a single pid is found for a short time. Signed-off-by: Derek McGowan <[email protected]>
1 parent ada2fa1 commit bddeba8

File tree

1 file changed

+58
-40
lines changed

1 file changed

+58
-40
lines changed

integration/client/container_test.go

+58-40
Original file line numberDiff line numberDiff line change
@@ -33,6 +33,15 @@ import (
3333

3434
apievents "github.com/containerd/containerd/api/events"
3535
"github.com/containerd/containerd/api/types/runc/options"
36+
"github.com/containerd/continuity/fs"
37+
"github.com/containerd/errdefs"
38+
"github.com/containerd/go-runc"
39+
"github.com/containerd/log/logtest"
40+
"github.com/containerd/platforms"
41+
"github.com/containerd/typeurl/v2"
42+
specs "github.com/opencontainers/runtime-spec/specs-go"
43+
"github.com/stretchr/testify/require"
44+
3645
. "github.com/containerd/containerd/v2/client"
3746
"github.com/containerd/containerd/v2/core/containers"
3847
"github.com/containerd/containerd/v2/core/images"
@@ -42,14 +51,6 @@ import (
4251
"github.com/containerd/containerd/v2/pkg/oci"
4352
gogotypes "github.com/containerd/containerd/v2/pkg/protobuf/types"
4453
"github.com/containerd/containerd/v2/plugins"
45-
"github.com/containerd/continuity/fs"
46-
"github.com/containerd/errdefs"
47-
"github.com/containerd/go-runc"
48-
"github.com/containerd/log/logtest"
49-
"github.com/containerd/platforms"
50-
"github.com/containerd/typeurl/v2"
51-
specs "github.com/opencontainers/runtime-spec/specs-go"
52-
"github.com/stretchr/testify/require"
5354
)
5455

5556
func empty() cio.Creator {
@@ -571,44 +572,61 @@ func TestContainerPids(t *testing.T) {
571572
t.Errorf("invalid task pid %d", taskPid)
572573
}
573574

574-
processes, err := task.Pids(ctx)
575-
if err != nil {
576-
t.Fatal(err)
577-
}
578-
579-
l := len(processes)
580-
// The point of this test is to see that we successfully can get all of
581-
// the pids running in the container and they match the number expected,
582-
// but for Windows this concept is a bit different. Windows containers
583-
// essentially go through the usermode boot phase of the operating system,
584-
// and have quite a few processes and system services running outside of
585-
// the "init" process you specify. Because of this, there's not a great
586-
// way to say "there should only be N processes running" like we can ensure
587-
// for Linux based off the process we asked to run.
588-
//
589-
// With all that said, on Windows lets check that we're greater than one
590-
// ("init" + system services/procs)
591-
if runtime.GOOS == "windows" {
592-
if l <= 1 {
593-
t.Errorf("expected more than one process but received %d", l)
575+
tryUntil := time.Now().Add(time.Second)
576+
checkPids := func() bool {
577+
processes, err := task.Pids(ctx)
578+
if err != nil {
579+
t.Fatal(err)
594580
}
595-
} else {
596-
// 2 processes, 1 for sh and one for sleep
597-
if l != 2 {
598-
t.Errorf("expected 2 process but received %d", l)
581+
582+
l := len(processes)
583+
// The point of this test is to see that we successfully can get all of
584+
// the pids running in the container and they match the number expected,
585+
// but for Windows this concept is a bit different. Windows containers
586+
// essentially go through the usermode boot phase of the operating system,
587+
// and have quite a few processes and system services running outside of
588+
// the "init" process you specify. Because of this, there's not a great
589+
// way to say "there should only be N processes running" like we can ensure
590+
// for Linux based off the process we asked to run.
591+
//
592+
// With all that said, on Windows lets check that we're greater than one
593+
// ("init" + system services/procs)
594+
if runtime.GOOS == "windows" {
595+
if l <= 1 {
596+
t.Errorf("expected more than one process but received %d", l)
597+
}
598+
} else {
599+
// 2 processes, 1 for sh and one for sleep
600+
if l != 2 {
601+
if l == 1 && time.Now().Before(tryUntil) {
602+
// The subcommand may not have been started when the
603+
// pids are requested. Retrying is a simple way to
604+
// handle the race under normal conditions. A better
605+
// but more complex solution would be first waiting
606+
// for output from the subprocess to be seen.
607+
return true
608+
}
609+
t.Errorf("expected 2 process but received %d", l)
610+
}
599611
}
600-
}
601612

602-
var found bool
603-
for _, p := range processes {
604-
if p.Pid == taskPid {
605-
found = true
606-
break
613+
var found bool
614+
for _, p := range processes {
615+
if p.Pid == taskPid {
616+
found = true
617+
break
618+
}
607619
}
620+
if !found {
621+
t.Errorf("pid %d must be in %+v", taskPid, processes)
622+
}
623+
return false
608624
}
609-
if !found {
610-
t.Errorf("pid %d must be in %+v", taskPid, processes)
625+
626+
for checkPids() {
627+
time.Sleep(5 * time.Millisecond)
611628
}
629+
612630
if err := task.Kill(ctx, syscall.SIGKILL); err != nil {
613631
select {
614632
case s := <-statusC:

0 commit comments

Comments
 (0)