1 // Copyright (C) The Arvados Authors. All rights reserved.
3 // SPDX-License-Identifier: AGPL-3.0
11 "git.arvados.org/arvados.git/lib/dispatchcloud/test"
12 "git.arvados.org/arvados.git/sdk/go/arvados"
13 "git.arvados.org/arvados.git/sdk/go/ctxlog"
14 check "gopkg.in/check.v1"
17 // Ensure the scheduler expunges containers from the queue when they
18 // are no longer relevant (completed and not running, queued with
20 func (*SchedulerSuite) TestForgetIrrelevantContainers(c *check.C) {
21 ctx := ctxlog.Context(context.Background(), ctxlog.TestLogger(c))
24 ChooseType: chooseType,
25 Containers: []arvados.Container{
27 UUID: test.ContainerUUID(1),
29 State: arvados.ContainerStateQueued,
30 RuntimeConstraints: arvados.RuntimeConstraints{
36 UUID: test.ContainerUUID(2),
38 State: arvados.ContainerStateComplete,
39 RuntimeConstraints: arvados.RuntimeConstraints{
48 ents, _ := queue.Entries()
49 c.Check(ents, check.HasLen, 1)
51 sch := New(ctx, arvados.NewClientFromEnv(), &queue, &pool, nil, time.Millisecond, time.Millisecond, 0, 0, 0)
54 ents, _ = queue.Entries()
55 c.Check(ents, check.HasLen, 0)
58 func (*SchedulerSuite) TestCancelOrphanedContainers(c *check.C) {
59 ctx := ctxlog.Context(context.Background(), ctxlog.TestLogger(c))
61 unalloc: map[arvados.InstanceType]int{test.InstanceType(1): 1},
62 unknown: map[arvados.InstanceType]int{test.InstanceType(1): 1},
65 ChooseType: chooseType,
66 Containers: []arvados.Container{
68 UUID: test.ContainerUUID(1),
70 State: arvados.ContainerStateRunning,
71 RuntimeConstraints: arvados.RuntimeConstraints{
80 ents, _ := queue.Entries()
81 c.Check(ents, check.HasLen, 1)
83 sch := New(ctx, arvados.NewClientFromEnv(), &queue, &pool, nil, time.Millisecond, time.Millisecond, 0, 0, 0)
85 // Sync shouldn't cancel the container because it might be
86 // running on the VM with state=="unknown".
88 // (Cancel+forget happens asynchronously and requires multiple
89 // sync() calls, so even after 10x sync-and-sleep iterations,
90 // we aren't 100% confident that sync isn't trying to
91 // cancel. But in the test environment, the goroutines started
92 // by sync() access stubs and therefore run quickly, so it
93 // works fine in practice. We accept that if the code is
94 // broken, the test will still pass occasionally.)
95 for i := 0; i < 10; i++ {
97 time.Sleep(time.Millisecond)
99 ents, _ = queue.Entries()
100 c.Check(ents, check.HasLen, 1)
101 c.Check(ents[test.ContainerUUID(1)].Container.State, check.Equals, arvados.ContainerStateRunning)
103 // Sync should cancel & forget the container when the
104 // "unknown" node goes away.
106 // (As above, cancel+forget is async and requires multiple
107 // sync() calls, but stubs are fast so in practice this takes
108 // much less than 1s to complete.)
110 for deadline := time.Now().Add(time.Second); ; time.Sleep(time.Millisecond) {
112 ents, _ = queue.Entries()
113 if len(ents) == 0 || time.Now().After(deadline) {
117 c.Check(ents, check.HasLen, 0)