14807: Allow some fake nodes to remain unbroken.
[arvados.git] / lib / dispatchcloud / container / queue_test.go
1 // Copyright (C) The Arvados Authors. All rights reserved.
2 //
3 // SPDX-License-Identifier: AGPL-3.0
4
5 package container
6
7 import (
8         "errors"
9         "os"
10         "sync"
11         "testing"
12         "time"
13
14         "git.curoverse.com/arvados.git/sdk/go/arvados"
15         "git.curoverse.com/arvados.git/sdk/go/arvadostest"
16         "github.com/sirupsen/logrus"
17         check "gopkg.in/check.v1"
18 )
19
20 // Gocheck boilerplate
21 func Test(t *testing.T) {
22         check.TestingT(t)
23 }
24
25 var _ = check.Suite(&IntegrationSuite{})
26
27 func logger() logrus.FieldLogger {
28         logger := logrus.StandardLogger()
29         if os.Getenv("ARVADOS_DEBUG") != "" {
30                 logger.SetLevel(logrus.DebugLevel)
31         }
32         return logger
33 }
34
35 type IntegrationSuite struct{}
36
37 func (suite *IntegrationSuite) TearDownTest(c *check.C) {
38         err := arvados.NewClientFromEnv().RequestAndDecode(nil, "POST", "database/reset", nil, nil)
39         c.Check(err, check.IsNil)
40 }
41
42 func (suite *IntegrationSuite) TestGetLockUnlockCancel(c *check.C) {
43         typeChooser := func(ctr *arvados.Container) (arvados.InstanceType, error) {
44                 return arvados.InstanceType{Name: "testType"}, nil
45         }
46
47         client := arvados.NewClientFromEnv()
48         cq := NewQueue(logger(), nil, typeChooser, client)
49
50         err := cq.Update()
51         c.Check(err, check.IsNil)
52
53         ents, threshold := cq.Entries()
54         c.Check(len(ents), check.Not(check.Equals), 0)
55         c.Check(time.Since(threshold) < time.Minute, check.Equals, true)
56         c.Check(time.Since(threshold) > 0, check.Equals, true)
57
58         _, ok := ents[arvadostest.QueuedContainerUUID]
59         c.Check(ok, check.Equals, true)
60
61         var wg sync.WaitGroup
62         for uuid, ent := range ents {
63                 c.Check(ent.Container.UUID, check.Equals, uuid)
64                 c.Check(ent.InstanceType.Name, check.Equals, "testType")
65                 c.Check(ent.Container.State, check.Equals, arvados.ContainerStateQueued)
66                 c.Check(ent.Container.Priority > 0, check.Equals, true)
67
68                 ctr, ok := cq.Get(uuid)
69                 c.Check(ok, check.Equals, true)
70                 c.Check(ctr.UUID, check.Equals, uuid)
71
72                 wg.Add(1)
73                 go func() {
74                         defer wg.Done()
75                         err := cq.Unlock(uuid)
76                         c.Check(err, check.NotNil)
77                         err = cq.Lock(uuid)
78                         c.Check(err, check.IsNil)
79                         ctr, ok := cq.Get(uuid)
80                         c.Check(ok, check.Equals, true)
81                         c.Check(ctr.State, check.Equals, arvados.ContainerStateLocked)
82                         err = cq.Lock(uuid)
83                         c.Check(err, check.NotNil)
84                         err = cq.Unlock(uuid)
85                         c.Check(err, check.IsNil)
86                         ctr, ok = cq.Get(uuid)
87                         c.Check(ok, check.Equals, true)
88                         c.Check(ctr.State, check.Equals, arvados.ContainerStateQueued)
89                         err = cq.Unlock(uuid)
90                         c.Check(err, check.NotNil)
91                 }()
92         }
93         wg.Wait()
94
95         err = cq.Cancel(arvadostest.CompletedContainerUUID)
96         c.Check(err, check.ErrorMatches, `.*State cannot change from Complete to Cancelled.*`)
97 }
98
99 func (suite *IntegrationSuite) TestCancelIfNoInstanceType(c *check.C) {
100         errorTypeChooser := func(ctr *arvados.Container) (arvados.InstanceType, error) {
101                 return arvados.InstanceType{}, errors.New("no suitable instance type")
102         }
103
104         client := arvados.NewClientFromEnv()
105         cq := NewQueue(logger(), nil, errorTypeChooser, client)
106
107         var ctr arvados.Container
108         err := client.RequestAndDecode(&ctr, "GET", "arvados/v1/containers/"+arvadostest.QueuedContainerUUID, nil, nil)
109         c.Check(err, check.IsNil)
110         c.Check(ctr.State, check.Equals, arvados.ContainerStateQueued)
111
112         cq.Update()
113
114         // Wait for the cancel operation to take effect. Container
115         // will have state=Cancelled or just disappear from the queue.
116         suite.waitfor(c, time.Second, func() bool {
117                 err := client.RequestAndDecode(&ctr, "GET", "arvados/v1/containers/"+arvadostest.QueuedContainerUUID, nil, nil)
118                 return err == nil && ctr.State == arvados.ContainerStateCancelled
119         })
120         c.Check(ctr.RuntimeStatus["error"], check.Equals, `no suitable instance type`)
121 }
122
123 func (suite *IntegrationSuite) waitfor(c *check.C, timeout time.Duration, fn func() bool) {
124         defer func() {
125                 c.Check(fn(), check.Equals, true)
126         }()
127         deadline := time.Now().Add(timeout)
128         for !fn() && time.Now().Before(deadline) {
129                 time.Sleep(timeout / 1000)
130         }
131 }