16723: Don't lock a requeued container while old crunch-runs exist.
author Tom Clegg <tom@tomclegg.ca>
Fri, 21 Aug 2020 15:30:04 +0000 (11:30 -0400)
committer Tom Clegg <tom@tomclegg.ca>
Fri, 21 Aug 2020 15:30:04 +0000 (11:30 -0400)
Arvados-DCO-1.1-Signed-off-by: Tom Clegg <tom@tomclegg.ca>

lib/dispatchcloud/scheduler/run_queue.go

index 4447f084a90cff2f962298c2bb3a71fef851ebb1..dddb974b326fbe7d61c280148e71f4f5c86e7abe 100644 (file)
@@ -88,6 +88,8 @@ tryrun:
                                // a higher-priority container on the
                                // same instance type. Don't let this
                                // one sneak in ahead of it.
+                       } else if sch.pool.KillContainer(ctr.UUID, "about to lock") {
+                               logger.Info("not restarting yet: crunch-run process from previous attempt has not exited")
                        } else if sch.pool.StartContainer(it, ctr) {
                                // Success.
                        } else {