// Copyright (C) The Arvados Authors. All rights reserved.
//
// SPDX-License-Identifier: AGPL-3.0

package worker

import (
	"bytes"
	"crypto/md5"
	"errors"
	"fmt"
	"io"
	"strings"
	"time"

	"git.arvados.org/arvados.git/lib/cloud"
	"git.arvados.org/arvados.git/lib/config"
	"git.arvados.org/arvados.git/lib/dispatchcloud/test"
	"git.arvados.org/arvados.git/sdk/go/arvados"
	"git.arvados.org/arvados.git/sdk/go/ctxlog"
	"github.com/prometheus/client_golang/prometheus"
	"github.com/sirupsen/logrus"
	check "gopkg.in/check.v1"
)

var _ = check.Suite(&WorkerSuite{})

type WorkerSuite struct {
	logger      logrus.FieldLogger
	testCluster *arvados.Cluster
}

func (suite *WorkerSuite) SetUpTest(c *check.C) {
	suite.logger = ctxlog.TestLogger(c)
	cfg, err := config.NewLoader(nil, suite.logger).Load()
	c.Assert(err, check.IsNil)
	suite.testCluster, err = cfg.GetCluster("")
	c.Assert(err, check.IsNil)
}

func (suite *WorkerSuite) TestProbeAndUpdate(c *check.C) {
	bootTimeout := time.Minute
	probeTimeout := time.Second

	ac := arvados.NewClientFromEnv()
	is, err := (&test.StubDriver{}).InstanceSet(nil, "test-instance-set-id", nil, suite.logger)
	c.Assert(err, check.IsNil)
	inst, err := is.Create(arvados.InstanceType{}, "", nil, "echo InitCommand", nil)
	c.Assert(err, check.IsNil)

	type trialT struct {
		testCaseComment string // displayed in test output to help identify failure case
		age             time.Duration
		state           State
		running         int
		starting        int
		respBoot        stubResp // zero value is success
		respDeploy      stubResp // zero value is success
		respRun         stubResp // zero value is success + nothing running
		respRunDeployed stubResp
		deployRunner    []byte
		expectStdin     []byte
		expectState     State
		expectRunning   int
	}

	errFail := errors.New("failed")
	respFail := stubResp{"", "command failed\n", errFail}
	respContainerRunning := stubResp{"zzzzz-dz642-abcdefghijklmno\n", "", nil}
	for idx, trial := range []trialT{
		{
			testCaseComment: "Unknown, probes fail",
			state:           StateUnknown,
			respBoot:        respFail,
			respRun:         respFail,
			expectState:     StateUnknown,
		},
		{
			testCaseComment: "Unknown, boot probe fails, but one container is running",
			state:           StateUnknown,
			respBoot:        respFail,
			respRun:         respContainerRunning,
			expectState:     StateUnknown,
			expectRunning:   1,
		},
		{
			testCaseComment: "Unknown, boot probe fails, previously running container has exited",
			state:           StateUnknown,
			running:         1,
			respBoot:        respFail,
			expectState:     StateUnknown,
			expectRunning:   0,
		},
		{
			testCaseComment: "Unknown, boot timeout exceeded, boot probe fails",
			state:           StateUnknown,
			age:             bootTimeout + time.Second,
			respBoot:        respFail,
			respRun:         respFail,
			expectState:     StateShutdown,
		},
		{
			testCaseComment: "Unknown, boot timeout exceeded, boot probe succeeds but crunch-run fails",
			state:           StateUnknown,
			age:             bootTimeout * 2,
			respRun:         respFail,
			expectState:     StateShutdown,
		},
		{
			testCaseComment: "Unknown, boot timeout exceeded, boot probe fails but crunch-run succeeds",
			state:           StateUnknown,
			age:             bootTimeout * 2,
			respBoot:        respFail,
			expectState:     StateShutdown,
		},
		{
			testCaseComment: "Unknown, boot timeout exceeded, boot probe fails but container is running",
			state:           StateUnknown,
			age:             bootTimeout * 2,
			respBoot:        respFail,
			respRun:         respContainerRunning,
			expectState:     StateUnknown,
			expectRunning:   1,
		},
		{
			testCaseComment: "Unknown, boot probe fails, deployRunner succeeds, container is running",
			state:           StateUnknown,
			respBoot:        respFail,
			respRun:         respFail,
			respRunDeployed: respContainerRunning,
			deployRunner:    []byte("ELF"),
			expectStdin:     []byte("ELF"),
			expectState:     StateUnknown,
			expectRunning:   1,
		},
		{
			testCaseComment: "Unknown, boot timeout exceeded, boot probe fails but deployRunner succeeds and container is running",
			state:           StateUnknown,
			age:             bootTimeout * 2,
			respBoot:        respFail,
			respRun:         respFail,
			respRunDeployed: respContainerRunning,
			deployRunner:    []byte("ELF"),
			expectStdin:     []byte("ELF"),
			expectState:     StateUnknown,
			expectRunning:   1,
		},
		{
			testCaseComment: "Unknown, boot timeout exceeded, boot probe fails but deployRunner succeeds and no container is running",
			state:           StateUnknown,
			age:             bootTimeout * 2,
			respBoot:        respFail,
			respRun:         respFail,
			deployRunner:    []byte("ELF"),
			expectStdin:     []byte("ELF"),
			expectState:     StateShutdown,
		},
		{
			testCaseComment: "Booting, boot probe fails, run probe fails",
			state:           StateBooting,
			respBoot:        respFail,
			respRun:         respFail,
			expectState:     StateBooting,
		},
		{
			testCaseComment: "Booting, boot probe fails, run probe succeeds (but isn't expected to be called)",
			state:           StateBooting,
			respBoot:        respFail,
			expectState:     StateBooting,
		},
		{
			testCaseComment: "Booting, boot probe succeeds, run probe fails",
			state:           StateBooting,
			respRun:         respFail,
			expectState:     StateBooting,
		},
		{
			testCaseComment: "Booting, boot probe succeeds, run probe succeeds",
			state:           StateBooting,
			expectState:     StateIdle,
		},
		{
			testCaseComment: "Booting, boot probe succeeds, run probe succeeds, container is running",
			state:           StateBooting,
			respRun:         respContainerRunning,
			expectState:     StateRunning,
			expectRunning:   1,
		},
		{
			testCaseComment: "Booting, boot timeout exceeded",
			state:           StateBooting,
			age:             bootTimeout * 2,
			respRun:         respFail,
			expectState:     StateShutdown,
		},
		{
			testCaseComment: "Idle, probe timeout exceeded, one container running",
			state:           StateIdle,
			age:             probeTimeout * 2,
			respRun:         respContainerRunning,
			expectState:     StateRunning,
			expectRunning:   1,
		},
		{
			testCaseComment: "Idle, probe timeout exceeded, one container running, probe fails",
			state:           StateIdle,
			age:             probeTimeout * 2,
			running:         1,
			respRun:         respFail,
			expectState:     StateShutdown,
			expectRunning:   1,
		},
		{
			testCaseComment: "Idle, probe timeout exceeded, nothing running, probe fails",
			state:           StateIdle,
			age:             probeTimeout * 2,
			respRun:         respFail,
			expectState:     StateShutdown,
		},
		{
			testCaseComment: "Running, one container still running",
			state:           StateRunning,
			running:         1,
			respRun:         respContainerRunning,
			expectState:     StateRunning,
			expectRunning:   1,
		},
		{
			testCaseComment: "Running, container has exited",
			state:           StateRunning,
			running:         1,
			expectState:     StateIdle,
			expectRunning:   0,
		},
		{
			testCaseComment: "Running, probe timeout exceeded, nothing running, new container being started",
			state:           StateRunning,
			age:             probeTimeout * 2,
			starting:        1,
			expectState:     StateRunning,
		},
		{
			testCaseComment: "Booting, boot probe succeeds, deployRunner succeeds, run probe succeeds",
			state:           StateBooting,
			deployRunner:    []byte("ELF"),
			expectStdin:     []byte("ELF"),
			respRun:         respFail,
			respRunDeployed: respContainerRunning,
			expectRunning:   1,
			expectState:     StateRunning,
		},
		{
			testCaseComment: "Booting, boot probe succeeds, deployRunner fails",
			state:           StateBooting,
			deployRunner:    []byte("ELF"),
			respDeploy:      respFail,
			expectStdin:     []byte("ELF"),
			expectState:     StateBooting,
		},
		{
			testCaseComment: "Booting, boot probe succeeds, deployRunner skipped, run probe succeeds",
			state:           StateBooting,
			deployRunner:    nil,
			respDeploy:      respFail,
			expectState:     StateIdle,
		},
	} {
		c.Logf("------- trial %d: %#v", idx, trial)
		ctime := time.Now().Add(-trial.age)
		exr := &stubExecutor{
			response: map[string]stubResp{
				"bootprobe":         trial.respBoot,
				"crunch-run --list": trial.respRun,
				"{deploy}":          trial.respDeploy,
			},
		}
		wp := &Pool{
			arvClient:        ac,
			newExecutor:      func(cloud.Instance) Executor { return exr },
			cluster:          suite.testCluster,
			bootProbeCommand: "bootprobe",
			timeoutBooting:   bootTimeout,
			timeoutProbe:     probeTimeout,
			exited:           map[string]time.Time{},
			runnerCmdDefault: "crunch-run",
			runnerArgs:       []string{"--args=not used with --list"},
			runnerCmd:        "crunch-run",
			runnerData:       trial.deployRunner,
			runnerMD5:        md5.Sum(trial.deployRunner),
		}
		wp.registerMetrics(prometheus.NewRegistry())
		if trial.deployRunner != nil {
			svHash := md5.Sum(trial.deployRunner)
			wp.runnerCmd = fmt.Sprintf("/var/run/arvados/crunch-run~%x", svHash)
			exr.response[wp.runnerCmd+" --list"] = trial.respRunDeployed
		}
		wkr := &worker{
			logger:   suite.logger,
			executor: exr,
			wp:       wp,
			mtx:      &wp.mtx,
			state:    trial.state,
			instance: inst,
			appeared: ctime,
			busy:     ctime,
			probed:   ctime,
			updated:  ctime,
			running:  map[string]*remoteRunner{},
			starting: map[string]*remoteRunner{},
			probing:  make(chan struct{}, 1),
		}
		if trial.running > 0 {
			uuid := "zzzzz-dz642-abcdefghijklmno"
			wkr.running = map[string]*remoteRunner{uuid: newRemoteRunner(uuid, wkr)}
		}
		if trial.starting > 0 {
			uuid := "zzzzz-dz642-bcdefghijklmnop"
			wkr.starting = map[string]*remoteRunner{uuid: newRemoteRunner(uuid, wkr)}
		}
		wkr.probeAndUpdate()
		c.Check(wkr.state, check.Equals, trial.expectState)
		c.Check(len(wkr.running), check.Equals, trial.expectRunning)
		c.Check(exr.stdin.String(), check.Equals, string(trial.expectStdin))
	}
}

type stubResp struct {
	stdout string
	stderr string
	err    error
}

type stubExecutor struct {
	response map[string]stubResp
	stdin    bytes.Buffer
}

func (se *stubExecutor) SetTarget(cloud.ExecutorTarget) {}
func (se *stubExecutor) Close()                         {}
func (se *stubExecutor) Execute(env map[string]string, cmd string, stdin io.Reader) (stdout, stderr []byte, err error) {
	if stdin != nil {
		_, err = io.Copy(&se.stdin, stdin)
		if err != nil {
			return nil, []byte(err.Error()), err
		}
	}
	resp, ok := se.response[cmd]
	if !ok && strings.Contains(cmd, `; cat >"$dstfile"`) {
		resp, ok = se.response["{deploy}"]
	}
	if !ok {
		return nil, []byte(fmt.Sprintf("%s: command not found\n", cmd)), errors.New("command not found")
	}
	return []byte(resp.stdout), []byte(resp.stderr), resp.err
}