Merge branch 'pr/24'

[arvados.git] / services / keepstore / pull_worker_test.go
diff --git a/services/keepstore/pull_worker_test.go b/services/keepstore/pull_worker_test.go

index 0bdb886b95558669dc8dfcbf69b08f7c94c15b5e..c6a41953842b6c2ab9403c84c04d17cee839fabd 100644 (file)
--- a/services/keepstore/pull_worker_test.go
+++ b/services/keepstore/pull_worker_test.go
@@ -1,121 +1,332 @@
  package main
  
  import (
+       "bytes"
         "errors"
+       "git.curoverse.com/arvados.git/sdk/go/arvadosclient"
+       "git.curoverse.com/arvados.git/sdk/go/keepclient"
+       . "gopkg.in/check.v1"
+       "io"
         "net/http"
         "testing"
         "time"
  )
  
+// PullWorkerTestSuite is the gocheck suite that holds the pull worker tests.
+type PullWorkerTestSuite struct{}
+
+// TestPullWorker is the "go test" entry point; TestingT hands control to
+// gocheck, which runs the suites registered with Suite.
  func TestPullWorker(t *testing.T) {
-       defer teardown()
+       TestingT(t)
+}
+
+// Register the suite with gocheck.
+var _ = Suite(&PullWorkerTestSuite{})
+
+// State shared between the test methods and the mocks that performTest
+// installs. SetUpTest resets everything except currentTestData.
+var testPullLists map[string]string // one entry per pull list queued during the current test
+var readContent string // content served by the last successful mocked GetContent call
+var readError error // error returned by the last failing mocked GetContent call
+var putContent []byte // content received by the last successful mocked PutContent call
+var putError error // error returned by the last failing mocked PutContent call
+var currentTestData PullWorkerTestData // scenario most recently passed to performTest
  
-       // Since keepstore does not come into picture in tests,
-       // we need to explicitly start the goroutine in tests.
-       go RunPullWorker(pullq.NextItem)
+// SetUpTest is the gocheck per-test fixture: it clears the values recorded
+// by the mocked GetContent and PutContent and starts a new testPullLists.
+func (s *PullWorkerTestSuite) SetUpTest(c *C) {
+       readContent = ""
+       readError = nil
+       putContent = []byte("")
+       putError = nil
  
-       data_manager_token = "DATA MANAGER TOKEN"
+       // A newly submitted pull list replaces whatever is still queued.
+       // testPullLists records every list a test queues, so that
+       // TestPullWorkerPullList_with_two_items_latest_replacing_old can
+       // compare it with the lists the worker actually processed.
+       testPullLists = make(map[string]string)
+}
+
+// RunTestPullWorker replaces pullq with a fresh work queue and starts a
+// pull worker goroutine on it. Since keepstore does not come into picture
+// in tests, the goroutine has to be started explicitly here.
+func RunTestPullWorker(c *C) {
+       arv, err := arvadosclient.MakeArvadosClient()
+       c.Assert(err, Equals, nil)
+       keepClient, err := keepclient.MakeKeepClient(&arv)
+       c.Assert(err, Equals, nil)
  
-       first_pull_list := []byte(`[
+       // Any queue previously stored in pullq is dropped at this point.
+       pullq = NewWorkQueue()
+       go RunPullWorker(pullq, keepClient)
+}
+
+// firstPullList is a /pull request body with two entries: the first
+// locator lists server_1 and server_2, the second lists server_3.
+var firstPullList = []byte(`[
                 {
-                       "locator":"locator1_to_verify_first_pull_list",
+                       "locator":"acbd18db4cc2f85cedef654fccc4a4d8+3",
                         "servers":[
                                 "server_1",
                                 "server_2"
                         ]
-               },
-    {
-                       "locator":"locator2_to_verify_first_pull_list",
+               },{
+                       "locator":"37b51d194a7513e45b56f6524f2d51f2+3",
                         "servers":[
-                               "server_1"
+                               "server_3"
                         ]
                 }
         ]`)
  
-       second_pull_list := []byte(`[
+// secondPullList is a /pull request body with a single entry whose
+// locator lists server_1 and server_2.
+var secondPullList = []byte(`[
                 {
-                       "locator":"locator_to_verify_second_pull_list",
+                       "locator":"73feffa4b7f6bb68e44cf984c85f6e88+3",
                         "servers":[
                                 "server_1",
-        "server_2"
+                               "server_2"
                         ]
                 }
         ]`)
  
-       type PullWorkerTestData struct {
-               name          string
-               req           RequestTester
-               response_code int
-               response_body string
-               read_content  string
-               read_error    bool
-               put_error     bool
+// PullWorkerTestData describes one scenario run by performTest.
+type PullWorkerTestData struct {
+       name         string // key under which the scenario is recorded in the pull-list maps
+       req          RequestTester // request handed to IssueRequest
+       responseCode int // status code the response must carry
+       responseBody string // body the response must carry
+       readContent  string // data the mocked GetContent serves
+       readError    bool // when true, the mocked GetContent fails
+       putError     bool // when true, the mocked PutContent fails
+}
+
+// TestPullWorkerPullList_with_two_locators submits firstPullList with the
+// data manager token and expects both the read and the put to succeed.
+func (s *PullWorkerTestSuite) TestPullWorkerPullList_with_two_locators(c *C) {
+       defer teardown()
+
+       dataManagerToken = "DATA MANAGER TOKEN"
+       testData := PullWorkerTestData{
+               name:         "TestPullWorkerPullList_with_two_locators",
+               req:          RequestTester{"/pull", dataManagerToken, "PUT", firstPullList},
+               responseCode: http.StatusOK,
+               responseBody: "Received 2 pull requests\n",
+               readContent:  "hello",
+               readError:    false,
+               putError:     false,
         }
-       var testcases = []PullWorkerTestData{
-               {
-                       "Pull request 1 from the data manager in worker",
-                       RequestTester{"/pull", data_manager_token, "PUT", first_pull_list},
-                       http.StatusOK,
-                       "Received 2 pull requests\n",
-                       "hello",
-                       false,
-                       false,
-               },
-               {
-                       "Pull request 2 from the data manager in worker",
-                       RequestTester{"/pull", data_manager_token, "PUT", second_pull_list},
-                       http.StatusOK,
-                       "Received 1 pull requests\n",
-                       "hola",
-                       false,
-                       false,
-               },
-               {
-                       "Pull request with error on get",
-                       RequestTester{"/pull", data_manager_token, "PUT", second_pull_list},
-                       http.StatusOK,
-                       "Received 1 pull requests\n",
-                       "unused",
-                       true,
-                       false,
-               },
-               {
-                       "Pull request with error on put",
-                       RequestTester{"/pull", data_manager_token, "PUT", second_pull_list},
-                       http.StatusOK,
-                       "Received 1 pull requests\n",
-                       "unused",
-                       false,
-                       true,
-               },
+
+       performTest(testData, c)
+}
+
+// TestPullWorkerPullList_with_one_locator submits secondPullList with the
+// data manager token and expects both the read and the put to succeed.
+func (s *PullWorkerTestSuite) TestPullWorkerPullList_with_one_locator(c *C) {
+       defer teardown()
+
+       dataManagerToken = "DATA MANAGER TOKEN"
+       performTest(PullWorkerTestData{
+               name:         "TestPullWorkerPullList_with_one_locator",
+               readContent:  "hola",
+               responseCode: http.StatusOK,
+               responseBody: "Received 1 pull requests\n",
+               req:          RequestTester{"/pull", dataManagerToken, "PUT", secondPullList},
+               // readError and putError keep their zero value: no failure is injected.
+       }, c)
+}
+
+// TestPullWorker_error_on_get_one_locator submits secondPullList while the
+// mocked GetContent is told to fail; the request itself is still expected
+// to be answered with 200.
+func (s *PullWorkerTestSuite) TestPullWorker_error_on_get_one_locator(c *C) {
+       defer teardown()
+
+       dataManagerToken = "DATA MANAGER TOKEN"
+       performTest(PullWorkerTestData{
+               name:         "TestPullWorker_error_on_get_one_locator",
+               readError:    true, // putError keeps its zero value
+               readContent:  "unused",
+               responseCode: http.StatusOK,
+               responseBody: "Received 1 pull requests\n",
+               req:          RequestTester{"/pull", dataManagerToken, "PUT", secondPullList},
+       }, c)
+}
+
+// TestPullWorker_error_on_get_two_locators submits firstPullList while the
+// mocked GetContent is told to fail; the request itself is still expected
+// to be answered with 200.
+func (s *PullWorkerTestSuite) TestPullWorker_error_on_get_two_locators(c *C) {
+       defer teardown()
+
+       dataManagerToken = "DATA MANAGER TOKEN"
+       testData := PullWorkerTestData{
+               name:         "TestPullWorker_error_on_get_two_locators",
+               req:          RequestTester{"/pull", dataManagerToken, "PUT", firstPullList},
+               responseCode: http.StatusOK,
+               responseBody: "Received 2 pull requests\n",
+               readContent:  "unused",
+               readError:    true,
+               putError:     false,
         }
  
-       for _, testData := range testcases {
-               // Override GetContent to mock keepclient functionality
-               GetContent = func(addr string, locator string) ([]byte, error) {
-                       if testData.read_error {
-                               return nil, errors.New("Error getting data")
-                       } else {
-                               return []byte(testData.read_content), nil
-                       }
+       performTest(testData, c)
+}
+
+// TestPullWorker_error_on_put_one_locator submits secondPullList while the
+// mocked PutContent is told to fail; the read is expected to succeed and
+// the request to be answered with 200.
+func (s *PullWorkerTestSuite) TestPullWorker_error_on_put_one_locator(c *C) {
+       defer teardown()
+
+       dataManagerToken = "DATA MANAGER TOKEN"
+       performTest(PullWorkerTestData{
+               name:         "TestPullWorker_error_on_put_one_locator",
+               putError:     true, // readError keeps its zero value
+               readContent:  "hello hello",
+               responseCode: http.StatusOK,
+               responseBody: "Received 1 pull requests\n",
+               req:          RequestTester{"/pull", dataManagerToken, "PUT", secondPullList},
+       }, c)
+}
+
+// TestPullWorker_error_on_put_two_locators submits firstPullList while the
+// mocked PutContent is told to fail; the read is expected to succeed and
+// the request to be answered with 200.
+func (s *PullWorkerTestSuite) TestPullWorker_error_on_put_two_locators(c *C) {
+       defer teardown()
+
+       dataManagerToken = "DATA MANAGER TOKEN"
+       performTest(PullWorkerTestData{
+               name:         "TestPullWorker_error_on_put_two_locators",
+               putError:     true, // readError keeps its zero value
+               readContent:  "hello again",
+               responseCode: http.StatusOK,
+               responseBody: "Received 2 pull requests\n",
+               req:          RequestTester{"/pull", dataManagerToken, "PUT", firstPullList},
+       }, c)
+}
+
+// When a new pull request arrives, the old one is replaced. This test
+// is meant to check that behavior by first putting an item on the queue
+// and then submitting secondPullList. testPullLists therefore ends up
+// with two entries, while performTest's processedPullLists sees only
+// the newest one.
+//
+// NOTE(review): performTest calls RunTestPullWorker, which assigns a
+// fresh NewWorkQueue() to pullq, so the queue primed below looks like it
+// is discarded before the worker starts -- confirm that the replacement
+// path is really exercised.
+func (s *PullWorkerTestSuite) TestPullWorkerPullList_with_two_items_latest_replacing_old(c *C) {
+       defer teardown()
+
+       pullq = NewWorkQueue()
+       pullq.ReplaceQueue(makeTestWorkList([]int{1}))
+       // Use the literal "1": string(1) converts the integer to the
+       // one-rune string "\x01", which is not what was meant.
+       testPullLists["Added_before_actual_test_item"] = "1"
+
+       dataManagerToken = "DATA MANAGER TOKEN"
+       testData := PullWorkerTestData{
+               name:         "TestPullWorkerPullList_with_two_items_latest_replacing_old",
+               req:          RequestTester{"/pull", dataManagerToken, "PUT", secondPullList},
+               responseCode: http.StatusOK,
+               responseBody: "Received 1 pull requests\n",
+               readContent:  "hola de nuevo",
+               readError:    false,
+               putError:     false,
+       }
+
+       performTest(testData, c)
+}
+
+// TestPullWorker_invalid_dataManagerToken submits firstPullList with a
+// token that does not match dataManagerToken. The request must be
+// rejected with 401; in this case, the item will not be placed on pullq,
+// so performTest expects no pull list to be processed.
+func (s *PullWorkerTestSuite) TestPullWorker_invalid_dataManagerToken(c *C) {
+       defer teardown()
+
+       dataManagerToken = "DATA MANAGER TOKEN"
+
+       testData := PullWorkerTestData{
+               // The name used to be copy-pasted from the two-locator test;
+               // it now identifies this scenario in testPullLists.
+               name:         "TestPullWorker_invalid_dataManagerToken",
+               req:          RequestTester{"/pull", "invalid_dataManagerToken", "PUT", firstPullList},
+               responseCode: http.StatusUnauthorized,
+               responseBody: "Unauthorized\n",
+               readContent:  "hello",
+               readError:    false,
+               putError:     false,
+       }
+
+       performTest(testData, c)
+}
+
+// performTest runs a single scenario against a fresh pull worker:
+//
+//   1. install two test volumes and start the worker on a new pullq;
+//   2. swap GetContent and PutContent for mocks that honour
+//      testData.readError / testData.putError and record what they saw
+//      (the originals are restored when performTest returns);
+//   3. send testData.req and check the status code and body;
+//   4. wait up to one second for the queue to drain, then check which
+//      pull lists were processed and what was read and written.
+func performTest(testData PullWorkerTestData, c *C) {
+       KeepVM = MakeTestVolumeManager(2)
+       defer KeepVM.Close()
+
+       RunTestPullWorker(c)
+       defer pullq.Close()
+
+       currentTestData = testData
+       testPullLists[testData.name] = testData.responseBody
+
+       // Filled in by the mocked GetContent, i.e. only for lists that the
+       // worker really picked up.
+       processedPullLists := make(map[string]string)
+
+       // Override GetContent to mock keepclient Get functionality
+       defer func(orig func(string, *keepclient.KeepClient) (io.ReadCloser, int64, string, error)) {
+               GetContent = orig
+       }(GetContent)
+       GetContent = func(signedLocator string, keepClient *keepclient.KeepClient) (reader io.ReadCloser, contentLength int64, url string, err error) {
+               // NOTE(review): this mock presumably runs on the pull worker
+               // goroutine; a failing c.Assert here would then stop that
+               // goroutine rather than the test -- confirm.
+               c.Assert(getStatusItem("PullQueue", "InProgress"), Equals, float64(1))
+               processedPullLists[testData.name] = testData.responseBody
+               if testData.readError {
+                       err = errors.New("Error getting data")
+                       readError = err
+                       return nil, 0, "", err
                 }
+               readContent = testData.readContent
+               cb := &ClosingBuffer{bytes.NewBufferString(testData.readContent)}
+               return cb, int64(len(testData.readContent)), "", nil
+       }
  
-               // Override PutContent to mock PutBlock functionality
-               PutContent = func(content []byte, locator string) (err error) {
-                       if testData.put_error {
-                               return errors.New("Error putting data")
-                       } else {
-                               return nil
-                       }
+       // Override PutContent to mock PutBlock functionality
+       defer func(orig func([]byte, string) error) { PutContent = orig }(PutContent)
+       PutContent = func(content []byte, locator string) (err error) {
+               if testData.putError {
+                       err = errors.New("Error putting data")
+                       putError = err
+                       return err
                 }
+               putContent = content
+               return nil
+       }
+
+       // Nothing may be queued or in progress before the request is sent.
+       c.Assert(getStatusItem("PullQueue", "InProgress"), Equals, float64(0))
+       c.Assert(getStatusItem("PullQueue", "Queued"), Equals, float64(0))
  
-               response := IssueRequest(&testData.req)
-               ExpectStatusCode(t, testData.name, testData.response_code, response)
-               ExpectBody(t, testData.name, testData.response_body, response)
+       response := IssueRequest(&testData.req)
+       c.Assert(response.Code, Equals, testData.responseCode)
+       c.Assert(response.Body.String(), Equals, testData.responseBody)
  
-               // give the channel a second to read and process all pull list entries
-               time.Sleep(1000 * time.Millisecond)
+       // Give the worker up to a second to drain the queue.
+       expectEqualWithin(c, time.Second, 0, func() interface{} {
+               st := pullq.Status()
+               return st.InProgress + st.Queued
+       })
  
-               expectChannelEmpty(t, pullq.NextItem)
+       // A missing map key yields "", which NotNil would accept, so the
+       // entries are compared against the empty string instead.
+       if testData.name == "TestPullWorkerPullList_with_two_items_latest_replacing_old" {
+               c.Assert(len(testPullLists), Equals, 2)
+               c.Assert(len(processedPullLists), Equals, 1)
+               c.Assert(testPullLists["Added_before_actual_test_item"], Not(Equals), "")
+               c.Assert(testPullLists["TestPullWorkerPullList_with_two_items_latest_replacing_old"], Not(Equals), "")
+               c.Assert(processedPullLists["TestPullWorkerPullList_with_two_items_latest_replacing_old"], Not(Equals), "")
+       } else {
+               if testData.responseCode == http.StatusOK {
+                       c.Assert(len(testPullLists), Equals, 1)
+                       c.Assert(len(processedPullLists), Equals, 1)
+                       c.Assert(testPullLists[testData.name], Not(Equals), "")
+               } else {
+                       // Rejected request: nothing reaches the worker.
+                       c.Assert(len(testPullLists), Equals, 1)
+                       c.Assert(len(processedPullLists), Equals, 0)
+               }
         }
+
+       if testData.readError {
+               c.Assert(readError, NotNil)
+       } else if testData.responseCode == http.StatusOK {
+               c.Assert(readError, IsNil)
+               c.Assert(readContent, Equals, testData.readContent)
+               if testData.putError {
+                       c.Assert(putError, NotNil)
+               } else {
+                       c.Assert(putError, IsNil)
+                       c.Assert(string(putContent), Equals, testData.readContent)
+               }
+       }
+
+       expectChannelEmpty(c, pullq.NextItem)
+}
+
+// ClosingBuffer adds a Close method to an embedded *bytes.Buffer so that
+// it can be returned where an io.ReadCloser is required.
+type ClosingBuffer struct {
+       *bytes.Buffer
+}
+
+// Close does nothing and always returns nil.
+func (cb *ClosingBuffer) Close() (err error) {
+       return
  }