1 // Copyright (C) The Arvados Authors. All rights reserved.
3 // SPDX-License-Identifier: AGPL-3.0
14 "git.curoverse.com/arvados.git/sdk/go/arvados"
15 "git.curoverse.com/arvados.git/sdk/go/httpserver"
18 //go:generate go run generate.go
20 // CollectionList is used as a template to auto-generate List()
21 // methods for other types; see generate.go.
23 func (conn *Conn) CollectionList(ctx context.Context, options arvados.ListOptions) (arvados.CollectionList, error) {
25 var merged arvados.CollectionList
26 err := conn.splitListRequest(ctx, options, func(ctx context.Context, _ string, backend arvados.API, options arvados.ListOptions) ([]string, error) {
27 cl, err := backend.CollectionList(ctx, options)
33 if len(merged.Items) == 0 {
36 merged.Items = append(merged.Items, cl.Items...)
38 uuids := make([]string, 0, len(cl.Items))
39 for _, item := range cl.Items {
40 uuids = append(uuids, item.UUID)
44 sort.Slice(merged.Items, func(i, j int) bool { return merged.Items[i].UUID < merged.Items[j].UUID })
48 // Call fn on one or more local/remote backends if opts indicates a
49 // federation-wide list query, i.e.:
51 // * There is at least one filter of the form
52 // ["uuid","in",[a,b,c,...]] or ["uuid","=",a]
54 // * One or more of the supplied UUIDs (a,b,c,...) has a non-local
57 // * There are no other filters
59 // (If opts doesn't indicate a federation-wide list query, fn is just
60 // called once with the local backend.)
62 // fn is called more than once only if the query meets the following
71 // * there are no filters other than the "uuid = ..." and "uuid in
72 // ..." filters mentioned above.
74 // * The maximum possible response size (total number of objects that
75 // could potentially be matched by all of the specified filters)
76 // exceeds the local cluster's response page size limit.
78 // If the query involves multiple backends but doesn't meet these
79 // restrictions, an error is returned without calling fn.
81 // Thus, the caller can assume that either:
83 // * splitListRequest() returns an error, or
85 // * fn is called exactly once, or
87 // * fn is called more than once, with options that satisfy the above
90 // Each call to fn indicates a single (local or remote) backend and a
91 // corresponding options argument suitable for sending to that
93 func (conn *Conn) splitListRequest(ctx context.Context, opts arvados.ListOptions, fn func(context.Context, string, arvados.API, arvados.ListOptions) ([]string, error)) error {
95 var matchAllFilters map[string]bool
96 for _, f := range opts.Filters {
97 matchThisFilter := map[string]bool{}
102 if f.Operator == "=" {
103 if uuid, ok := f.Operand.(string); ok {
104 matchThisFilter[uuid] = true
106 return httpErrorf(http.StatusBadRequest, "invalid operand type %T for filter %q", f.Operand, f)
108 } else if f.Operator == "in" {
109 if operand, ok := f.Operand.([]interface{}); ok {
110 // skip any elements that aren't
111 // strings (thus can't match a UUID,
112 // thus can't affect the response).
113 for _, v := range operand {
114 if uuid, ok := v.(string); ok {
115 matchThisFilter[uuid] = true
118 } else if strings, ok := f.Operand.([]string); ok {
119 for _, uuid := range strings {
120 matchThisFilter[uuid] = true
123 return httpErrorf(http.StatusBadRequest, "invalid operand type %T in filter %q", f.Operand, f)
130 if matchAllFilters == nil {
131 matchAllFilters = matchThisFilter
133 // Reduce matchAllFilters to the intersection
134 // of matchAllFilters ∩ matchThisFilter.
135 for uuid := range matchAllFilters {
136 if !matchThisFilter[uuid] {
137 delete(matchAllFilters, uuid)
143 // Collate UUIDs in matchAllFilters by remote cluster ID --
144 // e.g., todoByRemote["aaaaa"]["aaaaa-4zz18-000000000000000"]
145 // will be true -- and count the total number of UUIDs we're
146 // filtering on, so we can compare it to our max page size
149 todoByRemote := map[string]map[string]bool{}
150 for uuid := range matchAllFilters {
152 // Cannot match anything, just drop it
154 if todoByRemote[uuid[:5]] == nil {
155 todoByRemote[uuid[:5]] = map[string]bool{}
157 todoByRemote[uuid[:5]][uuid] = true
162 if len(todoByRemote) > 1 {
164 return httpErrorf(http.StatusBadRequest, "cannot execute federated list query with filters other than 'uuid = ...' and 'uuid in [...]'")
166 if opts.Count != "none" {
167 return httpErrorf(http.StatusBadRequest, "cannot execute federated list query unless count==\"none\"")
169 if opts.Limit >= 0 || opts.Offset != 0 || len(opts.Order) > 0 {
170 return httpErrorf(http.StatusBadRequest, "cannot execute federated list query with limit, offset, or order parameter")
172 if max := conn.cluster.API.MaxItemsPerResponse; nUUIDs > max {
173 return httpErrorf(http.StatusBadRequest, "cannot execute federated list query because number of UUIDs (%d) exceeds page size limit %d", nUUIDs, max)
175 selectingUUID := false
176 for _, attr := range opts.Select {
181 if opts.Select != nil && !selectingUUID {
182 return httpErrorf(http.StatusBadRequest, "cannot execute federated list query with a select parameter that does not include uuid")
186 ctx, cancel := context.WithCancel(ctx)
188 errs := make(chan error, len(todoByRemote))
189 for clusterID, todo := range todoByRemote {
190 go func(clusterID string, todo map[string]bool) {
191 // This goroutine sends exactly one value to
193 batch := make([]string, 0, len(todo))
194 for uuid := range todo {
195 batch = append(batch, uuid)
198 var backend arvados.API
199 if clusterID == conn.cluster.ClusterID {
201 } else if backend = conn.remotes[clusterID]; backend == nil {
202 errs <- httpErrorf(http.StatusNotFound, "cannot execute federated list query: no proxy available for cluster %q", clusterID)
207 if len(batch) > len(todo) {
208 // Reduce batch to just the todo's
210 for uuid := range todo {
211 batch = append(batch, uuid)
214 remoteOpts.Filters = []arvados.Filter{{"uuid", "in", batch}}
216 done, err := fn(ctx, clusterID, backend, remoteOpts)
222 for _, uuid := range done {
223 if _, ok := todo[uuid]; ok {
229 errs <- httpErrorf(http.StatusBadGateway, "cannot make progress in federated list query: cluster %q returned none of the requested UUIDs", clusterID)
237 // Wait for all goroutines to return, then return the first
238 // non-nil error, if any.
240 for range todoByRemote {
241 if err := <-errs; err != nil && firstErr == nil {
243 // Signal to any remaining fn() calls that
244 // further effort is futile.
251 func httpErrorf(code int, format string, args ...interface{}) error {
252 return httpserver.ErrorWithStatus(fmt.Errorf(format, args...), code)