// Copyright (C) The Arvados Authors. All rights reserved.
// SPDX-License-Identifier: AGPL-3.0

package controller

import (


	// sqlx needs lib/pq to talk to PostgreSQL
	_ "github.com/lib/pq"

// Handler is the controller's top-level HTTP handler (see
// ServeHTTP). The exported fields are supplied by the caller; the
// unexported fields are populated by setup().
type Handler struct {
	// Cluster is the cluster configuration consulted for API
	// limits, database settings, the management token, etc.
	Cluster           *arvados.Cluster
	// BackgroundContext is passed to federation.New() in setup().
	BackgroundContext context.Context

	// setupOnce is presumably used to run setup() exactly once
	// -- TODO confirm; no use is visible in this part of the
	// file.
	setupOnce      sync.Once
	// federation is the federation.Conn created in setup() and
	// given to the router.
	federation     *federation.Conn
	// handlerStack is the ServeMux built by setup(); all incoming
	// requests are dispatched to it.
	handlerStack   http.Handler
	// proxy performs outgoing requests and forwards their
	// responses (see localClusterRequest and proxyRailsAPI).
	proxy          *proxy
	// secureClient and insecureClient are copies of the arvados
	// package's default clients with redirect-following disabled
	// (see neverRedirect).
	secureClient   *http.Client
	insecureClient *http.Client
	// dbConnector is built from Cluster.PostgreSQL in setup().
	dbConnector    ctrlctx.DBConnector
	// limitLogCreate is used as a counting semaphore by
	// limitLogCreateRequests; its capacity is the concurrency
	// limit, and capacity 0 disables limiting.
	limitLogCreate chan struct{}

	// cache maps a request path to its cached-response entry
	// (consulted by proxyRailsAPI for GET requests).
	cache map[string]*cacheEnt

func (h *Handler) ServeHTTP(w http.ResponseWriter, req *http.Request) {
	if req.Method != "GET" && req.Method != "HEAD" {
		// http.ServeMux returns 301 with a cleaned path if
		// the incoming request has a double slash. Some
		// clients (including the Go standard library) change
		// the request method to GET when following a 301
		// redirect if the original method was not HEAD
		// (RFC7231 6.4.2 specifically allows this in the case
		// of POST). Thus "POST //foo" gets misdirected to
		// "GET /foo". To avoid this, eliminate double slashes
		// before passing the request to ServeMux.
		for strings.Contains(req.URL.Path, "//") {
			req.URL.Path = strings.Replace(req.URL.Path, "//", "/", -1)
	h.handlerStack.ServeHTTP(w, req)

func (h *Handler) CheckHealth() error {
	_, err := h.dbConnector.GetDB(context.TODO())
	if err != nil {
		return err
	_, _, err = railsproxy.FindRailsAPI(h.Cluster)
	if err != nil {
		return err
	if h.Cluster.API.VocabularyPath != "" {
		req, err := http.NewRequest("GET", "/arvados/v1/vocabulary", nil)
		if err != nil {
			return err
		var resp httptest.ResponseRecorder
		h.handlerStack.ServeHTTP(&resp, req)
		if resp.Result().StatusCode != http.StatusOK {
			return fmt.Errorf("%d %s", resp.Result().StatusCode, resp.Result().Status)
	return nil

// Done returns a nil channel. A receive from a nil channel blocks
// forever, so a caller waiting on Done() never observes the handler
// as finished.
func (h *Handler) Done() <-chan struct{} {
	return nil

// neverRedirect is an http.Client CheckRedirect policy that refuses
// to follow redirects. Returning http.ErrUseLastResponse makes the
// client hand the redirect response itself back to the caller
// instead of issuing a follow-up request.
func neverRedirect(_ *http.Request, _ []*http.Request) error {
	return http.ErrUseLastResponse
}

// setup initializes the Handler's unexported fields: the database
// connector, the federation connection, the request router and
// ServeMux (handlerStack), the non-redirecting HTTP clients, the
// log-create limiter, the proxy, and the response cache. It also
// starts the trash sweep and container log sweep workers.
func (h *Handler) setup() {
	mux := http.NewServeMux()
	// healthFuncs is handed to federation.New() by pointer below;
	// whatever it contains afterwards is merged into the
	// /_health/ routes.
	healthFuncs := make(map[string]health.Func)

	h.dbConnector = ctrlctx.DBConnector{PostgreSQL: h.Cluster.PostgreSQL}
	// NOTE(review): the body of the goroutine started here is not
	// visible in this part of the file.
	go func() {
	oidcAuthorizer := localdb.OIDCAccessTokenAuthorizer(h.Cluster, h.dbConnector.GetDB)
	h.federation = federation.New(h.BackgroundContext, h.Cluster, &healthFuncs, h.dbConnector.GetDB)
	rtr := router.New(h.federation, router.Config{
		MaxRequestSize: h.Cluster.API.MaxRequestSize,
		WrapCalls: api.ComposeWrappers(

	// "ping" succeeds if a database handle can be obtained.
	healthRoutes := health.Routes{"ping": func() error { _, err := h.dbConnector.GetDB(context.TODO()); return err }}
	for name, f := range healthFuncs {
		healthRoutes[name] = f
	mux.Handle("/_health/", &health.Handler{
		Token:  h.Cluster.ManagementToken,
		Prefix: "/_health/",
		Routes: healthRoutes,
	// The paths below are handled by the router; everything else
	// falls through to the "/" handler chain built further down.
	mux.Handle("/arvados/v1/config", rtr)
	mux.Handle("/arvados/v1/vocabulary", rtr)
	mux.Handle("/"+arvados.EndpointUserAuthenticate.Path, rtr) // must come before .../users/
	mux.Handle("/arvados/v1/collections", rtr)
	mux.Handle("/arvados/v1/collections/", rtr)
	mux.Handle("/arvados/v1/users", rtr)
	mux.Handle("/arvados/v1/users/", rtr)
	mux.Handle("/arvados/v1/connect/", rtr)
	mux.Handle("/arvados/v1/container_requests", rtr)
	mux.Handle("/arvados/v1/container_requests/", rtr)
	mux.Handle("/arvados/v1/groups", rtr)
	mux.Handle("/arvados/v1/groups/", rtr)
	mux.Handle("/arvados/v1/links", rtr)
	mux.Handle("/arvados/v1/links/", rtr)
	mux.Handle("/arvados/v1/authorized_keys", rtr)
	mux.Handle("/arvados/v1/authorized_keys/", rtr)
	mux.Handle("/login", rtr)
	mux.Handle("/logout", rtr)
	mux.Handle("/arvados/v1/api_client_authorizations", rtr)
	mux.Handle("/arvados/v1/api_client_authorizations/", rtr)

	// The fallback chain is built innermost-first: each prepend()
	// wraps the handler built so far, so the middleware added
	// last (oidcAuthorizer.Middleware) sees a request first and
	// http.NotFoundHandler() is the final fallback.
	// setupProxyRemoteCluster presumably wraps hs the same way --
	// TODO confirm.
	hs := http.NotFoundHandler()
	hs = prepend(hs, h.proxyRailsAPI)
	hs = prepend(hs, h.routeContainerEndpoints(rtr))
	hs = prepend(hs, h.limitLogCreateRequests)
	hs = h.setupProxyRemoteCluster(hs)
	hs = prepend(hs, oidcAuthorizer.Middleware)
	mux.Handle("/", hs)
	h.handlerStack = mux

	// Work on copies of the shared client structs so that
	// setting CheckRedirect does not modify the originals in the
	// arvados package.
	sc := *arvados.DefaultSecureClient
	sc.CheckRedirect = neverRedirect
	h.secureClient = &sc

	ic := *arvados.InsecureHTTPClient
	ic.CheckRedirect = neverRedirect
	h.insecureClient = &ic

	// The int conversion truncates, so a small non-zero fraction
	// could yield 0; in that case allow one request at a time. A
	// limit of 0 (fraction == 0) gives a zero-capacity channel,
	// which limitLogCreateRequests treats as "no limiting".
	logCreateLimit := int(float64(h.Cluster.API.MaxConcurrentRequests) * h.Cluster.API.LogCreateRequestFraction)
	if logCreateLimit == 0 && h.Cluster.API.LogCreateRequestFraction > 0 {
		logCreateLimit = 1
	h.limitLogCreate = make(chan struct{}, logCreateLimit)

	h.proxy = &proxy{
		Name: "arvados-controller",
	// Only the discovery document is cached; its body is checked
	// with validateDiscoveryDoc before being stored.
	h.cache = map[string]*cacheEnt{
		"/discovery/v1/apis/arvados/v1/rest": &cacheEnt{validate: validateDiscoveryDoc},

	go h.trashSweepWorker()
	go h.containerLogSweepWorker()

// middlewareFunc is an HTTP middleware: it receives the response
// writer, the request, and the handler it may delegate to.
type middlewareFunc func(http.ResponseWriter, *http.Request, http.Handler)

// prepend returns an http.Handler that calls middleware for every
// request, passing next as the handler for middleware to delegate
// to.
func prepend(next http.Handler, middleware middlewareFunc) http.Handler {
	return http.HandlerFunc(func(w http.ResponseWriter, req *http.Request) {
		middleware(w, req, next)

// localClusterRequest sends req to the Rails API located by
// railsproxy.FindRailsAPI and returns the upstream response.
//
// The outgoing URL takes its scheme and host from the Rails API URL
// and its path and query from req. Note that req itself is modified:
// its Host field is cleared.
//
// It returns an error if no Rails API URL can be found, or whatever
// error h.proxy.Do returns.
func (h *Handler) localClusterRequest(req *http.Request) (*http.Response, error) {
	urlOut, insecure, err := railsproxy.FindRailsAPI(h.Cluster)
	if err != nil {
		return nil, err
	// Keep only scheme and host of the Rails API URL; path and
	// query come from the incoming request.
	urlOut = &url.URL{
		Scheme:   urlOut.Scheme,
		Host:     urlOut.Host,
		Path:     req.URL.Path,
		RawPath:  req.URL.RawPath,
		RawQuery: req.URL.RawQuery,
	// Use the insecure client when FindRailsAPI says so.
	client := h.secureClient
	if insecure {
		client = h.insecureClient
	// Clearing the Host field here causes the Go http client to
	// use the host part of urlOut as the Host header in the
	// outgoing request, instead of the Host value from the
	// original request we received.
	req.Host = ""
	return h.proxy.Do(req, urlOut, client)

// routeContainerEndpoints returns a middleware that routes
// /arvados/v1/containers/{uuid}/log*, .../ssh, and
// .../gateway_tunnel to rtr, and passes everything else to next.
// (http.ServeMux doesn't let us route these without also routing
// everything under /containers/, which we don't want yet.)
//
// A path matches only if the first occurrence of "/log", "/ssh" or
// "/gateway_tunnel" is exactly 27 bytes after the
// "/arvados/v1/containers/" prefix, i.e. the {uuid} segment must be
// 27 bytes long.
func (h *Handler) routeContainerEndpoints(rtr http.Handler) middlewareFunc {
	return func(w http.ResponseWriter, req *http.Request, next http.Handler) {
		// TrimPrefix returns its input unchanged when the
		// prefix is absent, so trim != req.URL.Path means
		// "path is under /arvados/v1/containers/".
		trim := strings.TrimPrefix(req.URL.Path, "/arvados/v1/containers/")
		if trim != req.URL.Path && (strings.Index(trim, "/log") == 27 ||
			strings.Index(trim, "/ssh") == 27 ||
			strings.Index(trim, "/gateway_tunnel") == 27) {
			rtr.ServeHTTP(w, req)
		} else {
			next.ServeHTTP(w, req)

func (h *Handler) limitLogCreateRequests(w http.ResponseWriter, req *http.Request, next http.Handler) {
	if cap(h.limitLogCreate) > 0 && req.Method == http.MethodPost && strings.HasPrefix(req.URL.Path, "/arvados/v1/logs") {
		select {
		case h.limitLogCreate <- struct{}{}:
			defer func() { <-h.limitLogCreate }()
			next.ServeHTTP(w, req)
			http.Error(w, "Excess log messages", http.StatusServiceUnavailable)
	next.ServeHTTP(w, req)

// cacheEnt implements a basic stale-while-revalidate cache, suitable
// for the Arvados discovery document.
type cacheEnt struct {
	// validate, if non-nil, is called by refresh() on a newly
	// fetched body; a non-nil error means the response is not
	// stored.
	validate     func(body []byte) error
	// mtx presumably guards header, body, expireAfter and
	// refreshAfter (response() and refresh() release it around
	// their accesses) -- TODO confirm.
	mtx          sync.Mutex
	// header and body are the cached response.
	header       http.Header
	body         []byte
	// expireAfter is the time after which response() discards
	// the cached header and body.
	expireAfter  time.Time
	// refreshAfter is the time after which response() reports
	// that a refresh is needed.
	refreshAfter time.Time
	// refreshLock serializes refresh() calls, so that concurrent
	// callers queue up instead of each contacting upstream.
	refreshLock  sync.Mutex

const (
	// cacheTTL is how long after a successful refresh a cached
	// response is served without asking for another refresh.
	cacheTTL    = 5 * time.Minute
	// cacheExpire is how long after a successful refresh a cached
	// response may still be served at all; after that it is
	// discarded.
	cacheExpire = 24 * time.Hour

func (ent *cacheEnt) refresh(path string, do func(*http.Request) (*http.Response, error)) (http.Header, []byte, error) {
	defer ent.refreshLock.Unlock()
	if header, body, needRefresh := ent.response(); !needRefresh {
		// another goroutine refreshed successfully while we
		// were waiting for refreshLock
		return header, body, nil
	} else if body != nil {
		// Cache is present, but expired. We'll try to refresh
		// below. Meanwhile, other refresh() calls will queue
		// up for refreshLock -- and we don't want them to
		// turn into N upstream requests, even if upstream is
		// failing.  (If we succeed we'll update the expiry
		// time again below with the real cacheTTL -- this
		// just takes care of the error case.)
		ent.refreshAfter = time.Now().Add(time.Second)

	ctx, cancel := context.WithDeadline(context.Background(), time.Now().Add(time.Minute))
	defer cancel()
	// "http://localhost" is just a placeholder here -- we'll fill
	// in req.URL.Path below, and then do(), which is
	// localClusterRequest(), will replace the scheme and host
	// parts with the real proxy destination.
	req, err := http.NewRequestWithContext(ctx, http.MethodGet, "http://localhost", nil)
	if err != nil {
		return nil, nil, err
	req.URL.Path = path
	resp, err := do(req)
	if err != nil {
		return nil, nil, err
	if resp.StatusCode != http.StatusOK {
		return nil, nil, fmt.Errorf("HTTP status %d", resp.StatusCode)
	body, err := ioutil.ReadAll(resp.Body)
	if err != nil {
		return nil, nil, fmt.Errorf("Read error: %w", err)
	header := http.Header{}
	for k, v := range resp.Header {
		if !dropHeaders[k] && k != "X-Request-Id" {
			header[k] = v
	if ent.validate != nil {
		if err := ent.validate(body); err != nil {
			return nil, nil, err
	} else if mediatype, _, err := mime.ParseMediaType(header.Get("Content-Type")); err == nil && mediatype == "application/json" {
		if !json.Valid(body) {
			return nil, nil, errors.New("invalid JSON encoding in response")
	defer ent.mtx.Unlock()
	ent.header = header
	ent.body = body
	ent.refreshAfter = time.Now().Add(cacheTTL)
	ent.expireAfter = time.Now().Add(cacheExpire)
	return ent.header, ent.body, nil

func (ent *cacheEnt) response() (http.Header, []byte, bool) {
	defer ent.mtx.Unlock()
	if ent.expireAfter.Before(time.Now()) {
		ent.header, ent.body, ent.refreshAfter = nil, nil, time.Time{}
	return ent.header, ent.body, ent.refreshAfter.Before(time.Now())

func (ent *cacheEnt) ServeHTTP(ctx context.Context, w http.ResponseWriter, path string, do func(*http.Request) (*http.Response, error)) {
	header, body, needRefresh := ent.response()
	if body == nil {
		// need to fetch before we can return anything
		var err error
		header, body, err = ent.refresh(path, do)
		if err != nil {
			http.Error(w, err.Error(), http.StatusBadGateway)
	} else if needRefresh {
		// re-fetch in background
		go func() {
			_, _, err := ent.refresh(path, do)
			if err != nil {
				ctxlog.FromContext(ctx).WithError(err).WithField("path", path).Warn("error refreshing cache")
	for k, v := range header {
		w.Header()[k] = v

func (h *Handler) proxyRailsAPI(w http.ResponseWriter, req *http.Request, next http.Handler) {
	if ent, ok := h.cache[req.URL.Path]; ok && req.Method == http.MethodGet {
		ent.ServeHTTP(req.Context(), w, req.URL.Path, h.localClusterRequest)
	resp, err := h.localClusterRequest(req)
	n, err := h.proxy.ForwardResponse(w, resp, err)
	if err != nil {
		httpserver.Logger(req).WithError(err).WithField("bytesCopied", n).Error("error copying response body")

// Use a localhost entry from Services.RailsAPI.InternalURLs if one is
// present, otherwise choose an arbitrary entry.
func findRailsAPI(cluster *arvados.Cluster) (*url.URL, bool, error) {
	var best *url.URL
	for target := range cluster.Services.RailsAPI.InternalURLs {
		target := url.URL(target)
		best = &target
		if strings.HasPrefix(target.Host, "localhost:") || strings.HasPrefix(target.Host, "") || strings.HasPrefix(target.Host, "[::1]:") {
	if best == nil {
		return nil, false, fmt.Errorf("Services.RailsAPI.InternalURLs is empty")
	return best, cluster.TLS.Insecure, nil

// validateDiscoveryDoc checks that body is a usable discovery
// document: it must decode as JSON into an
// arvados.DiscoveryDocument and have a non-empty BasePath. It
// returns nil if both checks pass, otherwise an error describing
// the failed check.
func validateDiscoveryDoc(body []byte) error {
	var dd arvados.DiscoveryDocument
	err := json.Unmarshal(body, &dd)
	if err != nil {
		return fmt.Errorf("error decoding JSON response: %w", err)
	// A document that decodes but lacks basePath is rejected as
	// well.
	if dd.BasePath == "" {
		return errors.New("error in discovery document: no value for basePath")
	return nil