X-Git-Url: https://git.arvados.org/arvados.git/blobdiff_plain/f9eb135e4420352198729534f115f233cda8c261..69158dc93fdfec57279ba227f872f3a7c01c4e78:/services/ws/router.go diff --git a/services/ws/router.go b/services/ws/router.go index 685b6132ab..878c282f8a 100644 --- a/services/ws/router.go +++ b/services/ws/router.go @@ -1,47 +1,98 @@ -package main +// Copyright (C) The Arvados Authors. All rights reserved. +// +// SPDX-License-Identifier: AGPL-3.0 + +package ws import ( - "encoding/json" - "fmt" - "log" + "io" "net/http" "sync" + "sync/atomic" + "time" + "git.arvados.org/arvados.git/sdk/go/arvados" + "git.arvados.org/arvados.git/sdk/go/ctxlog" + "git.arvados.org/arvados.git/sdk/go/health" + "github.com/prometheus/client_golang/prometheus" + "github.com/sirupsen/logrus" "golang.org/x/net/websocket" ) +type wsConn interface { + io.ReadWriter + Request() *http.Request + SetReadDeadline(time.Time) error + SetWriteDeadline(time.Time) error +} + type router struct { - Config *Config + client *arvados.Client + cluster *arvados.Cluster + eventSource eventSource + newPermChecker func() permChecker - eventSource eventSource - mux *http.ServeMux - setupOnce sync.Once + handler *handler + mux *http.ServeMux + setupOnce sync.Once + done chan struct{} + reg *prometheus.Registry } func (rtr *router) setup() { + mSockets := prometheus.NewGaugeVec(prometheus.GaugeOpts{ + Namespace: "arvados", + Subsystem: "ws", + Name: "sockets", + Help: "Number of connected sockets", + }, []string{"version"}) + rtr.reg.MustRegister(mSockets) + + rtr.handler = &handler{ + PingTimeout: time.Duration(rtr.cluster.API.SendTimeout), + QueueSize: rtr.cluster.API.WebsocketClientEventQueue, + } rtr.mux = http.NewServeMux() - rtr.mux.Handle("/websocket", rtr.makeServer(&handlerV0{ - PingTimeout: rtr.Config.PingTimeout.Duration(), - QueueSize: rtr.Config.ClientEventQueue, - })) - rtr.mux.Handle("/arvados/v1/events.ws", rtr.makeServer(&handlerV1{ - PingTimeout: rtr.Config.PingTimeout.Duration(), - QueueSize: rtr.Config.ClientEventQueue, - })) + rtr.mux.Handle("/websocket", rtr.makeServer(newSessionV0, mSockets.WithLabelValues("0"))) + rtr.mux.Handle("/arvados/v1/events.ws", rtr.makeServer(newSessionV1, mSockets.WithLabelValues("1"))) + rtr.mux.Handle("/_health/", &health.Handler{ + Token: rtr.cluster.ManagementToken, + Prefix: "/_health/", + Routes: health.Routes{ + "db": rtr.eventSource.DBHealth, + }, + Log: func(r *http.Request, err error) { + if err != nil { + ctxlog.FromContext(r.Context()).WithError(err).Error("error") + } + }, + }) } -func (rtr *router) makeServer(handler handler) *websocket.Server { +func (rtr *router) makeServer(newSession sessionFactory, gauge prometheus.Gauge) *websocket.Server { + var connected int64 return &websocket.Server{ Handshake: func(c *websocket.Config, r *http.Request) error { return nil }, Handler: websocket.Handler(func(ws *websocket.Conn) { - log.Printf("%v accepted", ws.Request().RemoteAddr) - sink := rtr.eventSource.NewSink(nil) - handler.Handle(ws, sink.Channel()) - sink.Stop() + t0 := time.Now() + logger := ctxlog.FromContext(ws.Request().Context()) + atomic.AddInt64(&connected, 1) + gauge.Set(float64(atomic.LoadInt64(&connected))) + + stats := rtr.handler.Handle(ws, logger, rtr.eventSource, + func(ws wsConn, sendq chan<- interface{}) (session, error) { + return newSession(ws, sendq, rtr.eventSource.DB(), rtr.newPermChecker(), rtr.client) + }) + + logger.WithFields(logrus.Fields{ + "elapsed": time.Now().Sub(t0).Seconds(), + "stats": stats, + }).Info("client disconnected") ws.Close() - log.Printf("%v disconnected", ws.Request().RemoteAddr) + atomic.AddInt64(&connected, -1) + gauge.Set(float64(atomic.LoadInt64(&connected))) }), } } @@ -49,11 +100,13 @@ func (rtr *router) makeServer(handler handler) *websocket.Server { func (rtr *router) ServeHTTP(resp http.ResponseWriter, req *http.Request) { rtr.setupOnce.Do(rtr.setup) rtr.mux.ServeHTTP(resp, req) - j, err := json.Marshal(map[string]interface{}{ - "req": fmt.Sprintf("%+v", req), - }) - if err != nil { - log.Fatal(err) - } - log.Print(string(j)) +} + +func (rtr *router) CheckHealth() error { + rtr.setupOnce.Do(rtr.setup) + return rtr.eventSource.DBHealth() +} + +func (rtr *router) Done() <-chan struct{} { + return rtr.done }