From ab886917b57b5fa06b802d3578ae26a4e7e62100 Mon Sep 17 00:00:00 2001 From: Nicholas Wiersma Date: Thu, 9 Nov 2023 09:19:49 +0200 Subject: [PATCH] feat: add healthz and server (#101) --- .golangci.yml | 1 + http/handlers.go | 10 +++ http/healthz/healthz.go | 78 ++++++++++++++++ http/healthz/healthz_test.go | 65 ++++++++++++++ http/server.go | 166 ++++++++++++++++++++++++++++++++++- http/server_test.go | 108 +++++++++++++++++++++++ 6 files changed, 426 insertions(+), 2 deletions(-) create mode 100644 http/healthz/healthz.go create mode 100644 http/healthz/healthz_test.go diff --git a/.golangci.yml b/.golangci.yml index 5eb0aed..d639561 100644 --- a/.golangci.yml +++ b/.golangci.yml @@ -33,6 +33,7 @@ linters: - gochecknoinits - goerr113 - gomnd + - ireturn - nlreturn - varnamelen - wrapcheck diff --git a/http/handlers.go b/http/handlers.go index d9388c6..0ce5eb5 100644 --- a/http/handlers.go +++ b/http/handlers.go @@ -3,21 +3,31 @@ package http import "net/http" // OK replies to the request with an HTTP 200 ok reply. +// +// Deprecated: Use healthz instead. func OK(rw http.ResponseWriter, _ *http.Request) { rw.WriteHeader(http.StatusOK) } // OKHandler returns a simple request handler // that replies to each request with a “200 OK” reply. +// +// Deprecated: Use healthz instead. func OKHandler() http.Handler { return http.HandlerFunc(OK) } // DefaultHealthPath is the default HTTP path for checking health. +// +// Deprecated: Use healthz instead. var DefaultHealthPath = "/health" // Health represents an object that can check its health. +// +// Deprecated: Use healthz instead. type Health interface { IsHealthy() error } // NewHealthHandler returns a handler for application health checking. +// +// Deprecated: Use healthz instead. func NewHealthHandler(v ...Health) http.HandlerFunc { return func(rw http.ResponseWriter, r *http.Request) { for _, h := range v { diff --git a/http/healthz/healthz.go b/http/healthz/healthz.go new file mode 100644 index 0000000..44ac7f1 --- /dev/null +++ b/http/healthz/healthz.go @@ -0,0 +1,78 @@ +// Package healthz provides HTTP healthz handling. +package healthz + +import ( + "bytes" + "fmt" + "net/http" +) + +// HealthChecker represents a named health checker. +type HealthChecker interface { + Name() string + Check(*http.Request) error +} + +type healthCheck struct { + name string + check func(*http.Request) error +} + +// NamedCheck returns a named health check. +func NamedCheck(name string, check func(*http.Request) error) HealthChecker { + return &healthCheck{ + name: name, + check: check, + } +} + +func (c healthCheck) Name() string { return c.name } + +func (c healthCheck) Check(req *http.Request) error { return c.check(req) } + +// PingHealth returns true when called. +var PingHealth HealthChecker = ping{} + +type ping struct{} + +func (c ping) Name() string { return "ping" } + +func (c ping) Check(_ *http.Request) error { return nil } + +// Handler returns an HTTP check handler. +func Handler(name string, errFn func(string), checks ...HealthChecker) http.Handler { + return http.HandlerFunc(func(rw http.ResponseWriter, req *http.Request) { + var ( + checkOutput bytes.Buffer + failedChecks []string + failedLogOutput bytes.Buffer + ) + for _, check := range checks { + if err := check.Check(req); err != nil { + _, _ = fmt.Fprintf(&checkOutput, "- %s failed\n", check.Name()) + _, _ = fmt.Fprintf(&failedLogOutput, "%s failed: %v\n", check.Name(), err) + failedChecks = append(failedChecks, check.Name()) + continue + } + + _, _ = fmt.Fprintf(&checkOutput, "+ %s ok\n", check.Name()) + } + + if len(failedChecks) > 0 { + errFn(failedLogOutput.String()) + http.Error(rw, + fmt.Sprintf("%s%s check failed", checkOutput.String(), name), + http.StatusInternalServerError, + ) + return + } + + if _, found := req.URL.Query()["verbose"]; !found { + _, _ = fmt.Fprint(rw, "ok") + return + } + + _, _ = checkOutput.WriteTo(rw) + _, _ = fmt.Fprintf(rw, "%s check passed", name) + }) +} diff --git a/http/healthz/healthz_test.go b/http/healthz/healthz_test.go new file mode 100644 index 0000000..783eb28 --- /dev/null +++ b/http/healthz/healthz_test.go @@ -0,0 +1,65 @@ +package healthz_test + +import ( + "errors" + "net/http" + "net/http/httptest" + "testing" + + "github.com/hamba/pkg/v2/http/healthz" + "github.com/stretchr/testify/assert" +) + +func TestHandler(t *testing.T) { + goodCheck := healthz.NamedCheck("good", func(*http.Request) error { return nil }) + + var gotOutput string + h := healthz.Handler("readyz", func(output string) { + gotOutput = output + }, goodCheck) + + req := httptest.NewRequest(http.MethodGet, "/readyz", nil) + rec := httptest.NewRecorder() + + h.ServeHTTP(rec, req) + + assert.Equal(t, http.StatusOK, rec.Code) + assert.Equal(t, "", gotOutput) + assert.Equal(t, `ok`, rec.Body.String()) +} +func TestHandler_Verbose(t *testing.T) { + goodCheck := healthz.NamedCheck("good", func(*http.Request) error { return nil }) + + var gotOutput string + h := healthz.Handler("readyz", func(output string) { + gotOutput = output + }, goodCheck) + + req := httptest.NewRequest(http.MethodGet, "/readyz?verbose=1", nil) + rec := httptest.NewRecorder() + + h.ServeHTTP(rec, req) + + assert.Equal(t, http.StatusOK, rec.Code) + assert.Equal(t, "", gotOutput) + assert.Equal(t, "+ good ok\nreadyz check passed", rec.Body.String()) +} + +func TestHandler_WithFailingChecks(t *testing.T) { + goodCheck := healthz.NamedCheck("good", func(*http.Request) error { return nil }) + badCheck := healthz.NamedCheck("bad", func(*http.Request) error { return errors.New("test error") }) + + var gotOutput string + h := healthz.Handler("readyz", func(output string) { + gotOutput = output + }, goodCheck, badCheck) + + req := httptest.NewRequest(http.MethodGet, "/readyz", nil) + rec := httptest.NewRecorder() + + h.ServeHTTP(rec, req) + + assert.Equal(t, http.StatusInternalServerError, rec.Code) + assert.Equal(t, "bad failed: test error\n", gotOutput) + assert.Equal(t, "+ good ok\n- bad failed\nreadyz check failed\n", rec.Body.String()) +} diff --git a/http/server.go b/http/server.go index 21fef3b..32d5232 100644 --- a/http/server.go +++ b/http/server.go @@ -4,10 +4,18 @@ import ( "context" "crypto/tls" "errors" + "fmt" "net" "net/http" + "strings" + "sync" "time" + "github.com/hamba/logger/v2" + lctx "github.com/hamba/logger/v2/ctx" + "github.com/hamba/pkg/v2/http/healthz" + "github.com/hamba/pkg/v2/http/middleware" + "github.com/hamba/statter/v2" "golang.org/x/net/http2" "golang.org/x/net/http2/h2c" ) @@ -42,7 +50,6 @@ func WithH2C() SrvOptFunc { h2s := &http2.Server{ IdleTimeout: 120 * time.Second, } - srv.Handler = h2c.NewHandler(srv.Handler, h2s) } } @@ -53,7 +60,7 @@ type Server struct { srv *http.Server } -// NewServer returns a server. +// NewServer returns a server with the base context ctx. func NewServer(ctx context.Context, addr string, h http.Handler, opts ...SrvOptFunc) *Server { srv := &http.Server{ BaseContext: func(_ net.Listener) context.Context { @@ -97,3 +104,158 @@ func (s *Server) Shutdown(timeout time.Duration) error { func (s *Server) Close() error { return s.srv.Close() } + +// HealthServerConfig configures a HealthServer. +type HealthServerConfig struct { + Addr string + Handler http.Handler + Stats *statter.Statter + Log *logger.Logger +} + +// HealthServer is an HTTP server with healthz capabilities. +type HealthServer struct { + srv *Server + + shudownCh chan struct{} + + readyzMu sync.Mutex + readyzInstalled bool + readyzChecks []healthz.HealthChecker + + livezMu sync.Mutex + livezInstalled bool + livezChecks []healthz.HealthChecker + + stats *statter.Statter + log *logger.Logger +} + +// NewHealthServer returns an HTTP server with healthz capabilities. +func NewHealthServer(ctx context.Context, cfg HealthServerConfig, opts ...SrvOptFunc) *HealthServer { + srv := NewServer(ctx, cfg.Addr, cfg.Handler, opts...) + + return &HealthServer{ + srv: srv, + shudownCh: make(chan struct{}), + stats: cfg.Stats, + log: cfg.Log, + } +} + +// AddHealthzChecks adds health checks to both readyz and livez. +func (s *HealthServer) AddHealthzChecks(checks ...healthz.HealthChecker) error { + if err := s.AddReadyzChecks(checks...); err != nil { + return err + } + return s.AddLivezChecks(checks...) +} + +// AddReadyzChecks adds health checks to readyz. +func (s *HealthServer) AddReadyzChecks(checks ...healthz.HealthChecker) error { + s.readyzMu.Lock() + defer s.readyzMu.Unlock() + if s.readyzInstalled { + return errors.New("could not add checks as readyz has already been installed") + } + s.readyzChecks = append(s.readyzChecks, checks...) + return nil +} + +// AddLivezChecks adds health checks to livez. +func (s *HealthServer) AddLivezChecks(checks ...healthz.HealthChecker) error { + s.livezMu.Lock() + defer s.livezMu.Unlock() + if s.livezInstalled { + return errors.New("could not add checks as livez has already been installed") + } + s.livezChecks = append(s.livezChecks, checks...) + return nil +} + +// Serve installs the health checks and starts the server in a non-blocking way. +func (s *HealthServer) Serve(errFn func(error)) { + s.installChecks() + + s.srv.Serve(errFn) +} + +func (s *HealthServer) installChecks() { + mux := http.NewServeMux() + s.installLivezChecks(mux) + + // When shutdown is started, the readyz check should start failing. + if err := s.AddReadyzChecks(shutdownCheck{ch: s.shudownCh}); err != nil { + s.log.Error("Could not install readyz shutdown check", lctx.Err(err)) + } + s.installReadyzChecks(mux) + + mux.Handle("/", s.srv.srv.Handler) + s.srv.srv.Handler = mux +} + +func (s *HealthServer) installReadyzChecks(mux *http.ServeMux) { + s.readyzMu.Lock() + defer s.readyzMu.Unlock() + s.readyzInstalled = true + s.installCheckers(mux, "/readyz", s.readyzChecks) +} + +func (s *HealthServer) installLivezChecks(mux *http.ServeMux) { + s.livezMu.Lock() + defer s.livezMu.Unlock() + s.livezInstalled = true + s.installCheckers(mux, "/livez", s.livezChecks) +} + +func (s *HealthServer) installCheckers(mux *http.ServeMux, path string, checks []healthz.HealthChecker) { + if len(checks) == 0 { + checks = []healthz.HealthChecker{healthz.PingHealth} + } + + s.log.Info("Installing health checkers", + lctx.Str("path", path), + lctx.Str("checks", strings.Join(checkNames(checks), ",")), + ) + + name := strings.TrimPrefix(path, "/") + h := healthz.Handler(name, func(output string) { + s.log.Info(fmt.Sprintf("%s check failed\n%s", name, output)) + }, checks...) + mux.Handle(path, middleware.WithStats(name, s.stats, h)) +} + +// Shutdown attempts to close all server connections. +func (s *HealthServer) Shutdown(timeout time.Duration) error { + close(s.shudownCh) + + return s.srv.Shutdown(timeout) +} + +// Close closes the server. +func (s *HealthServer) Close() error { + return s.srv.Close() +} + +func checkNames(checks []healthz.HealthChecker) []string { + names := make([]string, len(checks)) + for i, check := range checks { + names[i] = check.Name() + } + return names +} + +type shutdownCheck struct { + ch <-chan struct{} +} + +func (s shutdownCheck) Name() string { return "shutdown" } + +func (s shutdownCheck) Check(*http.Request) error { + select { + case <-s.ch: + return errors.New("server is shutting down") + default: + return nil + } +} diff --git a/http/server_test.go b/http/server_test.go index 3c4d2a8..9b92f54 100644 --- a/http/server_test.go +++ b/http/server_test.go @@ -6,10 +6,14 @@ import ( "io" "net" "net/http" + "sync" "testing" "time" + "github.com/hamba/logger/v2" httpx "github.com/hamba/pkg/v2/http" + "github.com/hamba/pkg/v2/http/healthz" + "github.com/hamba/statter/v2" "github.com/stretchr/testify/assert" "github.com/stretchr/testify/require" "golang.org/x/net/http2" @@ -80,3 +84,107 @@ func TestServer_WithH2C(t *testing.T) { assert.Equal(t, res.StatusCode, http.StatusOK) assert.True(t, handlerCalled) } + +func TestHealthServer(t *testing.T) { + stats := statter.New(statter.DiscardReporter, time.Minute) + log := logger.New(io.Discard, logger.LogfmtFormat(), logger.Error) + + check := healthz.NamedCheck("test", func(*http.Request) error { + return nil + }) + + srv := httpx.NewHealthServer(context.Background(), httpx.HealthServerConfig{ + Addr: ":16543", + Handler: http.HandlerFunc(func(http.ResponseWriter, *http.Request) {}), + Stats: stats, + Log: log, + }) + err := srv.AddHealthzChecks(check) + require.NoError(t, err) + srv.Serve(func(err error) { + require.NoError(t, err) + }) + t.Cleanup(func() { + _ = srv.Close() + }) + + statusCode, body := requireDoRequest(t, "http://localhost:16543/readyz?verbose=1") + assert.Equal(t, statusCode, http.StatusOK) + want := `+ test ok ++ shutdown ok +readyz check passed` + assert.Equal(t, want, body) + + statusCode, body = requireDoRequest(t, "http://localhost:16543/livez?verbose=1") + assert.Equal(t, statusCode, http.StatusOK) + want = `+ test ok +livez check passed` + assert.Equal(t, want, body) +} + +func TestHealthServer_ShutdownCausesReadyzCheckToFail(t *testing.T) { + stats := statter.New(statter.DiscardReporter, time.Minute) + log := logger.New(io.Discard, logger.LogfmtFormat(), logger.Error) + + calledCh := make(chan struct{}) + check := healthz.NamedCheck("test", func(*http.Request) error { + close(calledCh) + time.Sleep(time.Millisecond) + return nil + }) + + srv := httpx.NewHealthServer(context.Background(), httpx.HealthServerConfig{ + Addr: ":16543", + Handler: http.HandlerFunc(func(http.ResponseWriter, *http.Request) {}), + Stats: stats, + Log: log, + }) + err := srv.AddHealthzChecks(check) + require.NoError(t, err) + srv.Serve(func(err error) { + require.NoError(t, err) + }) + t.Cleanup(func() { + _ = srv.Close() + }) + + var wg sync.WaitGroup + wg.Add(1) + go func() { + defer wg.Done() + + <-calledCh + + err = srv.Shutdown(time.Second) + require.NoError(t, err) + }() + + statusCode, body := requireDoRequest(t, "http://localhost:16543/readyz?verbose=1") + assert.Equal(t, statusCode, http.StatusInternalServerError) + want := `+ test ok +- shutdown failed +readyz check failed +` + assert.Equal(t, want, body) + + wg.Wait() +} + +func requireDoRequest(t *testing.T, path string) (int, string) { + t.Helper() + + req, err := http.NewRequest(http.MethodGet, path, nil) + require.NoError(t, err) + + resp, err := http.DefaultClient.Do(req) + require.NoError(t, err) + defer func() { + _, _ = io.Copy(io.Discard, resp.Body) + _ = resp.Body.Close() + }() + + b, err := io.ReadAll(resp.Body) + require.NoError(t, err) + + return resp.StatusCode, string(b) +}