Feature: faster healthcheck, fix #283

This commit is contained in:
Quentin McGaw
2020-12-30 19:34:11 +00:00
parent 6f3a074e00
commit 11338b6382
4 changed files with 84 additions and 18 deletions

View File

@@ -118,7 +118,7 @@ ENV VPNSP=pia \
UPDATER_PERIOD=0 UPDATER_PERIOD=0
ENTRYPOINT ["/entrypoint"] ENTRYPOINT ["/entrypoint"]
EXPOSE 8000/tcp 8888/tcp 8388/tcp 8388/udp EXPOSE 8000/tcp 8888/tcp 8388/tcp 8388/udp
HEALTHCHECK --interval=10m --timeout=10s --start-period=30s --retries=2 CMD /entrypoint healthcheck HEALTHCHECK --interval=5s --timeout=5s --start-period=10s --retries=1 CMD /entrypoint healthcheck
RUN apk add -q --progress --no-cache --update openvpn ca-certificates iptables ip6tables unbound tzdata && \ RUN apk add -q --progress --no-cache --update openvpn ca-certificates iptables ip6tables unbound tzdata && \
rm -rf /var/cache/apk/* /etc/unbound/* /usr/sbin/unbound-* && \ rm -rf /var/cache/apk/* /etc/unbound/* /usr/sbin/unbound-* && \
deluser openvpn && \ deluser openvpn && \

View File

@@ -1,21 +1,25 @@
package healthcheck package healthcheck
import ( import (
"net" "errors"
"net/http" "net/http"
"sync"
"github.com/qdm12/golibs/logging" "github.com/qdm12/golibs/logging"
) )
type handler struct { type handler struct {
logger logging.Logger logger logging.Logger
resolver *net.Resolver healthErr error
healthErrMu sync.RWMutex
} }
func newHandler(logger logging.Logger, resolver *net.Resolver) http.Handler { var errHealthcheckNotRunYet = errors.New("healthcheck did not run yet")
func newHandler(logger logging.Logger) *handler {
return &handler{ return &handler{
logger: logger, logger: logger,
resolver: resolver, healthErr: errHealthcheckNotRunYet,
} }
} }
@@ -24,11 +28,22 @@ func (h *handler) ServeHTTP(responseWriter http.ResponseWriter, request *http.Re
http.Error(responseWriter, "method not supported for healthcheck", http.StatusBadRequest) http.Error(responseWriter, "method not supported for healthcheck", http.StatusBadRequest)
return return
} }
err := healthCheck(request.Context(), h.resolver) if err := h.getErr(); err != nil {
if err != nil {
h.logger.Error(err) h.logger.Error(err)
http.Error(responseWriter, err.Error(), http.StatusInternalServerError) http.Error(responseWriter, err.Error(), http.StatusInternalServerError)
return return
} }
responseWriter.WriteHeader(http.StatusOK) responseWriter.WriteHeader(http.StatusOK)
} }
func (h *handler) setErr(err error) {
h.healthErrMu.Lock()
defer h.healthErrMu.Unlock()
h.healthErr = err
}
func (h *handler) getErr() (err error) {
h.healthErrMu.RLock()
defer h.healthErrMu.RUnlock()
return h.healthErr
}

View File

@@ -2,8 +2,46 @@ package healthcheck
import ( import (
"context" "context"
"errors"
"fmt" "fmt"
"net" "net"
"sync"
"time"
)
func (s *server) runHealthcheckLoop(ctx context.Context, wg *sync.WaitGroup) {
defer wg.Done()
for {
err := healthCheck(ctx, s.resolver)
s.handler.setErr(err)
if err != nil { // try again after 1 second
timer := time.NewTimer(time.Second)
select {
case <-ctx.Done():
if !timer.Stop() {
<-timer.C
}
return
case <-timer.C:
}
continue
}
// Success, check again in 10 minutes
const period = 10 * time.Minute
timer := time.NewTimer(period)
select {
case <-ctx.Done():
if !timer.Stop() {
<-timer.C
}
return
case <-timer.C:
}
}
}
var (
errNoIPResolved = errors.New("no IP address resolved")
) )
func healthCheck(ctx context.Context, resolver *net.Resolver) (err error) { func healthCheck(ctx context.Context, resolver *net.Resolver) (err error) {
@@ -12,9 +50,9 @@ func healthCheck(ctx context.Context, resolver *net.Resolver) (err error) {
ips, err := resolver.LookupIP(ctx, "ip", domainToResolve) ips, err := resolver.LookupIP(ctx, "ip", domainToResolve)
switch { switch {
case err != nil: case err != nil:
return fmt.Errorf("cannot resolve github.com: %s", err) return err
case len(ips) == 0: case len(ips) == 0:
return fmt.Errorf("resolved no IP addresses for %s", domainToResolve) return fmt.Errorf("%w for %s", errNoIPResolved, domainToResolve)
default: default:
return nil return nil
} }

View File

@@ -16,26 +16,36 @@ type Server interface {
} }
type server struct { type server struct {
address string address string
logger logging.Logger logger logging.Logger
handler http.Handler handler *handler
resolver *net.Resolver
} }
func NewServer(address string, logger logging.Logger) Server { func NewServer(address string, logger logging.Logger) Server {
healthcheckLogger := logger.WithPrefix("healthcheck: ")
return &server{ return &server{
address: address, address: address,
logger: logger.WithPrefix("healthcheck: "), logger: healthcheckLogger,
handler: newHandler(logger, net.DefaultResolver), handler: newHandler(healthcheckLogger),
resolver: net.DefaultResolver,
} }
} }
func (s *server) Run(ctx context.Context, wg *sync.WaitGroup) { func (s *server) Run(ctx context.Context, wg *sync.WaitGroup) {
defer wg.Done()
internalWg := &sync.WaitGroup{}
internalWg.Add(1)
go s.runHealthcheckLoop(ctx, internalWg)
server := http.Server{ server := http.Server{
Addr: s.address, Addr: s.address,
Handler: s.handler, Handler: s.handler,
} }
internalWg.Add(1)
go func() { go func() {
defer wg.Done() defer internalWg.Done()
<-ctx.Done() <-ctx.Done()
s.logger.Warn("context canceled: shutting down server") s.logger.Warn("context canceled: shutting down server")
defer s.logger.Warn("server shut down") defer s.logger.Warn("server shut down")
@@ -46,9 +56,12 @@ func (s *server) Run(ctx context.Context, wg *sync.WaitGroup) {
s.logger.Error("failed shutting down: %s", err) s.logger.Error("failed shutting down: %s", err)
} }
}() }()
s.logger.Info("listening on %s", s.address) s.logger.Info("listening on %s", s.address)
err := server.ListenAndServe() err := server.ListenAndServe()
if err != nil && !errors.Is(ctx.Err(), context.Canceled) { if err != nil && !errors.Is(ctx.Err(), context.Canceled) {
s.logger.Error(err) s.logger.Error(err)
} }
internalWg.Wait()
} }