harness-drone/cmd/drone-agent/health.go

132 lines
2.7 KiB
Go
Raw Normal View History

2017-09-12 18:25:55 +00:00
package main
import (
"encoding/json"
"fmt"
2017-09-12 20:40:24 +00:00
"io"
2017-09-12 18:25:55 +00:00
"net/http"
2017-09-12 20:40:24 +00:00
"sync"
"time"
2017-09-12 18:25:55 +00:00
"github.com/drone/drone/version"
"github.com/urfave/cli"
)
// the file implements some basic healthcheck logic based on the
// following specification:
// https://github.com/mozilla-services/Dockerflow
func init() {
2017-09-12 20:40:24 +00:00
http.HandleFunc("/varz", handleStats)
http.HandleFunc("/healthz", handleHeartbeat)
http.HandleFunc("/version", handleVersion)
2017-09-12 18:25:55 +00:00
}
func handleHeartbeat(w http.ResponseWriter, r *http.Request) {
2017-09-12 20:40:24 +00:00
if counter.Healthy() {
w.WriteHeader(200)
} else {
w.WriteHeader(500)
}
2017-09-12 18:25:55 +00:00
}
func handleVersion(w http.ResponseWriter, r *http.Request) {
w.WriteHeader(200)
w.Header().Add("Content-Type", "text/json")
json.NewEncoder(w).Encode(versionResp{
Source: "https://github.com/drone/drone",
Version: version.Version.String(),
})
}
2017-09-12 20:40:24 +00:00
func handleStats(w http.ResponseWriter, r *http.Request) {
if counter.Healthy() {
w.WriteHeader(200)
} else {
w.WriteHeader(500)
}
w.Header().Add("Content-Type", "text/json")
counter.writeTo(w)
}
2017-09-12 18:25:55 +00:00
type versionResp struct {
Version string `json:"version"`
Source string `json:"source"`
}
2017-09-12 20:40:24 +00:00
// default statistics counter
var counter = &state{
Metadata: map[string]info{},
}
type state struct {
sync.Mutex `json:"-"`
Polling int `json:"polling_count"`
Running int `json:"running_count"`
Metadata map[string]info `json:"running"`
}
type info struct {
ID string `json:"id"`
Repo string `json:"repository"`
Build string `json:"build_number"`
Started time.Time `json:"build_started"`
Timeout time.Duration `json:"build_timeout"`
}
func (s *state) Add(id string, timeout time.Duration, repo, build string) {
s.Lock()
s.Polling--
s.Running++
s.Metadata[id] = info{
ID: id,
Repo: repo,
Build: build,
Timeout: timeout,
Started: time.Now().UTC(),
}
s.Unlock()
}
func (s *state) Done(id string) {
s.Lock()
s.Polling++
s.Running--
delete(s.Metadata, id)
s.Unlock()
}
func (s *state) Healthy() bool {
s.Lock()
defer s.Unlock()
now := time.Now()
buf := time.Hour // 1 hour buffer
for _, item := range s.Metadata {
if now.After(item.Started.Add(item.Timeout).Add(buf)) {
return false
}
}
return true
}
func (s *state) writeTo(w io.Writer) (int, error) {
s.Lock()
out, _ := json.Marshal(s)
s.Unlock()
return w.Write(out)
}
2017-09-12 18:25:55 +00:00
// handles pinging the endpoint and returns an error if the
// agent is in an unhealthy state.
func pinger(c *cli.Context) error {
2017-09-12 20:40:24 +00:00
resp, err := http.Get("http://localhost:3000/healthz")
2017-09-12 18:25:55 +00:00
if err != nil {
return err
}
defer resp.Body.Close()
if resp.StatusCode != 200 {
return fmt.Errorf("agent returned non-200 status code")
}
return nil
}