| Tim Windelschmidt | 6d33a43 | 2025-02-04 14:34:25 +0100 | [diff] [blame] | 1 | // Copyright The Monogon Project Authors. |
| 2 | // SPDX-License-Identifier: Apache-2.0 |
| 3 | |
| Tim Windelschmidt | f64f197 | 2023-07-28 00:00:50 +0000 | [diff] [blame] | 4 | package metrics |
| 5 | |
| 6 | import ( |
| 7 | "context" |
| 8 | "encoding/json" |
| 9 | "fmt" |
| 10 | "net/http" |
| 11 | "sync" |
| 12 | |
| Serge Bazanski | 60461b2 | 2023-10-26 19:16:59 +0200 | [diff] [blame] | 13 | "source.monogon.dev/go/types/mapsets" |
| 14 | "source.monogon.dev/metropolis/node/core/curator/watcher" |
| Tim Windelschmidt | 9f21f53 | 2024-05-07 15:14:20 +0200 | [diff] [blame] | 15 | "source.monogon.dev/osbase/supervisor" |
| Serge Bazanski | 60461b2 | 2023-10-26 19:16:59 +0200 | [diff] [blame] | 16 | |
| 17 | ipb "source.monogon.dev/metropolis/node/core/curator/proto/api" |
| Tim Windelschmidt | f64f197 | 2023-07-28 00:00:50 +0000 | [diff] [blame] | 18 | ) |
| 19 | |
| 20 | type Discovery struct { |
| 21 | Curator ipb.CuratorClient |
| 22 | |
| 23 | // sdResp will contain the cached sdResponse |
| Serge Bazanski | 60461b2 | 2023-10-26 19:16:59 +0200 | [diff] [blame] | 24 | sdResp mapsets.OrderedMap[string, sdTarget] |
| Tim Windelschmidt | f64f197 | 2023-07-28 00:00:50 +0000 | [diff] [blame] | 25 | // sdRespMtx is the mutex for sdResp to allow usage inside the http handler. |
| 26 | sdRespMtx sync.RWMutex |
| 27 | } |
| 28 | |
| Tim Windelschmidt | f64f197 | 2023-07-28 00:00:50 +0000 | [diff] [blame] | 29 | type sdTarget struct { |
| 30 | Targets []string `json:"targets"` |
| 31 | Labels map[string]string `json:"labels"` |
| 32 | } |
| 33 | |
| 34 | // Run is the sub-runnable responsible for fetching and serving node updates. |
| 35 | func (s *Discovery) Run(ctx context.Context) error { |
| 36 | supervisor.Signal(ctx, supervisor.SignalHealthy) |
| 37 | |
| Tim Windelschmidt | f64f197 | 2023-07-28 00:00:50 +0000 | [diff] [blame] | 38 | defer func() { |
| 39 | s.sdRespMtx.Lock() |
| 40 | // disable the metrics endpoint until the new routine takes over |
| Serge Bazanski | 60461b2 | 2023-10-26 19:16:59 +0200 | [diff] [blame] | 41 | s.sdResp.Clear() |
| Tim Windelschmidt | f64f197 | 2023-07-28 00:00:50 +0000 | [diff] [blame] | 42 | s.sdRespMtx.Unlock() |
| 43 | }() |
| 44 | |
| Serge Bazanski | 60461b2 | 2023-10-26 19:16:59 +0200 | [diff] [blame] | 45 | return watcher.WatchNodes(ctx, s.Curator, watcher.SimpleFollower{ |
| 46 | FilterFn: func(a *ipb.Node) bool { |
| 47 | if a.Status == nil { |
| 48 | return false |
| Tim Windelschmidt | f64f197 | 2023-07-28 00:00:50 +0000 | [diff] [blame] | 49 | } |
| Serge Bazanski | 60461b2 | 2023-10-26 19:16:59 +0200 | [diff] [blame] | 50 | if a.Status.ExternalAddress == "" { |
| 51 | return false |
| Tim Windelschmidt | f64f197 | 2023-07-28 00:00:50 +0000 | [diff] [blame] | 52 | } |
| Serge Bazanski | 60461b2 | 2023-10-26 19:16:59 +0200 | [diff] [blame] | 53 | if a.Roles == nil { |
| 54 | return false |
| Tim Windelschmidt | f64f197 | 2023-07-28 00:00:50 +0000 | [diff] [blame] | 55 | } |
| Serge Bazanski | 60461b2 | 2023-10-26 19:16:59 +0200 | [diff] [blame] | 56 | return true |
| 57 | }, |
| 58 | EqualsFn: func(a *ipb.Node, b *ipb.Node) bool { |
| 59 | if (a.Roles.ConsensusMember == nil) != (b.Roles.ConsensusMember == nil) { |
| 60 | return false |
| 61 | } |
| 62 | if (a.Roles.KubernetesController == nil) != (b.Roles.KubernetesController == nil) { |
| 63 | return false |
| 64 | } |
| 65 | if (a.Roles.ConsensusMember == nil) != (b.Roles.ConsensusMember == nil) { |
| 66 | return false |
| 67 | } |
| 68 | if a.Status.ExternalAddress != b.Status.ExternalAddress { |
| 69 | return false |
| 70 | } |
| 71 | return true |
| 72 | }, |
| 73 | OnNewUpdated: func(new *ipb.Node) error { |
| 74 | s.sdRespMtx.Lock() |
| 75 | defer s.sdRespMtx.Unlock() |
| Tim Windelschmidt | f64f197 | 2023-07-28 00:00:50 +0000 | [diff] [blame] | 76 | |
| Serge Bazanski | 60461b2 | 2023-10-26 19:16:59 +0200 | [diff] [blame] | 77 | s.sdResp.Insert(new.Id, sdTarget{ |
| 78 | Targets: []string{new.Status.ExternalAddress}, |
| Tim Windelschmidt | f64f197 | 2023-07-28 00:00:50 +0000 | [diff] [blame] | 79 | Labels: map[string]string{ |
| Serge Bazanski | 60461b2 | 2023-10-26 19:16:59 +0200 | [diff] [blame] | 80 | "__meta_metropolis_role_kubernetes_worker": fmt.Sprintf("%t", new.Roles.KubernetesWorker != nil), |
| 81 | "__meta_metropolis_role_kubernetes_controller": fmt.Sprintf("%t", new.Roles.KubernetesController != nil), |
| 82 | "__meta_metropolis_role_consensus_member": fmt.Sprintf("%t", new.Roles.ConsensusMember != nil), |
| Lorenz Brun | eb2520f | 2023-11-19 07:04:15 +0100 | [diff] [blame] | 83 | "__meta_metropolis_node": new.Id, |
| Tim Windelschmidt | f64f197 | 2023-07-28 00:00:50 +0000 | [diff] [blame] | 84 | }, |
| 85 | }) |
| Serge Bazanski | 60461b2 | 2023-10-26 19:16:59 +0200 | [diff] [blame] | 86 | return nil |
| 87 | }, |
| 88 | OnDeleted: func(prev *ipb.Node) error { |
| 89 | s.sdRespMtx.Lock() |
| 90 | defer s.sdRespMtx.Unlock() |
| Tim Windelschmidt | f64f197 | 2023-07-28 00:00:50 +0000 | [diff] [blame] | 91 | |
| Serge Bazanski | 60461b2 | 2023-10-26 19:16:59 +0200 | [diff] [blame] | 92 | s.sdResp.Delete(prev.Id) |
| 93 | return nil |
| 94 | }, |
| 95 | }) |
| Tim Windelschmidt | f64f197 | 2023-07-28 00:00:50 +0000 | [diff] [blame] | 96 | } |
| 97 | |
| 98 | func (s *Discovery) ServeHTTP(w http.ResponseWriter, r *http.Request) { |
| 99 | if r.Method != http.MethodGet { |
| 100 | http.Error(w, fmt.Sprintf("method %q not allowed", r.Method), http.StatusMethodNotAllowed) |
| 101 | return |
| 102 | } |
| 103 | |
| 104 | s.sdRespMtx.RLock() |
| 105 | defer s.sdRespMtx.RUnlock() |
| 106 | |
| Serge Bazanski | 60461b2 | 2023-10-26 19:16:59 +0200 | [diff] [blame] | 107 | // If sdResp is empty, respond with Service Unavailable. This will only happen |
| 108 | // early enough in the lifecycle of a control plane node that it doesn't know |
| 109 | // about itself, or if this is not a control plane node: |
| 110 | if s.sdResp.Count() == 0 { |
| Tim Windelschmidt | f64f197 | 2023-07-28 00:00:50 +0000 | [diff] [blame] | 111 | w.WriteHeader(http.StatusServiceUnavailable) |
| 112 | return |
| 113 | } |
| 114 | |
| 115 | w.Header().Set("Content-Type", "application/json") |
| 116 | w.WriteHeader(http.StatusOK) |
| 117 | |
| Serge Bazanski | 60461b2 | 2023-10-26 19:16:59 +0200 | [diff] [blame] | 118 | // Turn into a plain array as expected by the service discovery API. |
| 119 | var res []sdTarget |
| 120 | for _, v := range s.sdResp.Values() { |
| 121 | res = append(res, v.Value) |
| 122 | } |
| 123 | if err := json.NewEncoder(w).Encode(res); err != nil { |
| Tim Windelschmidt | f64f197 | 2023-07-28 00:00:50 +0000 | [diff] [blame] | 124 | // If the encoder fails its mostly because of closed connections |
| 125 | // so lets just ignore these errors. |
| 126 | return |
| 127 | } |
| 128 | } |