Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 1 | // Copyright 2020 The Monogon Project Authors. |
| 2 | // |
| 3 | // SPDX-License-Identifier: Apache-2.0 |
| 4 | // |
| 5 | // Licensed under the Apache License, Version 2.0 (the "License"); |
| 6 | // you may not use this file except in compliance with the License. |
| 7 | // You may obtain a copy of the License at |
| 8 | // |
| 9 | // http://www.apache.org/licenses/LICENSE-2.0 |
| 10 | // |
| 11 | // Unless required by applicable law or agreed to in writing, software |
| 12 | // distributed under the License is distributed on an "AS IS" BASIS, |
| 13 | // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 14 | // See the License for the specific language governing permissions and |
| 15 | // limitations under the License. |
| 16 | |
| 17 | package cluster |
| 18 | |
| 19 | import ( |
| 20 | "context" |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 21 | "encoding/hex" |
| 22 | "fmt" |
| 23 | "net" |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 24 | "strings" |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 25 | |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 26 | "go.etcd.io/etcd/clientv3" |
| 27 | "golang.org/x/sys/unix" |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 28 | "google.golang.org/protobuf/proto" |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 29 | |
Serge Bazanski | 31370b0 | 2021-01-07 16:31:14 +0100 | [diff] [blame] | 30 | "source.monogon.dev/metropolis/node/core/localstorage" |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 31 | "source.monogon.dev/metropolis/pkg/supervisor" |
| 32 | ppb "source.monogon.dev/metropolis/proto/private" |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 33 | ) |
| 34 | |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 35 | // Node is a Metropolis cluster member. A node is a virtual or physical machine |
| 36 | // running Metropolis. This object represents a node only as part of a cluster |
| 37 | // - ie., this object will never be available outside of |
| 38 | // //metropolis/node/core/cluster if the Node is not part of a Cluster. Nodes |
| 39 | // are inherently tied to their long term storage, which is etcd. As such, |
| 40 | // methods on this object relate heavily to the Node's expected lifecycle on |
| 41 | // etcd. |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 42 | type Node struct { |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 43 | // clusterUnlockKey is half of the unlock key required to mount the node's |
| 44 | // data partition. It's stored in etcd, and will only be provided to the |
| 45 | // Node if it can prove its identity via an integrity mechanism (ie. via |
| 46 | // TPM), or when the Node was just created (as the key is generated locally |
| 47 | // by localstorage on first format/mount). The other part of the unlock |
| 48 | // key is the LocalUnlockKey that's present on the node's ESP partition. |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 49 | clusterUnlockKey []byte |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 50 | |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 51 | pubkey []byte |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 52 | |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 53 | state ppb.Node_FSMState |
| 54 | |
| 55 | // A Node can have multiple Roles. Each Role is represented by the presence |
| 56 | // of NodeRole* structures in this structure, with a nil pointer |
| 57 | // representing the lack of a role. |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 58 | consensusMember *NodeRoleConsensusMember |
| 59 | kubernetesWorker *NodeRoleKubernetesWorker |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 60 | |
| 61 | // At runtime, this represents an etcd client to the consensus cluster. This |
| 62 | // is used by applications (like Kubernetes). |
| 63 | KV clientv3.KV |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 64 | } |
| 65 | |
// NodeRoleConsensusMember marks a Node as being a member of the consensus
// (etcd) cluster. It currently carries no data: its presence on a Node is
// what matters.
type NodeRoleConsensusMember struct{}
| 70 | |
// NodeRoleKubernetesWorker marks a Node as one that should be running the
// Kubernetes control and data plane. It currently carries no data: its
// presence on a Node is what matters.
type NodeRoleKubernetesWorker struct{}
| 75 | |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 76 | // ID returns the name of this node, which is `metropolis-{pubkeyHash}`. This |
| 77 | // name should be the primary way to refer to Metropoils nodes within a |
| 78 | // cluster, and is guaranteed to be unique by relying on cryptographic |
| 79 | // randomness. |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 80 | func (n *Node) ID() string { |
Serge Bazanski | 662b5b3 | 2020-12-21 13:49:00 +0100 | [diff] [blame] | 81 | return fmt.Sprintf("metropolis-%s", n.IDBare()) |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 82 | } |
| 83 | |
| 84 | // IDBare returns the `{pubkeyHash}` part of the node ID. |
| 85 | func (n Node) IDBare() string { |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 86 | return hex.EncodeToString(n.pubkey[:16]) |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 87 | } |
| 88 | |
| 89 | func (n *Node) String() string { |
| 90 | return n.ID() |
| 91 | } |
| 92 | |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 93 | // ConsensusMember returns a copy of the NodeRoleConsensusMember struct if the |
| 94 | // Node is a consensus member, otherwise nil. |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 95 | func (n *Node) ConsensusMember() *NodeRoleConsensusMember { |
| 96 | if n.consensusMember == nil { |
| 97 | return nil |
| 98 | } |
| 99 | cm := *n.consensusMember |
| 100 | return &cm |
| 101 | } |
| 102 | |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 103 | // KubernetesWorker returns a copy of the NodeRoleKubernetesWorker struct if |
| 104 | // the Node is a kubernetes worker, otherwise nil. |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 105 | func (n *Node) KubernetesWorker() *NodeRoleKubernetesWorker { |
| 106 | if n.kubernetesWorker == nil { |
| 107 | return nil |
| 108 | } |
| 109 | kw := *n.kubernetesWorker |
| 110 | return &kw |
| 111 | } |
| 112 | |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 113 | // etcdPath builds the etcd path in which this node's protobuf-serialized state |
| 114 | // is stored in etcd. |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 115 | func (n *Node) etcdPath() string { |
| 116 | return fmt.Sprintf("/nodes/%s", n.ID()) |
| 117 | } |
| 118 | |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 119 | // proto serializes the Node object into protobuf, to be used for saving to |
| 120 | // etcd. |
| 121 | func (n *Node) proto() *ppb.Node { |
| 122 | msg := &ppb.Node{ |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 123 | ClusterUnlockKey: n.clusterUnlockKey, |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 124 | PublicKey: n.pubkey, |
| 125 | FsmState: n.state, |
| 126 | Roles: &ppb.Node_Roles{}, |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 127 | } |
| 128 | if n.consensusMember != nil { |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 129 | msg.Roles.ConsensusMember = &ppb.Node_Roles_ConsensusMember{} |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 130 | } |
| 131 | if n.kubernetesWorker != nil { |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 132 | msg.Roles.KubernetesWorker = &ppb.Node_Roles_KubernetesWorker{} |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 133 | } |
| 134 | return msg |
| 135 | } |
| 136 | |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 137 | // Store saves the Node into etcd. This should be called only once per Node |
| 138 | // (ie. when the Node has been created). |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 139 | func (n *Node) Store(ctx context.Context, kv clientv3.KV) error { |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 140 | // Currently the only flow to store a node to etcd is a write-once flow: |
| 141 | // once a node is created, it cannot be deleted or updated. In the future, |
| 142 | // flows to change cluster node roles might be introduced (ie. to promote |
| 143 | // nodes to consensus members, etc). |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 144 | key := n.etcdPath() |
| 145 | msg := n.proto() |
| 146 | nodeRaw, err := proto.Marshal(msg) |
| 147 | if err != nil { |
| 148 | return fmt.Errorf("failed to marshal node: %w", err) |
| 149 | } |
| 150 | |
| 151 | res, err := kv.Txn(ctx).If( |
| 152 | clientv3.Compare(clientv3.CreateRevision(key), "=", 0), |
| 153 | ).Then( |
| 154 | clientv3.OpPut(key, string(nodeRaw)), |
| 155 | ).Commit() |
| 156 | if err != nil { |
| 157 | return fmt.Errorf("failed to store node: %w", err) |
| 158 | } |
| 159 | |
| 160 | if !res.Succeeded { |
| 161 | return fmt.Errorf("attempted to re-register node (unsupported flow)") |
| 162 | } |
| 163 | return nil |
| 164 | } |
| 165 | |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 166 | // MakeConsensusMember turns the node into a consensus member. This only |
| 167 | // configures internal fields, and does not actually start any services. |
| 168 | func (n *Node) MakeConsensusMember() error { |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 169 | if n.consensusMember != nil { |
| 170 | return fmt.Errorf("node already is consensus member") |
| 171 | } |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 172 | n.consensusMember = &NodeRoleConsensusMember{} |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 173 | return nil |
| 174 | } |
| 175 | |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 176 | // MakeKubernetesWorker turns the node into a kubernetes worker. This only |
| 177 | // configures internal fields, and does not actually start any services. |
| 178 | func (n *Node) MakeKubernetesWorker() error { |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 179 | if n.kubernetesWorker != nil { |
| 180 | return fmt.Errorf("node is already kubernetes worker") |
| 181 | } |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 182 | n.kubernetesWorker = &NodeRoleKubernetesWorker{} |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 183 | return nil |
| 184 | } |
| 185 | |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 186 | // ConfigureLocalHostname uses the node's ID as a hostname, and sets the |
| 187 | // current hostname, and local files like hosts and machine-id accordingly. |
| 188 | func (n *Node) ConfigureLocalHostname(ctx context.Context, ephemeral *localstorage.EphemeralDirectory, address net.IP) error { |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 189 | if err := unix.Sethostname([]byte(n.ID())); err != nil { |
| 190 | return fmt.Errorf("failed to set runtime hostname: %w", err) |
| 191 | } |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 192 | hosts := []string{ |
| 193 | "127.0.0.1 localhost", |
| 194 | "::1 localhost", |
| 195 | fmt.Sprintf("%s %s", address.String(), n.ID()), |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 196 | } |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 197 | if err := ephemeral.Hosts.Write([]byte(strings.Join(hosts, "\n")), 0644); err != nil { |
| 198 | return fmt.Errorf("failed to write /ephemeral/hosts: %w", err) |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 199 | } |
Serge Bazanski | 42e61c6 | 2021-03-18 15:07:18 +0100 | [diff] [blame^] | 200 | if err := ephemeral.MachineID.Write([]byte(n.IDBare()), 0644); err != nil { |
| 201 | return fmt.Errorf("failed to write /ephemeral/machine-id: %w", err) |
| 202 | } |
| 203 | |
| 204 | // Check that we are self-resolvable. |
| 205 | ip, err := net.ResolveIPAddr("ip", n.ID()) |
| 206 | if err != nil { |
| 207 | return fmt.Errorf("failed to self-resolve: %w", err) |
| 208 | } |
| 209 | supervisor.Logger(ctx).Infof("This is node %s at %v", n.ID(), ip) |
Serge Bazanski | 1ebd1e1 | 2020-07-13 19:17:16 +0200 | [diff] [blame] | 210 | return nil |
| 211 | } |