metropolis/proto/common/common.proto - monogon - Gitiles

 // Copyright 2020 The Monogon Project Authors.
 //
 // SPDX-License-Identifier: Apache-2.0
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //     http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 // See the License for the specific language governing permissions and
 // limitations under the License.

 syntax = "proto3";
 package metropolis.proto.common;
 option go_package = "source.monogon.dev/metropolis/proto/common";

 import "google/protobuf/timestamp.proto";

 // NodeRoles are the possible roles that a Metropolis Node should run within the
 // cluster. These are configured by the cluster and can be retrieved through the
 // Curator.
 //
 // Fields contained within each individual are publicly available, so while they
 // can be used to carry required data to start up services for a given role,
 // this must not be confidential/private data.
 message NodeRoles {
     message KubernetesController {
     }
     message KubernetesWorker {
     }
     message ConsensusMember {
         // ca_certificate is a DER-encoded x509 certificate of the etcd
         // cluster's CA. The member must use this certificate to verify the
         // identity of the cluster it's connecting to.
         bytes ca_certificate = 1;
         // pper_certificate is a DER-encoded x509 certificate of this node's
         // etcd peer listener. The member must serve member traffic using this
         // certificate. The private key corresponding to this certificate is
         // the same as the node's primary private keypair.
         bytes peer_certificate = 2;
         // initial_crl is a certificate revocation list that the etcd member
         // should be started with. After startup, the member will maintain its
         // own CRL by updating it from its primary storage location, and etcd
         // value.
         //
         // TODO(q3k): don't pass this here, instead pass this over an etcd
         // watcher and curator.Watch.
         bytes initial_crl = 3;
         message Peer {
             string Name = 1;
             string URL = 2;
         }
         repeated Peer peers = 4;
     }
     KubernetesWorker kubernetes_worker = 1;
     ConsensusMember consensus_member = 2;
     KubernetesController kubernetes_controller = 3;
 }

 // NodeState is the state of a Metropolis node from the point of view of the
 // cluster it is a part of (or intending to be a part of).
 enum NodeState {
     NODE_STATE_INVALID = 0;

     // NEW: the node has established a first contact with the cluster and
     // intends to register into it. The node's identity has not been verified
     // and no hardware attestation of the new node was performed.
     // The node has generated a CUK/NUK and set up storage encrypted with the
     // combination of both keys.
     // The node has generated a private/public keypair, and that keypair has
     // been used to contact the already running Cluster.
     NODE_STATE_NEW = 1;
     // STANDBY: the node has successfully passed identity and hardware
     // attestation checks as defined by the cluster policy. The node still isn't
     // part of the cluster, as it itself might perform checks against the
     // running Cluster.
     NODE_STATE_STANDBY = 2;
     // UP: the node has passed all preconditions for STANDBY and has also
     // performed a commit into the cluster by exchanging its CUK for a
     // certificate issued by the cluster.
     // The node is now ready to serve, and its certificate can be used to
     // authenticate its identity cryptographically.
     NODE_STATE_UP = 3;
     // DISOWNED: the node has been rejected or decommissioned by the cluster.
     // Any further contact from the node to the cluster will be rejected.
     NODE_STATE_DISOWNED = 4;
 };

 // ClusterState is the state of the cluster from the point of view of a node.
 // Different subsystems can watch this state and depend on it for behaviour
 // (eg. start serving when HOME, maybe self-fence on SPLIT, etc.).
 enum ClusterState {
     CLUSTER_STATE_INVALID = 0;

     // UNKNOWN: the node has not yet determined the existence of a cluster it
     // should join or start. This is a transient, initial state that should only
     // manifest during boot.
     CLUSTER_STATE_UNKNOWN = 1;
     // FOREIGN: the node is attempting to register into an already existing
     // cluster with which it managed to make preliminary contact, but which the
     // cluster has not yet fully productionized (eg. the node is still being
     // hardware attested, or the operator needs to confirm the
     // registration of this node).
     CLUSTER_STATE_FOREIGN = 2;
     // TRUSTED: the node is attempting to register into an already registered
     // cluster, and has been trusted by it. The node is now attempting to fully
     // commit to registering into the cluster.
     CLUSTER_STATE_TRUSTED = 3;
     // HOME: the node is part of this cluster. This is the bulk of time in which
     // this node will spend its time.
     CLUSTER_STATE_HOME = 4;
     // DISOWNING: the node has been disowned (ie., removed) by the cluster, and
     // that it will not be ever part of any cluster again, and  that it will be
     // decommissioned by the operator.
     CLUSTER_STATE_DISOWNING = 5;
     // SPLIT:the node would usually be Home in a cluster, but has been split
     // from the consensus of the cluster. This can happen for nodes running
     // consensus when consensus is lost (eg. when there is no quorum or this
     // node has been netsplit), and for other nodes if they have lost network
     // connectivity to the consensus nodes. Clients should make their own
     // decision what action to perform in this state, depending on the level of
     // consistency required and whether it makes sense for the node to fence its
     // services off.
     CLUSTER_STATE_SPLIT = 6;
 }

 // NodeStatus contains all fields self-reported by nodes. This data is
 // inherently less trusted than other data available about a node, as it can be
 // updated to any value by each node individually, including compromised nodes.
 message NodeStatus {
     // external_address is the IP address that the node expects management,
     // cluster and user traffic to arrive at (ie. the address on which it is
     // listening for gRPC, and role-specific services like etcd and
     // Kubernetes).
     string external_address = 1;
     // running_curator contains information about the curator service running
     // on this node, or is nil if the service is not running.
     message RunningCurator {
         // port is the TCP port on which the curator is listening.
         int32 port = 1;
     }
     RunningCurator running_curator = 3;
     // timestamp is an epoch number associated with the last status update.
     // It's set with a nanosecond granularity.
     google.protobuf.Timestamp timestamp = 2;
 }

 // The Cluster Directory is information about the network addressing of nodes
 // in a cluster. It is a serialized snapshot of some of the state within the
 // etcd cluster, and can be used by external processes (like a node Registering
 // into the cluster) to know how to reach this cluster over the network. It can
 // be thought of as a phonebook, or a static name/address configuration that
 // could live in /etc/hosts.
 //
 // The directory explicitly doesn't carry any information about the cluster's
 // identity or security - these should be configured and checked by higher
 // level configuration and processes. The directory can be stored and
 // transmitted in cleartext and without an integrity checks (like saved to the
 // EFI system partition across reboots) and any malicious change to it will
 // cause no more than a denial of service against the consumer of this
 // directory. This is because all nodes contacted must present a valid cluster
 // identity/certificate before they are trusted by the consumers of this
 // directory.
 message ClusterDirectory {
     message Node {
         bytes public_key = 1;
         message Address {
             string host = 1;
         };
         repeated Address addresses = 2;
     };
     repeated Node nodes = 1;
 }


 // NodeClusterNetworking carries information about the cluster networking (ie.
 // WireGuard mesh) connectivity of a node.
 message NodeClusterNetworking {
     message Prefix {
         string cidr = 1;
     }
     // wireguard_pubkey is the base64-encoded public key used by the node.
     string wireguard_pubkey = 1;
     // prefixes are networking routes exported by the node to the cluster networking
     // mesh, and are programmed by other nodes into their wireguard peer config.
     repeated Prefix prefixes = 2;
 }

 // Severity level corresponding to //metropolis/pkg/logtree.Severity.
 enum LeveledLogSeverity {
     INVALID = 0;
     INFO = 1;
     WARNING = 2;
     ERROR = 3;
     FATAL = 4;
 }

 // Filter set when requesting logs for a given DN. This message is equivalent to
 // the following GADT enum:
 // data LogFilter = WithChildren
 //                | OnlyRaw
 //                | OnlyLeveled
 //                | LeveledWithMinimumSeverity(Severity)
 //
 // Multiple LogFilters can be chained/combined when requesting logs, as long as
 // they do not conflict.
 message LogFilter {
     // Entries will be returned not only for the given DN, but all child DNs as
     // well. For instance, if the requested DN is foo, entries logged to foo,
     // foo.bar and foo.bar.baz will all be returned.
     message WithChildren {
     }
     // Only raw logging entries will be returned. Conflicts with OnlyLeveled
     // filters.
     message OnlyRaw {
     }
     // Only leveled logging entries will be returned. Conflicts with OnlyRaw
     // filters.
     message OnlyLeveled {
     }
     // If leveled logs are returned, all entries at severity lower than `minimum`
     // will be discarded.
     message LeveledWithMinimumSeverity {
         LeveledLogSeverity minimum = 1;
     }
     oneof filter {
         WithChildren with_children = 1;
         OnlyRaw only_raw = 3;
         OnlyLeveled only_leveled = 4;
         LeveledWithMinimumSeverity leveled_with_minimum_severity = 5;
     }
 }

 // LogEntry corresponding to logtree.LogEntry in //metropolis/pkg/logtree.
 message LogEntry {
     // A leveled log entry emitted from a compatible system, eg. Metorpolis code
     // or a klog-parsed line.
     message Leveled {
         repeated string lines = 1;
         google.protobuf.Timestamp timestamp = 2;
         LeveledLogSeverity severity = 3;
         // Source of the error, expressed as file:line.
         string location = 4;
     }
     // Raw log entry, captured from an external system without parting. Might
     // contain some timestamp/level/origin information embedded in data. Data
     // contained within should be treated as unsanitized external data.
     message Raw {
         string data = 1;
         // Original length of line, set if data was truncated.
         int64 original_length = 2;
     }

     // Origin DN.
     string dn = 1;
     oneof kind {
         Leveled leveled = 2;
         Raw raw = 3;
     }
 }

 // ClusterConfiguration contains the entirety of the user-configurable behaviour
 // of the cluster that is scoped to the entirety of the cluster (vs. per-node
 // configuration, which is kept alongside Node).
 //
 // It can be set initially when a cluster is being bootstrapped (in
 // NodeParamaters.ClusterBootstrap), and then can be partially managed by
 // management calls to the curator.
 message ClusterConfiguration {
     // tpm_mode defines the TPM usage policy for cluster nodes. When nodes
     // register into the cluster (and then join into it) they will report their
     // TPM availability, and in return the cluster will respond whether they
     // should use that TPM or not.
     //
     // If a node is instructed to use its TPM, it will use it to encrypt its part
     // of the disk encryption key when saving it to the EFI system partition.
     // That means that the node will only be able to re-join the cluster if its
     // secure boot configuration doesn't change.
     //
     // If a node is instructed to not use its TPM, it will save its part of the
     // disk encryption key straight onto the EFI system partition without any
     // further encryption. It still needs to connect to a working cluster to
     // retrieve the other part of the key. This means that the configuration is
     // secure vs. offline disk decryption attempts, but not secure if an
     // attacker can connect to a cluster and impersonate the node in order to
     // retrieve the other part of its key.
     enum TPMMode {
         TPM_MODE_INVALID = 0;
         // Nodes need to join with a TPM2.0 device and will be instructed to
         // use it.
         TPM_MODE_REQUIRED = 1;
         // Nodes will be allowed to join regardless of TPM2.0 presence, and will
         // be instructed to use it if they have one.
         TPM_MODE_BEST_EFFORT = 2;
         // Regardless of the node's local TPM presence it will be instructed to
         // not use it.
         TPM_MODE_DISABLED = 3;
     }
     TPMMode tpm_mode = 1;
 }

 // NodeTPMUsage describes whether a node has a TPM2.0 and if it is/should be
 // actively used to seal secrets before saving them to its EFI system partition.
 enum NodeTPMUsage {
     NODE_TPM_INVALID = 0;
     // This node has no TPM 2.0.
     NODE_TPM_NOT_PRESENT = 1;
     // This node has a TPM 2.0 but the cluster configuration mandates not using
     // it.
     NODE_TPM_PRESENT_BUT_UNUSED = 2;
     // This node has a TPM 2.0 and it is being actively used.
     NODE_TPM_PRESENT_AND_USED = 3;
 }
	// Copyright 2020 The Monogon Project Authors.
	//
	// SPDX-License-Identifier: Apache-2.0
	//
	// Licensed under the Apache License, Version 2.0 (the "License");
	// you may not use this file except in compliance with the License.
	// You may obtain a copy of the License at
	//
	// http://www.apache.org/licenses/LICENSE-2.0
	//
	// Unless required by applicable law or agreed to in writing, software
	// distributed under the License is distributed on an "AS IS" BASIS,
	// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	// See the License for the specific language governing permissions and
	// limitations under the License.

	syntax = "proto3";
	package metropolis.proto.common;
	option go_package = "source.monogon.dev/metropolis/proto/common";

	import "google/protobuf/timestamp.proto";

	// NodeRoles are the possible roles that a Metropolis Node should run within the
	// cluster. These are configured by the cluster and can be retrieved through the
	// Curator.
	//
	// Fields contained within each individual are publicly available, so while they
	// can be used to carry required data to start up services for a given role,
	// this must not be confidential/private data.
	message NodeRoles {
	message KubernetesController {
	}
	message KubernetesWorker {
	}
	message ConsensusMember {
	// ca_certificate is a DER-encoded x509 certificate of the etcd
	// cluster's CA. The member must use this certificate to verify the
	// identity of the cluster it's connecting to.
	bytes ca_certificate = 1;
	// pper_certificate is a DER-encoded x509 certificate of this node's
	// etcd peer listener. The member must serve member traffic using this
	// certificate. The private key corresponding to this certificate is
	// the same as the node's primary private keypair.
	bytes peer_certificate = 2;
	// initial_crl is a certificate revocation list that the etcd member
	// should be started with. After startup, the member will maintain its
	// own CRL by updating it from its primary storage location, and etcd
	// value.
	//
	// TODO(q3k): don't pass this here, instead pass this over an etcd
	// watcher and curator.Watch.
	bytes initial_crl = 3;
	message Peer {
	string Name = 1;
	string URL = 2;
	}
	repeated Peer peers = 4;
	}
	KubernetesWorker kubernetes_worker = 1;
	ConsensusMember consensus_member = 2;
	KubernetesController kubernetes_controller = 3;
	}

	// NodeState is the state of a Metropolis node from the point of view of the
	// cluster it is a part of (or intending to be a part of).
	enum NodeState {
	NODE_STATE_INVALID = 0;

	// NEW: the node has established a first contact with the cluster and
	// intends to register into it. The node's identity has not been verified
	// and no hardware attestation of the new node was performed.
	// The node has generated a CUK/NUK and set up storage encrypted with the
	// combination of both keys.
	// The node has generated a private/public keypair, and that keypair has
	// been used to contact the already running Cluster.
	NODE_STATE_NEW = 1;
	// STANDBY: the node has successfully passed identity and hardware
	// attestation checks as defined by the cluster policy. The node still isn't
	// part of the cluster, as it itself might perform checks against the
	// running Cluster.
	NODE_STATE_STANDBY = 2;
	// UP: the node has passed all preconditions for STANDBY and has also
	// performed a commit into the cluster by exchanging its CUK for a
	// certificate issued by the cluster.
	// The node is now ready to serve, and its certificate can be used to
	// authenticate its identity cryptographically.
	NODE_STATE_UP = 3;
	// DISOWNED: the node has been rejected or decommissioned by the cluster.
	// Any further contact from the node to the cluster will be rejected.
	NODE_STATE_DISOWNED = 4;
	};

	// ClusterState is the state of the cluster from the point of view of a node.
	// Different subsystems can watch this state and depend on it for behaviour
	// (eg. start serving when HOME, maybe self-fence on SPLIT, etc.).
	enum ClusterState {
	CLUSTER_STATE_INVALID = 0;

	// UNKNOWN: the node has not yet determined the existence of a cluster it
	// should join or start. This is a transient, initial state that should only
	// manifest during boot.
	CLUSTER_STATE_UNKNOWN = 1;
	// FOREIGN: the node is attempting to register into an already existing
	// cluster with which it managed to make preliminary contact, but which the
	// cluster has not yet fully productionized (eg. the node is still being
	// hardware attested, or the operator needs to confirm the
	// registration of this node).
	CLUSTER_STATE_FOREIGN = 2;
	// TRUSTED: the node is attempting to register into an already registered
	// cluster, and has been trusted by it. The node is now attempting to fully
	// commit to registering into the cluster.
	CLUSTER_STATE_TRUSTED = 3;
	// HOME: the node is part of this cluster. This is the bulk of time in which
	// this node will spend its time.
	CLUSTER_STATE_HOME = 4;
	// DISOWNING: the node has been disowned (ie., removed) by the cluster, and
	// that it will not be ever part of any cluster again, and that it will be
	// decommissioned by the operator.
	CLUSTER_STATE_DISOWNING = 5;
	// SPLIT:the node would usually be Home in a cluster, but has been split
	// from the consensus of the cluster. This can happen for nodes running
	// consensus when consensus is lost (eg. when there is no quorum or this
	// node has been netsplit), and for other nodes if they have lost network
	// connectivity to the consensus nodes. Clients should make their own
	// decision what action to perform in this state, depending on the level of
	// consistency required and whether it makes sense for the node to fence its
	// services off.
	CLUSTER_STATE_SPLIT = 6;
	}

	// NodeStatus contains all fields self-reported by nodes. This data is
	// inherently less trusted than other data available about a node, as it can be
	// updated to any value by each node individually, including compromised nodes.
	message NodeStatus {
	// external_address is the IP address that the node expects management,
	// cluster and user traffic to arrive at (ie. the address on which it is
	// listening for gRPC, and role-specific services like etcd and
	// Kubernetes).
	string external_address = 1;
	// running_curator contains information about the curator service running
	// on this node, or is nil if the service is not running.
	message RunningCurator {
	// port is the TCP port on which the curator is listening.
	int32 port = 1;
	}
	RunningCurator running_curator = 3;
	// timestamp is an epoch number associated with the last status update.
	// It's set with a nanosecond granularity.
	google.protobuf.Timestamp timestamp = 2;
	}

	// The Cluster Directory is information about the network addressing of nodes
	// in a cluster. It is a serialized snapshot of some of the state within the
	// etcd cluster, and can be used by external processes (like a node Registering
	// into the cluster) to know how to reach this cluster over the network. It can
	// be thought of as a phonebook, or a static name/address configuration that
	// could live in /etc/hosts.
	//
	// The directory explicitly doesn't carry any information about the cluster's
	// identity or security - these should be configured and checked by higher
	// level configuration and processes. The directory can be stored and
	// transmitted in cleartext and without an integrity checks (like saved to the
	// EFI system partition across reboots) and any malicious change to it will
	// cause no more than a denial of service against the consumer of this
	// directory. This is because all nodes contacted must present a valid cluster
	// identity/certificate before they are trusted by the consumers of this
	// directory.
	message ClusterDirectory {
	message Node {
	bytes public_key = 1;
	message Address {
	string host = 1;
	};
	repeated Address addresses = 2;
	};
	repeated Node nodes = 1;
	}


	// NodeClusterNetworking carries information about the cluster networking (ie.
	// WireGuard mesh) connectivity of a node.
	message NodeClusterNetworking {
	message Prefix {
	string cidr = 1;
	}
	// wireguard_pubkey is the base64-encoded public key used by the node.
	string wireguard_pubkey = 1;
	// prefixes are networking routes exported by the node to the cluster networking
	// mesh, and are programmed by other nodes into their wireguard peer config.
	repeated Prefix prefixes = 2;
	}

	// Severity level corresponding to //metropolis/pkg/logtree.Severity.
	enum LeveledLogSeverity {
	INVALID = 0;
	INFO = 1;
	WARNING = 2;
	ERROR = 3;
	FATAL = 4;
	}

	// Filter set when requesting logs for a given DN. This message is equivalent to
	// the following GADT enum:
	// data LogFilter = WithChildren
	// \| OnlyRaw
	// \| OnlyLeveled
	// \| LeveledWithMinimumSeverity(Severity)
	//
	// Multiple LogFilters can be chained/combined when requesting logs, as long as
	// they do not conflict.
	message LogFilter {
	// Entries will be returned not only for the given DN, but all child DNs as
	// well. For instance, if the requested DN is foo, entries logged to foo,
	// foo.bar and foo.bar.baz will all be returned.
	message WithChildren {
	}
	// Only raw logging entries will be returned. Conflicts with OnlyLeveled
	// filters.
	message OnlyRaw {
	}
	// Only leveled logging entries will be returned. Conflicts with OnlyRaw
	// filters.
	message OnlyLeveled {
	}
	// If leveled logs are returned, all entries at severity lower than `minimum`
	// will be discarded.
	message LeveledWithMinimumSeverity {
	LeveledLogSeverity minimum = 1;
	}
	oneof filter {
	WithChildren with_children = 1;
	OnlyRaw only_raw = 3;
	OnlyLeveled only_leveled = 4;
	LeveledWithMinimumSeverity leveled_with_minimum_severity = 5;
	}
	}

	// LogEntry corresponding to logtree.LogEntry in //metropolis/pkg/logtree.
	message LogEntry {
	// A leveled log entry emitted from a compatible system, eg. Metorpolis code
	// or a klog-parsed line.
	message Leveled {
	repeated string lines = 1;
	google.protobuf.Timestamp timestamp = 2;
	LeveledLogSeverity severity = 3;
	// Source of the error, expressed as file:line.
	string location = 4;
	}
	// Raw log entry, captured from an external system without parting. Might
	// contain some timestamp/level/origin information embedded in data. Data
	// contained within should be treated as unsanitized external data.
	message Raw {
	string data = 1;
	// Original length of line, set if data was truncated.
	int64 original_length = 2;
	}

	// Origin DN.
	string dn = 1;
	oneof kind {
	Leveled leveled = 2;
	Raw raw = 3;
	}
	}

	// ClusterConfiguration contains the entirety of the user-configurable behaviour
	// of the cluster that is scoped to the entirety of the cluster (vs. per-node
	// configuration, which is kept alongside Node).
	//
	// It can be set initially when a cluster is being bootstrapped (in
	// NodeParamaters.ClusterBootstrap), and then can be partially managed by
	// management calls to the curator.
	message ClusterConfiguration {
	// tpm_mode defines the TPM usage policy for cluster nodes. When nodes
	// register into the cluster (and then join into it) they will report their
	// TPM availability, and in return the cluster will respond whether they
	// should use that TPM or not.
	//
	// If a node is instructed to use its TPM, it will use it to encrypt its part
	// of the disk encryption key when saving it to the EFI system partition.
	// That means that the node will only be able to re-join the cluster if its
	// secure boot configuration doesn't change.
	//
	// If a node is instructed to not use its TPM, it will save its part of the
	// disk encryption key straight onto the EFI system partition without any
	// further encryption. It still needs to connect to a working cluster to
	// retrieve the other part of the key. This means that the configuration is
	// secure vs. offline disk decryption attempts, but not secure if an
	// attacker can connect to a cluster and impersonate the node in order to
	// retrieve the other part of its key.
	enum TPMMode {
	TPM_MODE_INVALID = 0;
	// Nodes need to join with a TPM2.0 device and will be instructed to
	// use it.
	TPM_MODE_REQUIRED = 1;
	// Nodes will be allowed to join regardless of TPM2.0 presence, and will
	// be instructed to use it if they have one.
	TPM_MODE_BEST_EFFORT = 2;
	// Regardless of the node's local TPM presence it will be instructed to
	// not use it.
	TPM_MODE_DISABLED = 3;
	}
	TPMMode tpm_mode = 1;
	}

	// NodeTPMUsage describes whether a node has a TPM2.0 and if it is/should be
	// actively used to seal secrets before saving them to its EFI system partition.
	enum NodeTPMUsage {
	NODE_TPM_INVALID = 0;
	// This node has no TPM 2.0.
	NODE_TPM_NOT_PRESENT = 1;
	// This node has a TPM 2.0 but the cluster configuration mandates not using
	// it.
	NODE_TPM_PRESENT_BUT_UNUSED = 2;
	// This node has a TPM 2.0 and it is being actively used.
	NODE_TPM_PRESENT_AND_USED = 3;
	}