blob: 5fc76e33777c621efe0f131d0a2dbd344b302450 [file] [log] [blame]
Serge Bazanskid7d6e022021-09-01 15:03:06 +02001package rpc
2
3import (
4 "context"
5 "crypto/ed25519"
6 "crypto/rand"
7 "crypto/tls"
8 "crypto/x509"
9 "fmt"
10 "math/big"
11 "time"
12
Serge Bazanskid7d6e022021-09-01 15:03:06 +020013 "google.golang.org/grpc/credentials"
Serge Bazanski636032e2022-01-26 14:21:33 +010014 "google.golang.org/grpc/status"
Serge Bazanskid7d6e022021-09-01 15:03:06 +020015
Serge Bazanski3379a5d2021-09-09 12:56:40 +020016 "source.monogon.dev/metropolis/node/core/identity"
Serge Bazanskid7d6e022021-09-01 15:03:06 +020017 apb "source.monogon.dev/metropolis/proto/api"
18)
19
// UnknownNotAfter is a copy of //metropolis/pkg/pki.UnknownNotAfter.
//
// We copy it so that we can decouple the rpc package from the pki package, the
// former being used by metroctl (and thus needing to be portable), the latter
// having a dependency on fileargs (which isn't portable). The correct solution
// here is to clarify portability policy of each workspace path, and apply it.
// But this will do for now.
//
// The value is the Unix timestamp of 9999-12-31T23:59:59Z. This is presumably
// chosen to match the RFC 5280 convention for certificates with no well-defined
// expiration date - confirm against the pki package.
//
// TODO(issues/252): clean up and merge this back.
var UnknownNotAfter = time.Unix(253402300799, 0)
30
// verifyPeerCertificate is the signature of the callbacks that this package
// installs as tls.Config.VerifyPeerCertificate. It receives the raw DER
// certificates presented by the peer and returns a non-nil error to reject the
// connection.
type verifyPeerCertificate func(rawCerts [][]byte, verifiedChains [][]*x509.Certificate) error
32
Serge Bazanski8535cb52023-03-29 14:15:08 +020033func verifyClusterCertificateAndNodeID(ca *x509.Certificate, nodeID string) verifyPeerCertificate {
Serge Bazanski3379a5d2021-09-09 12:56:40 +020034 return func(rawCerts [][]byte, verifiedChains [][]*x509.Certificate) error {
35 if len(rawCerts) != 1 {
36 return fmt.Errorf("server presented %d certificates, wanted exactly one", len(rawCerts))
37 }
38 serverCert, err := x509.ParseCertificate(rawCerts[0])
39 if err != nil {
40 return fmt.Errorf("server presented unparseable certificate: %w", err)
41 }
Serge Bazanski8535cb52023-03-29 14:15:08 +020042 pkey, err := identity.VerifyNodeInCluster(serverCert, ca)
43 if err != nil {
Serge Bazanski3379a5d2021-09-09 12:56:40 +020044 return fmt.Errorf("node certificate verification failed: %w", err)
45 }
Serge Bazanski8535cb52023-03-29 14:15:08 +020046 if nodeID != "" {
47 id := identity.NodeID(pkey)
48 if id != nodeID {
49 return fmt.Errorf("wanted to reach node %q, got %q", nodeID, id)
50 }
51 }
Serge Bazanski3379a5d2021-09-09 12:56:40 +020052
53 return nil
54 }
55}
56
Serge Bazanski8535cb52023-03-29 14:15:08 +020057func verifyFail(err error) verifyPeerCertificate {
58 return func(_ [][]byte, _ [][]*x509.Certificate) error {
59 return err
60 }
61}
62
Serge Bazanski399ce552022-03-29 12:52:42 +020063// NewEphemeralCredentials returns gRPC TransportCredentials that can be used to
64// dial a cluster without authenticating with a certificate, but instead
65// authenticating by proving the possession of a private key, via an ephemeral
66// self-signed certificate.
Serge Bazanskid7d6e022021-09-01 15:03:06 +020067//
Serge Bazanski399ce552022-03-29 12:52:42 +020068// Currently these credentials are used in two flows:
69//
Serge Bazanski8535cb52023-03-29 14:15:08 +020070// 1. Registration of nodes into a cluster, after which a node receives a proper
71// node certificate
Serge Bazanski399ce552022-03-29 12:52:42 +020072//
Serge Bazanski8535cb52023-03-29 14:15:08 +020073// 2. Escrow of initial owner credentials into a proper manager
74// certificate
Serge Bazanskid7d6e022021-09-01 15:03:06 +020075//
Serge Bazanski0c280152024-02-05 14:33:19 +010076// The given opts can be used to lock down the remote side of the connection, eg.
77// expecting a given cluster CA certificate or disabling remote side verification
78// by using WantInsecure().
79func NewEphemeralCredentials(private ed25519.PrivateKey, opts ...CredentialsOpt) (credentials.TransportCredentials, error) {
Serge Bazanskid7d6e022021-09-01 15:03:06 +020080 template := x509.Certificate{
81 SerialNumber: big.NewInt(1),
82 NotBefore: time.Now(),
Serge Bazanski4ac71122023-07-24 13:08:34 +020083 NotAfter: UnknownNotAfter,
Serge Bazanskid7d6e022021-09-01 15:03:06 +020084
Serge Bazanski3379a5d2021-09-09 12:56:40 +020085 KeyUsage: x509.KeyUsageKeyEncipherment | x509.KeyUsageDigitalSignature | x509.KeyUsageCertSign,
Serge Bazanskid7d6e022021-09-01 15:03:06 +020086 ExtKeyUsage: []x509.ExtKeyUsage{x509.ExtKeyUsageClientAuth},
87 BasicConstraintsValid: true,
88 }
89 certificateBytes, err := x509.CreateCertificate(rand.Reader, &template, &template, private.Public(), private)
90 if err != nil {
91 return nil, fmt.Errorf("when generating self-signed certificate: %w", err)
92 }
93 certificate := tls.Certificate{
94 Certificate: [][]byte{certificateBytes},
95 PrivateKey: private,
96 }
Serge Bazanski8535cb52023-03-29 14:15:08 +020097 return NewAuthenticatedCredentials(certificate, opts...), nil
98}
99
// CredentialsOpt are created using WantXXX functions and used in
// NewAuthenticatedCredentials, NewAuthenticatedTLSConfig and
// NewEphemeralCredentials.
type CredentialsOpt struct {
	// wantCA, if set, is the cluster CA certificate the remote side must
	// verify against.
	wantCA *x509.Certificate
	// wantNodeID, if non-empty, is the node ID the remote side must have.
	wantNodeID string
	// insecureOkay, if true, requests that the remote side is not verified.
	insecureOkay bool
}

// merge folds the settings of o into a. Settings already present in a are
// never overwritten, which makes a sequence of merges first-wins.
func (a *CredentialsOpt) merge(o *CredentialsOpt) {
	if a.wantNodeID == "" {
		a.wantNodeID = o.wantNodeID
	}
	if a.wantCA == nil {
		a.wantCA = o.wantCA
	}
	a.insecureOkay = a.insecureOkay || o.insecureOkay
}
119
120// WantRemoteCluster enables the verification of the remote cluster identity when
121// using NewAuthanticatedCredentials. If the connection is not terminated at a
122// cluster with the given CA certificate, an error will be returned.
123//
124// This is the bare minimum option required to implement secure connections to
125// clusters.
Serge Bazanski0c280152024-02-05 14:33:19 +0100126func WantRemoteCluster(ca *x509.Certificate) CredentialsOpt {
127 return CredentialsOpt{
Serge Bazanski8535cb52023-03-29 14:15:08 +0200128 wantCA: ca,
129 }
130}
131
132// WantRemoteNode enables the verification of the remote node identity when using
Serge Bazanski0c280152024-02-05 14:33:19 +0100133// NewCredentials. If the connection is not terminated at the node
Serge Bazanski8535cb52023-03-29 14:15:08 +0200134// ID 'id', an error will be returned. For this function to work,
135// WantRemoteCluster must also be set.
Serge Bazanski0c280152024-02-05 14:33:19 +0100136func WantRemoteNode(id string) CredentialsOpt {
137 return CredentialsOpt{
Serge Bazanski8535cb52023-03-29 14:15:08 +0200138 wantNodeID: id,
139 }
140}
141
142// WantInsecure disables the verification of the remote side of the connection
Serge Bazanski0c280152024-02-05 14:33:19 +0100143// via NewCredentials. This is unsafe.
144func WantInsecure() CredentialsOpt {
145 return CredentialsOpt{
Serge Bazanski8535cb52023-03-29 14:15:08 +0200146 insecureOkay: true,
147 }
Serge Bazanski3379a5d2021-09-09 12:56:40 +0200148}
Serge Bazanskid7d6e022021-09-01 15:03:06 +0200149
Serge Bazanskia3e38cf2024-07-31 14:40:04 +0000150// NewAuthenticatedTLSConfig returns a tls.Config that can be used to dial a
151// cluster with a given TLS certificate (from node or manager credentials).
Serge Bazanski399ce552022-03-29 12:52:42 +0200152//
Serge Bazanski0c280152024-02-05 14:33:19 +0100153// The provided CredentialsOpt specify the verification of the remote side of the
154// connection. When connecting to a cluster (any node), use WantRemoteCluster. If
155// you also want to verify the connection to a particular node, specify
156// WantRemoteNode alongside it. If no verification should be performed use
157// WantInsecure.
Serge Bazanski8535cb52023-03-29 14:15:08 +0200158//
159// The given options are parsed on a first-wins basis.
Serge Bazanskia3e38cf2024-07-31 14:40:04 +0000160func NewAuthenticatedTLSConfig(cert tls.Certificate, opts ...CredentialsOpt) *tls.Config {
Serge Bazanski399ce552022-03-29 12:52:42 +0200161 config := &tls.Config{
162 Certificates: []tls.Certificate{cert},
163 InsecureSkipVerify: true,
164 }
Serge Bazanski8535cb52023-03-29 14:15:08 +0200165
Serge Bazanski0c280152024-02-05 14:33:19 +0100166 var merged CredentialsOpt
Serge Bazanski8535cb52023-03-29 14:15:08 +0200167 for _, o := range opts {
168 merged.merge(&o)
Serge Bazanski399ce552022-03-29 12:52:42 +0200169 }
Serge Bazanski8535cb52023-03-29 14:15:08 +0200170
171 if merged.insecureOkay {
Serge Bazanski0c280152024-02-05 14:33:19 +0100172 if merged.wantNodeID != "" {
173 config.VerifyPeerCertificate = verifyFail(fmt.Errorf("WantInsecure specified alongside WantRemoteNode"))
174 } else if merged.wantCA != nil {
175 config.VerifyPeerCertificate = verifyFail(fmt.Errorf("WantInsecure specified alongside WantRemoteCluster"))
Serge Bazanski8535cb52023-03-29 14:15:08 +0200176 }
177 } else {
178 switch {
Serge Bazanski0c280152024-02-05 14:33:19 +0100179 case merged.wantNodeID == "" && merged.wantCA == nil:
180 config.VerifyPeerCertificate = verifyFail(fmt.Errorf("WantRemoteNode/WantRemoteCluster/WantInsecure not specified"))
Serge Bazanski8535cb52023-03-29 14:15:08 +0200181 case merged.wantNodeID != "" && merged.wantCA == nil:
182 config.VerifyPeerCertificate = verifyFail(fmt.Errorf("WantRemoteNode also requires WantRemoteCluster"))
183 case merged.wantCA == nil:
184 config.VerifyPeerCertificate = verifyFail(fmt.Errorf("no AuthenticaedCreentialsOpts specified"))
185 default:
186 config.VerifyPeerCertificate = verifyClusterCertificateAndNodeID(merged.wantCA, merged.wantNodeID)
187 }
188 }
189
Serge Bazanskia3e38cf2024-07-31 14:40:04 +0000190 return config
191}
192
193// NewAuthenticatedCredentials returns gRPC TransportCredentials that can be used
194// to dial a cluster with a given TLS certificate (from node or manager
195// credentials).
196//
197// The provided CredentialsOpt specify the verification of the remote side of the
198// connection. When connecting to a cluster (any node), use WantRemoteCluster. If
199// you also want to verify the connection to a particular node, specify
200// WantRemoteNode alongside it. If no verification should be performed use
201// WantInsecure.
202//
203// The given options are parsed on a first-wins basis.
204func NewAuthenticatedCredentials(cert tls.Certificate, opts ...CredentialsOpt) credentials.TransportCredentials {
205 return credentials.NewTLS(NewAuthenticatedTLSConfig(cert, opts...))
Serge Bazanskid7d6e022021-09-01 15:03:06 +0200206}
207
Serge Bazanski8535cb52023-03-29 14:15:08 +0200208// RetrieveOwnerCertificate uses AAA.Escrow to retrieve a cluster manager
Serge Bazanskid7d6e022021-09-01 15:03:06 +0200209// certificate for the initial owner of the cluster, authenticated by the
210// public/private key set in the clusters NodeParameters.ClusterBoostrap.
211//
212// The retrieved certificate can be used to dial further cluster RPCs.
213func RetrieveOwnerCertificate(ctx context.Context, aaa apb.AAAClient, private ed25519.PrivateKey) (*tls.Certificate, error) {
214 srv, err := aaa.Escrow(ctx)
215 if err != nil {
Serge Bazanski636032e2022-01-26 14:21:33 +0100216 if st, ok := status.FromError(err); ok {
217 return nil, status.Errorf(st.Code(), "Escrow call failed: %s", st.Message())
218 }
219 return nil, err
Serge Bazanskid7d6e022021-09-01 15:03:06 +0200220 }
221 if err := srv.Send(&apb.EscrowFromClient{
222 Parameters: &apb.EscrowFromClient_Parameters{
223 RequestedIdentityName: "owner",
224 PublicKey: private.Public().(ed25519.PublicKey),
225 },
226 }); err != nil {
227 return nil, fmt.Errorf("when sending client parameters: %w", err)
228 }
229 resp, err := srv.Recv()
230 if err != nil {
231 return nil, fmt.Errorf("when receiving server message: %w", err)
232 }
233 if len(resp.EmittedCertificate) == 0 {
234 return nil, fmt.Errorf("expected certificate, instead got needed proofs: %+v", resp.Needed)
235 }
236
237 return &tls.Certificate{
238 Certificate: [][]byte{resp.EmittedCertificate},
239 PrivateKey: private,
240 }, nil
241}