blob: fe701e6c9a6432cf2fb0a73d452ad136dcf7b86a [file] [log] [blame]
// Copyright 2020 The Monogon Project Authors.
//
// SPDX-License-Identifier: Apache-2.0
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
16
17package kubernetes
18
19import (
Lorenz Brun878f5f92020-05-12 16:15:39 +020020 "context"
Serge Bazanskidbfc6382020-06-19 20:35:43 +020021 "fmt"
Lorenz Brun6e8f69c2019-11-18 10:44:24 +010022 "net"
Serge Bazanskidbfc6382020-06-19 20:35:43 +020023 "os"
Lorenz Brunb15abad2020-04-16 11:17:12 +020024 "time"
25
Lorenz Brun878f5f92020-05-12 16:15:39 +020026 "google.golang.org/grpc/codes"
27 "google.golang.org/grpc/status"
Lorenz Brunf042e6f2020-06-24 16:46:09 +020028 "k8s.io/client-go/informers"
Lorenz Brunb15abad2020-04-16 11:17:12 +020029 "k8s.io/client-go/kubernetes"
Lorenz Brunf042e6f2020-06-24 16:46:09 +020030 "k8s.io/client-go/tools/clientcmd"
Lorenz Brun878f5f92020-05-12 16:15:39 +020031
Serge Bazanski31370b02021-01-07 16:31:14 +010032 "source.monogon.dev/metropolis/node/core/localstorage"
Serge Bazanskid8af5bf2021-03-16 13:38:29 +010033 "source.monogon.dev/metropolis/node/core/network"
Serge Bazanski31370b02021-01-07 16:31:14 +010034 "source.monogon.dev/metropolis/node/core/network/dns"
35 "source.monogon.dev/metropolis/node/kubernetes/clusternet"
36 "source.monogon.dev/metropolis/node/kubernetes/nfproxy"
37 "source.monogon.dev/metropolis/node/kubernetes/pki"
Lorenz Brun4e090352021-03-17 17:44:41 +010038 "source.monogon.dev/metropolis/node/kubernetes/plugins/kvmdevice"
Serge Bazanski31370b02021-01-07 16:31:14 +010039 "source.monogon.dev/metropolis/node/kubernetes/reconciler"
40 "source.monogon.dev/metropolis/pkg/supervisor"
41 apb "source.monogon.dev/metropolis/proto/api"
Lorenz Brun6e8f69c2019-11-18 10:44:24 +010042)
43
44type Config struct {
Serge Bazanskid8af5bf2021-03-16 13:38:29 +010045 ServiceIPRange net.IPNet
46 ClusterNet net.IPNet
Serge Bazanskic2c7ad92020-07-13 17:20:09 +020047
Serge Bazanskid8af5bf2021-03-16 13:38:29 +010048 KPKI *pki.PKI
49 Root *localstorage.Root
50 Network *network.Service
Lorenz Brun6e8f69c2019-11-18 10:44:24 +010051}
52
Serge Bazanskic2c7ad92020-07-13 17:20:09 +020053type Service struct {
Serge Bazanski967be212020-11-02 11:26:59 +010054 c Config
Serge Bazanskic2c7ad92020-07-13 17:20:09 +020055}
Serge Bazanskidbfc6382020-06-19 20:35:43 +020056
Serge Bazanskic2c7ad92020-07-13 17:20:09 +020057func New(c Config) *Service {
58 s := &Service{
59 c: c,
60 }
61 return s
62}
63
Serge Bazanskic2c7ad92020-07-13 17:20:09 +020064func (s *Service) Run(ctx context.Context) error {
Serge Bazanskic2c7ad92020-07-13 17:20:09 +020065 controllerManagerConfig, err := getPKIControllerManagerConfig(ctx, s.c.KPKI)
66 if err != nil {
67 return fmt.Errorf("could not generate controller manager pki config: %w", err)
68 }
69 controllerManagerConfig.clusterNet = s.c.ClusterNet
70 schedulerConfig, err := getPKISchedulerConfig(ctx, s.c.KPKI)
71 if err != nil {
72 return fmt.Errorf("could not generate scheduler pki config: %w", err)
Lorenz Brun6e8f69c2019-11-18 10:44:24 +010073 }
Serge Bazanskidbfc6382020-06-19 20:35:43 +020074
Serge Bazanskic2c7ad92020-07-13 17:20:09 +020075 masterKubeconfig, err := s.c.KPKI.Kubeconfig(ctx, pki.Master)
76 if err != nil {
77 return fmt.Errorf("could not generate master kubeconfig: %w", err)
78 }
Lorenz Brun6e8f69c2019-11-18 10:44:24 +010079
Serge Bazanskic2c7ad92020-07-13 17:20:09 +020080 rawClientConfig, err := clientcmd.NewClientConfigFromBytes(masterKubeconfig)
81 if err != nil {
82 return fmt.Errorf("could not generate kubernetes client config: %w", err)
83 }
Lorenz Brun6e8f69c2019-11-18 10:44:24 +010084
Serge Bazanskic2c7ad92020-07-13 17:20:09 +020085 clientConfig, err := rawClientConfig.ClientConfig()
86 clientSet, err := kubernetes.NewForConfig(clientConfig)
87 if err != nil {
88 return fmt.Errorf("could not generate kubernetes client: %w", err)
89 }
90
91 informerFactory := informers.NewSharedInformerFactory(clientSet, 5*time.Minute)
92
93 hostname, err := os.Hostname()
94 if err != nil {
95 return fmt.Errorf("failed to get hostname: %w", err)
96 }
97
Serge Bazanskid8af5bf2021-03-16 13:38:29 +010098 // Sub-runnable which starts all parts of Kubernetes that depend on the
99 // machine's external IP address. If it changes, the runnable will exit.
100 // TODO(q3k): test this
101 supervisor.Run(ctx, "networked", func(ctx context.Context) error {
102 networkWatch := s.c.Network.Watch()
103 defer networkWatch.Close()
Lorenz Brun339582b2020-07-29 18:13:35 +0200104
Serge Bazanskid8af5bf2021-03-16 13:38:29 +0100105 var status *network.Status
Serge Bazanskic2c7ad92020-07-13 17:20:09 +0200106
Serge Bazanskid8af5bf2021-03-16 13:38:29 +0100107 supervisor.Logger(ctx).Info("Waiting for node networking...")
108 for status == nil || status.ExternalAddress == nil {
109 status, err = networkWatch.Get(ctx)
110 if err != nil {
111 return fmt.Errorf("failed to get network status: %w", err)
112 }
113 }
114 address := status.ExternalAddress
115 supervisor.Logger(ctx).Info("Node has active networking, starting apiserver/kubelet")
116
117 apiserver := &apiserverService{
118 KPKI: s.c.KPKI,
119 AdvertiseAddress: address,
120 ServiceIPRange: s.c.ServiceIPRange,
121 EphemeralConsensusDirectory: &s.c.Root.Ephemeral.Consensus,
122 }
123
124 kubelet := kubeletService{
125 NodeName: hostname,
126 ClusterDNS: []net.IP{address},
127 KubeletDirectory: &s.c.Root.Data.Kubernetes.Kubelet,
128 EphemeralDirectory: &s.c.Root.Ephemeral,
129 KPKI: s.c.KPKI,
130 }
131
132 err := supervisor.RunGroup(ctx, map[string]supervisor.Runnable{
133 "apiserver": apiserver.Run,
134 "kubelet": kubelet.Run,
135 })
136 if err != nil {
137 return fmt.Errorf("when starting apiserver/kubelet: %w", err)
138 }
139
140 supervisor.Signal(ctx, supervisor.SignalHealthy)
141
142 for status.ExternalAddress.Equal(address) {
143 status, err = networkWatch.Get(ctx)
144 if err != nil {
145 return fmt.Errorf("when watching for network changes: %w", err)
146 }
147 }
148 return fmt.Errorf("network configuration changed (%s -> %s)", address.String(), status.ExternalAddress.String())
149 })
Serge Bazanskic2c7ad92020-07-13 17:20:09 +0200150
151 csiPlugin := csiPluginServer{
152 KubeletDirectory: &s.c.Root.Data.Kubernetes.Kubelet,
153 VolumesDirectory: &s.c.Root.Data.Volumes,
154 }
155
156 csiProvisioner := csiProvisionerServer{
157 NodeName: hostname,
158 Kubernetes: clientSet,
159 InformerFactory: informerFactory,
160 VolumesDirectory: &s.c.Root.Data.Volumes,
161 }
162
163 clusternet := clusternet.Service{
164 NodeName: hostname,
165 Kubernetes: clientSet,
166 ClusterNet: s.c.ClusterNet,
167 InformerFactory: informerFactory,
168 DataDirectory: &s.c.Root.Data.Kubernetes.ClusterNetworking,
169 }
170
Lorenz Brunb682ba52020-07-08 14:51:36 +0200171 nfproxy := nfproxy.Service{
172 ClusterCIDR: s.c.ClusterNet,
173 ClientSet: clientSet,
174 }
175
Lorenz Brun4e090352021-03-17 17:44:41 +0100176 kvmDevicePlugin := kvmdevice.Plugin{
177 KubeletDirectory: &s.c.Root.Data.Kubernetes.Kubelet,
178 }
179
Serge Bazanskic2c7ad92020-07-13 17:20:09 +0200180 for _, sub := range []struct {
181 name string
182 runnable supervisor.Runnable
183 }{
Serge Bazanski967be212020-11-02 11:26:59 +0100184 {"controller-manager", runControllerManager(*controllerManagerConfig)},
185 {"scheduler", runScheduler(*schedulerConfig)},
Serge Bazanskic2c7ad92020-07-13 17:20:09 +0200186 {"reconciler", reconciler.Run(clientSet)},
187 {"csi-plugin", csiPlugin.Run},
188 {"csi-provisioner", csiProvisioner.Run},
189 {"clusternet", clusternet.Run},
Lorenz Brunb682ba52020-07-08 14:51:36 +0200190 {"nfproxy", nfproxy.Run},
Lorenz Brun4e090352021-03-17 17:44:41 +0100191 {"kvmdeviceplugin", kvmDevicePlugin.Run},
Serge Bazanskic2c7ad92020-07-13 17:20:09 +0200192 } {
193 err := supervisor.Run(ctx, sub.name, sub.runnable)
194 if err != nil {
195 return fmt.Errorf("could not run sub-service %q: %w", sub.name, err)
196 }
197 }
198
Lorenz Brunfa5c2fc2020-09-28 13:32:12 +0200199 supervisor.Logger(ctx).Info("Registering K8s CoreDNS")
200 clusterDNSDirective := dns.NewKubernetesDirective("cluster.local", masterKubeconfig)
Serge Bazanskid8af5bf2021-03-16 13:38:29 +0100201 s.c.Network.ConfigureDNS(clusterDNSDirective)
Lorenz Brunfa5c2fc2020-09-28 13:32:12 +0200202
Serge Bazanskic2c7ad92020-07-13 17:20:09 +0200203 supervisor.Signal(ctx, supervisor.SignalHealthy)
Lorenz Brunfa5c2fc2020-09-28 13:32:12 +0200204 <-ctx.Done()
Serge Bazanskid8af5bf2021-03-16 13:38:29 +0100205 s.c.Network.ConfigureDNS(dns.CancelDirective(clusterDNSDirective))
Serge Bazanskic2c7ad92020-07-13 17:20:09 +0200206 return nil
Lorenz Brun6e8f69c2019-11-18 10:44:24 +0100207}
208
Serge Bazanski216fe7b2021-05-21 18:36:16 +0200209// GetDebugKubeconfig issues a kubeconfig for an arbitrary given identity.
210// Useful for debugging and testing.
Serge Bazanskic2c7ad92020-07-13 17:20:09 +0200211func (s *Service) GetDebugKubeconfig(ctx context.Context, request *apb.GetDebugKubeconfigRequest) (*apb.GetDebugKubeconfigResponse, error) {
Serge Bazanski9411f7c2021-03-10 13:12:53 +0100212 client, err := s.c.KPKI.VolatileClient(ctx, request.Id, request.Groups)
213 if err != nil {
214 return nil, status.Errorf(codes.Unavailable, "Failed to get volatile client certificate: %v", err)
215 }
216 kubeconfig, err := pki.Kubeconfig(ctx, s.c.KPKI.KV, client)
Lorenz Brun878f5f92020-05-12 16:15:39 +0200217 if err != nil {
218 return nil, status.Errorf(codes.Unavailable, "Failed to generate kubeconfig: %v", err)
219 }
Serge Bazanski9411f7c2021-03-10 13:12:53 +0100220 return &apb.GetDebugKubeconfigResponse{DebugKubeconfig: string(kubeconfig)}, nil
Lorenz Brun6e8f69c2019-11-18 10:44:24 +0100221}