| Tim Windelschmidt | 6d33a43 | 2025-02-04 14:34:25 +0100 | [diff] [blame] | 1 | // Copyright The Monogon Project Authors. |
| 2 | // SPDX-License-Identifier: Apache-2.0 |
| 3 | |
| Lorenz Brun | 2d284b5 | 2023-03-08 17:05:12 +0100 | [diff] [blame] | 4 | package e2e |
| 5 | |
| 6 | import ( |
| 7 | "bufio" |
| 8 | "bytes" |
| 9 | "crypto/ed25519" |
| 10 | "crypto/rand" |
| 11 | "encoding/json" |
| 12 | "fmt" |
| 13 | "io" |
| 14 | "net" |
| 15 | "os" |
| 16 | "os/exec" |
| Tim Windelschmidt | 4bd25e8 | 2025-07-11 19:36:28 +0200 | [diff] [blame] | 17 | "path/filepath" |
| Lorenz Brun | 2d284b5 | 2023-03-08 17:05:12 +0100 | [diff] [blame] | 18 | "strings" |
| 19 | "testing" |
| 20 | "time" |
| 21 | |
| Tim Windelschmidt | 2a1d1b2 | 2024-02-06 07:07:42 +0100 | [diff] [blame] | 22 | "github.com/bazelbuild/rules_go/go/runfiles" |
| Lorenz Brun | 2d284b5 | 2023-03-08 17:05:12 +0100 | [diff] [blame] | 23 | "github.com/pkg/sftp" |
| 24 | "golang.org/x/crypto/ssh" |
| 25 | "google.golang.org/protobuf/proto" |
| 26 | |
| 27 | "source.monogon.dev/cloud/agent/api" |
| Tim Windelschmidt | 2a1d1b2 | 2024-02-06 07:07:42 +0100 | [diff] [blame] | 28 | |
| Tim Windelschmidt | 9f21f53 | 2024-05-07 15:14:20 +0200 | [diff] [blame] | 29 | "source.monogon.dev/osbase/fat32" |
| 30 | "source.monogon.dev/osbase/freeport" |
| Jan Schär | c1b6df4 | 2025-03-20 08:52:18 +0000 | [diff] [blame] | 31 | "source.monogon.dev/osbase/structfs" |
| Lorenz Brun | 2d284b5 | 2023-03-08 17:05:12 +0100 | [diff] [blame] | 32 | ) |
| 33 | |
var (
	// These are filled by bazel at linking time with the canonical path of
	// their corresponding file. Inside the init function we resolve it
	// with the rules_go runfiles package to the real path.

	// xCloudImagePath is attached to the test VM as a qcow2 virtio drive.
	xCloudImagePath string
	// xOvmfVarsPath is attached to the test VM as a pflash drive with
	// snapshot=on.
	xOvmfVarsPath string
	// xOvmfCodePath is attached to the test VM as a read-only pflash drive.
	xOvmfCodePath string
	// xTakeoverPath is the local file uploaded to the VM as "takeover" and
	// executed there.
	xTakeoverPath string
	// xQEMUPath is the executable launched to run the test VM.
	xQEMUPath string
)
| 44 | |
| 45 | func init() { |
| 46 | var err error |
| 47 | for _, path := range []*string{ |
| 48 | &xCloudImagePath, &xOvmfVarsPath, &xOvmfCodePath, |
| Tim Windelschmidt | 8f1efe9 | 2025-04-01 01:28:43 +0200 | [diff] [blame] | 49 | &xTakeoverPath, &xQEMUPath, |
| Tim Windelschmidt | 82e6af7 | 2024-07-23 00:05:42 +0000 | [diff] [blame] | 50 | } { |
| 51 | *path, err = runfiles.Rlocation(*path) |
| 52 | if err != nil { |
| 53 | panic(err) |
| 54 | } |
| 55 | } |
| Tim Windelschmidt | 4bd25e8 | 2025-07-11 19:36:28 +0200 | [diff] [blame] | 56 | // When running QEMU with snapshot=on set, QEMU creates a copy of the |
| 57 | // provided file in $TMPDIR. If $TMPDIR is set to /tmp, it will always |
| 58 | // be overridden to /var/tmp. This creates an issue for us, as the |
| 59 | // bazel tests only wire up /tmp, with /var/tmp being unaccessible |
| 60 | // because of permissions. Bazel provides $TEST_TMPDIR for this |
| 61 | // usecase, which we resolve to an absolute path and then override |
| 62 | // $TMPDIR. |
| 63 | tmpDir, err := filepath.Abs(os.Getenv("TEST_TMPDIR")) |
| 64 | if err != nil { |
| 65 | panic(err) |
| 66 | } |
| 67 | os.Setenv("TMPDIR", tmpDir) |
| Tim Windelschmidt | 82e6af7 | 2024-07-23 00:05:42 +0000 | [diff] [blame] | 68 | } |
| 69 | |
| Lorenz Brun | 2d284b5 | 2023-03-08 17:05:12 +0100 | [diff] [blame] | 70 | func TestE2E(t *testing.T) { |
| 71 | pubKey, privKey, err := ed25519.GenerateKey(rand.Reader) |
| 72 | if err != nil { |
| 73 | t.Fatal(err) |
| 74 | } |
| 75 | |
| 76 | sshPubKey, err := ssh.NewPublicKey(pubKey) |
| 77 | if err != nil { |
| 78 | t.Fatal(err) |
| 79 | } |
| 80 | |
| 81 | sshPrivkey, err := ssh.NewSignerFromKey(privKey) |
| 82 | if err != nil { |
| 83 | t.Fatal(err) |
| 84 | } |
| 85 | |
| 86 | // CloudConfig doesn't really have a rigid spec, so just put things into it |
| 87 | cloudConfig := make(map[string]any) |
| 88 | cloudConfig["ssh_authorized_keys"] = []string{ |
| 89 | strings.TrimSuffix(string(ssh.MarshalAuthorizedKey(sshPubKey)), "\n"), |
| 90 | } |
| 91 | |
| 92 | userData, err := json.Marshal(cloudConfig) |
| 93 | if err != nil { |
| 94 | t.Fatal(err) |
| 95 | } |
| 96 | |
| Jan Schär | c1b6df4 | 2025-03-20 08:52:18 +0000 | [diff] [blame] | 97 | root := structfs.Tree{ |
| 98 | structfs.File("user-data", structfs.Bytes("#cloud-config\n"+string(userData))), |
| 99 | structfs.File("meta-data", structfs.Bytes("")), |
| Lorenz Brun | 2d284b5 | 2023-03-08 17:05:12 +0100 | [diff] [blame] | 100 | } |
| 101 | cloudInitDataFile, err := os.CreateTemp("", "cidata*.img") |
| 102 | if err != nil { |
| 103 | t.Fatal(err) |
| 104 | } |
| 105 | defer os.Remove(cloudInitDataFile.Name()) |
| Jan Schär | c1b6df4 | 2025-03-20 08:52:18 +0000 | [diff] [blame] | 106 | if err := fat32.WriteFS(cloudInitDataFile, root, fat32.Options{Label: "cidata"}); err != nil { |
| Lorenz Brun | 2d284b5 | 2023-03-08 17:05:12 +0100 | [diff] [blame] | 107 | t.Fatal(err) |
| 108 | } |
| Lorenz Brun | 2d284b5 | 2023-03-08 17:05:12 +0100 | [diff] [blame] | 109 | |
| 110 | sshPort, sshPortCloser, err := freeport.AllocateTCPPort() |
| 111 | if err != nil { |
| 112 | t.Fatal(err) |
| 113 | } |
| 114 | |
| 115 | qemuArgs := []string{ |
| 116 | "-machine", "q35", "-accel", "kvm", "-nographic", "-nodefaults", "-m", "1024", |
| 117 | "-cpu", "host", "-smp", "sockets=1,cpus=1,cores=2,threads=2,maxcpus=4", |
| Tim Windelschmidt | 82e6af7 | 2024-07-23 00:05:42 +0000 | [diff] [blame] | 118 | "-drive", "if=pflash,format=raw,readonly=on,file=" + xOvmfCodePath, |
| 119 | "-drive", "if=pflash,format=raw,snapshot=on,file=" + xOvmfVarsPath, |
| 120 | "-drive", "if=virtio,format=qcow2,snapshot=on,cache=unsafe,file=" + xCloudImagePath, |
| Lorenz Brun | 2d284b5 | 2023-03-08 17:05:12 +0100 | [diff] [blame] | 121 | "-drive", "if=virtio,format=raw,snapshot=on,file=" + cloudInitDataFile.Name(), |
| 122 | "-netdev", fmt.Sprintf("user,id=net0,net=10.42.0.0/24,dhcpstart=10.42.0.10,hostfwd=tcp::%d-:22", sshPort), |
| 123 | "-device", "virtio-net-pci,netdev=net0,mac=22:d5:8e:76:1d:07", |
| 124 | "-device", "virtio-rng-pci", |
| 125 | "-serial", "stdio", |
| 126 | "-no-reboot", |
| 127 | } |
| Tim Windelschmidt | 8f1efe9 | 2025-04-01 01:28:43 +0200 | [diff] [blame] | 128 | qemuCmd := exec.Command(xQEMUPath, qemuArgs...) |
| Lorenz Brun | 2d284b5 | 2023-03-08 17:05:12 +0100 | [diff] [blame] | 129 | stdoutPipe, err := qemuCmd.StdoutPipe() |
| 130 | if err != nil { |
| 131 | t.Fatal(err) |
| 132 | } |
| 133 | agentStarted := make(chan struct{}) |
| 134 | go func() { |
| 135 | s := bufio.NewScanner(stdoutPipe) |
| 136 | for s.Scan() { |
| 137 | t.Log("kernel: " + s.Text()) |
| 138 | if strings.Contains(s.Text(), "Monogon BMaaS Agent started") { |
| 139 | agentStarted <- struct{}{} |
| 140 | break |
| 141 | } |
| 142 | } |
| 143 | qemuCmd.Wait() |
| 144 | }() |
| 145 | qemuCmd.Stderr = os.Stderr |
| 146 | sshPortCloser.Close() |
| 147 | if err := qemuCmd.Start(); err != nil { |
| 148 | t.Fatal(err) |
| 149 | } |
| 150 | defer qemuCmd.Process.Kill() |
| 151 | |
| 152 | var c *ssh.Client |
| 153 | for { |
| 154 | c, err = ssh.Dial("tcp", net.JoinHostPort("localhost", fmt.Sprintf("%d", sshPort)), &ssh.ClientConfig{ |
| 155 | User: "debian", |
| 156 | Auth: []ssh.AuthMethod{ssh.PublicKeys(sshPrivkey)}, |
| 157 | HostKeyCallback: ssh.InsecureIgnoreHostKey(), |
| 158 | Timeout: 5 * time.Second, |
| 159 | }) |
| 160 | if err != nil { |
| 161 | t.Logf("error connecting via SSH, retrying: %v", err) |
| 162 | time.Sleep(1 * time.Second) |
| 163 | continue |
| 164 | } |
| 165 | break |
| 166 | } |
| 167 | defer c.Close() |
| 168 | sc, err := sftp.NewClient(c) |
| 169 | if err != nil { |
| 170 | t.Fatal(err) |
| 171 | } |
| 172 | defer sc.Close() |
| 173 | takeoverFile, err := sc.Create("takeover") |
| 174 | if err != nil { |
| 175 | t.Fatal(err) |
| 176 | } |
| 177 | defer takeoverFile.Close() |
| 178 | if err := takeoverFile.Chmod(0o755); err != nil { |
| 179 | t.Fatal(err) |
| 180 | } |
| Tim Windelschmidt | 82e6af7 | 2024-07-23 00:05:42 +0000 | [diff] [blame] | 181 | takeoverSrcFile, err := os.Open(xTakeoverPath) |
| Lorenz Brun | 2d284b5 | 2023-03-08 17:05:12 +0100 | [diff] [blame] | 182 | if err != nil { |
| 183 | t.Fatal(err) |
| 184 | } |
| 185 | defer takeoverSrcFile.Close() |
| Tim Windelschmidt | 681d515 | 2025-01-08 00:19:33 +0100 | [diff] [blame] | 186 | |
| Lorenz Brun | 2d284b5 | 2023-03-08 17:05:12 +0100 | [diff] [blame] | 187 | if _, err := io.Copy(takeoverFile, takeoverSrcFile); err != nil { |
| 188 | t.Fatal(err) |
| 189 | } |
| 190 | if err := takeoverFile.Close(); err != nil { |
| 191 | t.Fatal(err) |
| 192 | } |
| 193 | sc.Close() |
| 194 | |
| 195 | sess, err := c.NewSession() |
| 196 | if err != nil { |
| 197 | t.Fatal(err) |
| 198 | } |
| 199 | defer sess.Close() |
| 200 | |
| 201 | init := api.TakeoverInit{ |
| Lorenz Brun | 5b8b860 | 2023-03-09 17:22:21 +0100 | [diff] [blame] | 202 | MachineId: "test", |
| Lorenz Brun | 2d284b5 | 2023-03-08 17:05:12 +0100 | [diff] [blame] | 203 | BmaasEndpoint: "localhost:1234", |
| 204 | } |
| 205 | initRaw, err := proto.Marshal(&init) |
| 206 | if err != nil { |
| 207 | t.Fatal(err) |
| 208 | } |
| 209 | sess.Stdin = bytes.NewReader(initRaw) |
| 210 | var stdoutBuf bytes.Buffer |
| 211 | var stderrBuf bytes.Buffer |
| 212 | sess.Stdout = &stdoutBuf |
| 213 | sess.Stderr = &stderrBuf |
| 214 | if err := sess.Run("sudo ./takeover"); err != nil { |
| 215 | t.Errorf("stderr:\n%s\n\n", stderrBuf.String()) |
| 216 | t.Fatal(err) |
| 217 | } |
| 218 | var resp api.TakeoverResponse |
| 219 | if err := proto.Unmarshal(stdoutBuf.Bytes(), &resp); err != nil { |
| 220 | t.Fatal(err) |
| 221 | } |
| 222 | switch res := resp.Result.(type) { |
| 223 | case *api.TakeoverResponse_Success: |
| 224 | if res.Success.InitMessage.BmaasEndpoint != init.BmaasEndpoint { |
| Tim Windelschmidt | d0d5d9d | 2025-03-26 22:07:11 +0100 | [diff] [blame] | 225 | t.Fatal("InitMessage not passed through properly") |
| Lorenz Brun | 2d284b5 | 2023-03-08 17:05:12 +0100 | [diff] [blame] | 226 | } |
| 227 | case *api.TakeoverResponse_Error: |
| 228 | t.Fatalf("takeover returned error: %v", res.Error.Message) |
| 229 | } |
| 230 | select { |
| 231 | case <-agentStarted: |
| 232 | // Done, test passed |
| 233 | case <-time.After(30 * time.Second): |
| 234 | t.Fatal("Waiting for BMaaS agent startup timed out") |
| 235 | } |
| 236 | } |