2024-07-08 21:18:55 +01:00
|
|
|
// Copyright (c) Tailscale Inc & AUTHORS
|
|
|
|
// SPDX-License-Identifier: BSD-3-Clause
|
|
|
|
|
|
|
|
//go:build !plan9
|
|
|
|
|
2024-07-29 13:57:11 +01:00
|
|
|
// Package sessionrecording contains functionality for recording Kubernetes API
|
|
|
|
// server proxy 'kubectl exec' sessions.
|
|
|
|
package sessionrecording
|
2024-07-08 21:18:55 +01:00
|
|
|
|
|
|
|
import (
|
|
|
|
"bufio"
|
|
|
|
"bytes"
|
|
|
|
"context"
|
|
|
|
"fmt"
|
|
|
|
"io"
|
|
|
|
"net"
|
|
|
|
"net/http"
|
|
|
|
"net/netip"
|
|
|
|
"strings"
|
|
|
|
|
|
|
|
"github.com/pkg/errors"
|
|
|
|
"go.uber.org/zap"
|
|
|
|
"tailscale.com/client/tailscale/apitype"
|
2024-07-29 13:57:11 +01:00
|
|
|
"tailscale.com/k8s-operator/sessionrecording/spdy"
|
|
|
|
"tailscale.com/k8s-operator/sessionrecording/tsrecorder"
|
2024-08-14 17:57:50 +01:00
|
|
|
"tailscale.com/k8s-operator/sessionrecording/ws"
|
2024-07-29 13:57:11 +01:00
|
|
|
"tailscale.com/sessionrecording"
|
2024-07-08 21:18:55 +01:00
|
|
|
"tailscale.com/tailcfg"
|
|
|
|
"tailscale.com/tsnet"
|
|
|
|
"tailscale.com/tstime"
|
2024-07-29 13:57:11 +01:00
|
|
|
"tailscale.com/util/clientmetric"
|
2024-07-08 21:18:55 +01:00
|
|
|
"tailscale.com/util/multierr"
|
|
|
|
)
|
|
|
|
|
2024-08-14 17:57:50 +01:00
|
|
|
// Protocol names the streaming protocol used by a hijacked session. The
// supported protocols are SPDY and WebSocket.
type Protocol string

// Streaming protocols that a Hijacker knows how to record.
const (
	// SPDYProtocol selects the SPDY streaming protocol.
	SPDYProtocol Protocol = "SPDY"
	// WSProtocol selects the WebSocket streaming protocol.
	WSProtocol Protocol = "WebSocket"
)
|
2024-07-29 13:57:11 +01:00
|
|
|
|
|
|
|
var (
|
|
|
|
// CounterSessionRecordingsAttempted counts the number of session recording attempts.
|
|
|
|
CounterSessionRecordingsAttempted = clientmetric.NewCounter("k8s_auth_proxy_session_recordings_attempted")
|
|
|
|
|
|
|
|
// counterSessionRecordingsUploaded counts the number of successfully uploaded session recordings.
|
|
|
|
counterSessionRecordingsUploaded = clientmetric.NewCounter("k8s_auth_proxy_session_recordings_uploaded")
|
|
|
|
)
|
|
|
|
|
2024-08-14 17:57:50 +01:00
|
|
|
func New(opts HijackerOpts) *Hijacker {
|
2024-07-29 13:57:11 +01:00
|
|
|
return &Hijacker{
|
2024-08-14 17:57:50 +01:00
|
|
|
ts: opts.TS,
|
|
|
|
req: opts.Req,
|
|
|
|
who: opts.Who,
|
|
|
|
ResponseWriter: opts.W,
|
|
|
|
pod: opts.Pod,
|
|
|
|
ns: opts.Namespace,
|
|
|
|
addrs: opts.Addrs,
|
|
|
|
failOpen: opts.FailOpen,
|
|
|
|
proto: opts.Proto,
|
|
|
|
log: opts.Log,
|
|
|
|
connectToRecorder: sessionrecording.ConnectToRecorder,
|
2024-07-29 13:57:11 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-08-14 17:57:50 +01:00
|
|
|
type HijackerOpts struct {
|
|
|
|
TS *tsnet.Server
|
|
|
|
Req *http.Request
|
|
|
|
W http.ResponseWriter
|
|
|
|
Who *apitype.WhoIsResponse
|
|
|
|
Addrs []netip.AddrPort
|
|
|
|
Log *zap.SugaredLogger
|
|
|
|
Pod string
|
|
|
|
Namespace string
|
|
|
|
FailOpen bool
|
|
|
|
Proto Protocol
|
|
|
|
}
|
|
|
|
|
2024-07-29 13:57:11 +01:00
|
|
|
// Hijacker implements [net/http.Hijacker] interface.
|
2024-07-08 21:18:55 +01:00
|
|
|
// It must be configured with an http request for a 'kubectl exec' session that
|
|
|
|
// needs to be recorded. It knows how to hijack the connection and configure for
|
|
|
|
// the session contents to be sent to a tsrecorder instance.
|
2024-07-29 13:57:11 +01:00
|
|
|
type Hijacker struct {
|
2024-07-08 21:18:55 +01:00
|
|
|
http.ResponseWriter
|
|
|
|
ts *tsnet.Server
|
|
|
|
req *http.Request
|
|
|
|
who *apitype.WhoIsResponse
|
|
|
|
log *zap.SugaredLogger
|
|
|
|
pod string // pod being exec-d
|
|
|
|
ns string // namespace of the pod being exec-d
|
|
|
|
addrs []netip.AddrPort // tsrecorder addresses
|
|
|
|
failOpen bool // whether to fail open if recording fails
|
|
|
|
connectToRecorder RecorderDialFn
|
2024-08-14 17:57:50 +01:00
|
|
|
proto Protocol // streaming protocol
|
2024-07-08 21:18:55 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// RecorderDialFn dials the specified netip.AddrPorts that should be tsrecorder
|
|
|
|
// addresses. It tries to connect to recorder endpoints one by one, till one
|
|
|
|
// connection succeeds. In case of success, returns a list with a single
|
|
|
|
// successful recording attempt and an error channel. If the connection errors
|
|
|
|
// after having been established, an error is sent down the channel.
|
|
|
|
type RecorderDialFn func(context.Context, []netip.AddrPort, func(context.Context, string, string) (net.Conn, error)) (io.WriteCloser, []*tailcfg.SSHRecordingAttempt, <-chan error, error)
|
|
|
|
|
|
|
|
// Hijack hijacks a 'kubectl exec' session and configures for the session
|
|
|
|
// contents to be sent to a recorder.
|
2024-07-29 13:57:11 +01:00
|
|
|
func (h *Hijacker) Hijack() (net.Conn, *bufio.ReadWriter, error) {
|
2024-07-08 21:18:55 +01:00
|
|
|
h.log.Infof("recorder addrs: %v, failOpen: %v", h.addrs, h.failOpen)
|
|
|
|
reqConn, brw, err := h.ResponseWriter.(http.Hijacker).Hijack()
|
|
|
|
if err != nil {
|
|
|
|
return nil, nil, fmt.Errorf("error hijacking connection: %w", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
conn, err := h.setUpRecording(context.Background(), reqConn)
|
|
|
|
if err != nil {
|
|
|
|
return nil, nil, fmt.Errorf("error setting up session recording: %w", err)
|
|
|
|
}
|
|
|
|
return conn, brw, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// setupRecording attempts to connect to the recorders set via
|
|
|
|
// spdyHijacker.addrs. Returns conn from provided opts, wrapped in recording
|
|
|
|
// logic. If connecting to the recorder fails or an error is received during the
|
|
|
|
// session and spdyHijacker.failOpen is false, connection will be closed.
|
2024-07-29 13:57:11 +01:00
|
|
|
func (h *Hijacker) setUpRecording(ctx context.Context, conn net.Conn) (net.Conn, error) {
|
2024-07-08 21:18:55 +01:00
|
|
|
const (
|
|
|
|
// https://docs.asciinema.org/manual/asciicast/v2/
|
|
|
|
asciicastv2 = 2
|
|
|
|
)
|
2024-08-14 17:57:50 +01:00
|
|
|
var (
|
|
|
|
wc io.WriteCloser
|
|
|
|
err error
|
|
|
|
errChan <-chan error
|
|
|
|
)
|
2024-07-08 21:18:55 +01:00
|
|
|
h.log.Infof("kubectl exec session will be recorded, recorders: %v, fail open policy: %t", h.addrs, h.failOpen)
|
|
|
|
// TODO (irbekrm): send client a message that session will be recorded.
|
2024-08-14 17:57:50 +01:00
|
|
|
wc, _, errChan, err = h.connectToRecorder(ctx, h.addrs, h.ts.Dial)
|
2024-07-08 21:18:55 +01:00
|
|
|
if err != nil {
|
|
|
|
msg := fmt.Sprintf("error connecting to session recorders: %v", err)
|
|
|
|
if h.failOpen {
|
|
|
|
msg = msg + "; failure mode is 'fail open'; continuing session without recording."
|
|
|
|
h.log.Warnf(msg)
|
|
|
|
return conn, nil
|
|
|
|
}
|
|
|
|
msg = msg + "; failure mode is 'fail closed'; closing connection."
|
|
|
|
if err := closeConnWithWarning(conn, msg); err != nil {
|
|
|
|
return nil, multierr.New(errors.New(msg), err)
|
|
|
|
}
|
|
|
|
return nil, errors.New(msg)
|
|
|
|
}
|
|
|
|
|
|
|
|
// TODO (irbekrm): log which recorder
|
|
|
|
h.log.Info("successfully connected to a session recorder")
|
|
|
|
cl := tstime.DefaultClock{}
|
2024-07-29 13:57:11 +01:00
|
|
|
rec := tsrecorder.New(wc, cl, cl.Now(), h.failOpen)
|
2024-07-08 21:18:55 +01:00
|
|
|
qp := h.req.URL.Query()
|
2024-07-29 13:57:11 +01:00
|
|
|
ch := sessionrecording.CastHeader{
|
2024-07-08 21:18:55 +01:00
|
|
|
Version: asciicastv2,
|
2024-07-29 13:57:11 +01:00
|
|
|
Timestamp: cl.Now().Unix(),
|
2024-07-08 21:18:55 +01:00
|
|
|
Command: strings.Join(qp["command"], " "),
|
|
|
|
SrcNode: strings.TrimSuffix(h.who.Node.Name, "."),
|
|
|
|
SrcNodeID: h.who.Node.StableID,
|
2024-07-29 13:57:11 +01:00
|
|
|
Kubernetes: &sessionrecording.Kubernetes{
|
2024-07-08 21:18:55 +01:00
|
|
|
PodName: h.pod,
|
|
|
|
Namespace: h.ns,
|
2024-07-10 10:48:53 +01:00
|
|
|
Container: strings.Join(qp["container"], " "),
|
2024-07-08 21:18:55 +01:00
|
|
|
},
|
|
|
|
}
|
|
|
|
if !h.who.Node.IsTagged() {
|
|
|
|
ch.SrcNodeUser = h.who.UserProfile.LoginName
|
|
|
|
ch.SrcNodeUserID = h.who.Node.User
|
|
|
|
} else {
|
|
|
|
ch.SrcNodeTags = h.who.Node.Tags
|
|
|
|
}
|
2024-08-14 17:57:50 +01:00
|
|
|
|
|
|
|
var lc net.Conn
|
|
|
|
switch h.proto {
|
|
|
|
case SPDYProtocol:
|
|
|
|
lc = spdy.New(conn, rec, ch, h.log)
|
|
|
|
case WSProtocol:
|
|
|
|
lc = ws.New(conn, rec, ch, h.log)
|
|
|
|
default:
|
|
|
|
return nil, fmt.Errorf("unknown protocol: %s", h.proto)
|
|
|
|
}
|
|
|
|
|
2024-07-08 21:18:55 +01:00
|
|
|
go func() {
|
|
|
|
var err error
|
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
return
|
|
|
|
case err = <-errChan:
|
|
|
|
}
|
|
|
|
if err == nil {
|
2024-07-10 14:00:42 +01:00
|
|
|
counterSessionRecordingsUploaded.Add(1)
|
2024-07-08 21:18:55 +01:00
|
|
|
h.log.Info("finished uploading the recording")
|
|
|
|
return
|
|
|
|
}
|
|
|
|
msg := fmt.Sprintf("connection to the session recorder errorred: %v;", err)
|
|
|
|
if h.failOpen {
|
|
|
|
msg += msg + "; failure mode is 'fail open'; continuing session without recording."
|
|
|
|
h.log.Info(msg)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
msg += "; failure mode set to 'fail closed'; closing connection"
|
|
|
|
h.log.Error(msg)
|
|
|
|
// TODO (irbekrm): write a message to the client
|
|
|
|
if err := lc.Close(); err != nil {
|
|
|
|
h.log.Infof("error closing recorder connections: %v", err)
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}()
|
|
|
|
return lc, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func closeConnWithWarning(conn net.Conn, msg string) error {
|
|
|
|
b := io.NopCloser(bytes.NewBuffer([]byte(msg)))
|
|
|
|
resp := http.Response{Status: http.StatusText(http.StatusForbidden), StatusCode: http.StatusForbidden, Body: b}
|
|
|
|
if err := resp.Write(conn); err != nil {
|
|
|
|
return multierr.New(fmt.Errorf("error writing msg %q to conn: %v", msg, err), conn.Close())
|
|
|
|
}
|
|
|
|
return conn.Close()
|
|
|
|
}
|