| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403 |
- package ebpftracer
- import (
- "bytes"
- "encoding/binary"
- "errors"
- "fmt"
- "os"
- "runtime"
- "strconv"
- "strings"
- "time"
- "github.com/cilium/ebpf"
- "github.com/cilium/ebpf/link"
- "github.com/cilium/ebpf/perf"
- "github.com/coroot/coroot-node-agent/common"
- "github.com/coroot/coroot-node-agent/ebpftracer/l7"
- "github.com/coroot/coroot-node-agent/proc"
- "golang.org/x/mod/semver"
- "golang.org/x/sys/unix"
- "inet.af/netaddr"
- "k8s.io/klog/v2"
- )
- const MaxPayloadSize = 1024
- type EventType uint32
- type EventReason uint32
- const (
- EventTypeProcessStart EventType = 1
- EventTypeProcessExit EventType = 2
- EventTypeConnectionOpen EventType = 3
- EventTypeConnectionClose EventType = 4
- EventTypeConnectionError EventType = 5
- EventTypeListenOpen EventType = 6
- EventTypeListenClose EventType = 7
- EventTypeFileOpen EventType = 8
- EventTypeTCPRetransmit EventType = 9
- EventTypeL7Request EventType = 10
- EventReasonNone EventReason = 0
- EventReasonOOMKill EventReason = 1
- )
- type Event struct {
- Type EventType
- Reason EventReason
- Pid uint32
- SrcAddr netaddr.IPPort
- DstAddr netaddr.IPPort
- Fd uint64
- Timestamp uint64
- L7Request *l7.RequestData
- }
- type perfMapType uint8
- const (
- perfMapTypeProcEvents perfMapType = 1
- perfMapTypeTCPEvents perfMapType = 2
- perfMapTypeFileEvents perfMapType = 3
- perfMapTypeL7Events perfMapType = 4
- )
- type Tracer struct {
- kernelVersion string
- disableL7Tracing bool
- collection *ebpf.Collection
- readers map[string]*perf.Reader
- links []link.Link
- uprobes map[string]*ebpf.Program
- }
- func NewTracer(kernelVersion string, disableL7Tracing bool) *Tracer {
- if disableL7Tracing {
- klog.Infoln("L7 tracing is disabled")
- }
- return &Tracer{
- kernelVersion: kernelVersion,
- disableL7Tracing: disableL7Tracing,
- readers: map[string]*perf.Reader{},
- uprobes: map[string]*ebpf.Program{},
- }
- }
- func (t *Tracer) Run(events chan<- Event) error {
- if err := t.ebpf(events); err != nil {
- return err
- }
- if err := t.init(events); err != nil {
- return err
- }
- return nil
- }
- func (t *Tracer) Close() {
- for _, p := range t.uprobes {
- _ = p.Close()
- }
- for _, l := range t.links {
- _ = l.Close()
- }
- for _, r := range t.readers {
- _ = r.Close()
- }
- t.collection.Close()
- }
- func (t *Tracer) init(ch chan<- Event) error {
- pids, err := proc.ListPids()
- if err != nil {
- return fmt.Errorf("failed to list pids: %w", err)
- }
- for _, pid := range pids {
- ch <- Event{Type: EventTypeProcessStart, Pid: pid}
- }
- fds, sockets := readFds(pids)
- for _, fd := range fds {
- ch <- Event{Type: EventTypeFileOpen, Pid: fd.pid, Fd: fd.fd}
- }
- listens := map[uint64]bool{}
- for _, s := range sockets {
- if s.Listen {
- listens[uint64(s.pid)<<32|uint64(s.SAddr.Port())] = true
- }
- }
- for _, s := range sockets {
- typ := EventTypeConnectionOpen
- if s.Listen {
- typ = EventTypeListenOpen
- } else if listens[uint64(s.pid)<<32|uint64(s.SAddr.Port())] || s.DAddr.Port() > s.SAddr.Port() { // inbound
- continue
- }
- ch <- Event{
- Type: typ,
- Pid: s.pid,
- Fd: s.fd,
- SrcAddr: s.SAddr,
- DstAddr: s.DAddr,
- }
- }
- return nil
- }
- type perfMap struct {
- name string
- perCPUBufferSizePages int
- typ perfMapType
- }
- func (t *Tracer) ebpf(ch chan<- Event) error {
- if _, ok := ebpfProg[runtime.GOARCH]; !ok {
- return fmt.Errorf("unsupported architecture: %s", runtime.GOARCH)
- }
- kv := "v" + common.KernelMajorMinor(t.kernelVersion)
- var prg []byte
- for _, p := range ebpfProg[runtime.GOARCH] {
- if semver.Compare(kv, p.v) >= 0 {
- prg = p.p
- break
- }
- }
- if len(prg) == 0 {
- return fmt.Errorf("unsupported kernel version: %s", t.kernelVersion)
- }
- _, debugFsErr := os.Stat("/sys/kernel/debug/tracing")
- _, traceFsErr := os.Stat("/sys/kernel/tracing")
- if debugFsErr != nil && traceFsErr != nil {
- return fmt.Errorf("kernel tracing is not available: debugfs or tracefs must be mounted")
- }
- collectionSpec, err := ebpf.LoadCollectionSpecFromReader(bytes.NewReader(prg))
- if err != nil {
- return fmt.Errorf("failed to load collection spec: %w", err)
- }
- _ = unix.Setrlimit(unix.RLIMIT_MEMLOCK, &unix.Rlimit{Cur: unix.RLIM_INFINITY, Max: unix.RLIM_INFINITY})
- c, err := ebpf.NewCollectionWithOptions(collectionSpec, ebpf.CollectionOptions{
- //Programs: ebpf.ProgramOptions{LogLevel: 2, LogSize: 20 * 1024 * 1024},
- })
- if err != nil {
- var verr *ebpf.VerifierError
- if errors.As(err, &verr) {
- klog.Errorf("%+v", verr)
- }
- return fmt.Errorf("failed to load collection: %w", err)
- }
- t.collection = c
- perfMaps := []perfMap{
- {name: "proc_events", typ: perfMapTypeProcEvents, perCPUBufferSizePages: 4},
- {name: "tcp_listen_events", typ: perfMapTypeTCPEvents, perCPUBufferSizePages: 4},
- {name: "tcp_connect_events", typ: perfMapTypeTCPEvents, perCPUBufferSizePages: 8},
- {name: "tcp_retransmit_events", typ: perfMapTypeTCPEvents, perCPUBufferSizePages: 4},
- {name: "file_events", typ: perfMapTypeFileEvents, perCPUBufferSizePages: 4},
- }
- if !t.disableL7Tracing {
- perfMaps = append(perfMaps, perfMap{name: "l7_events", typ: perfMapTypeL7Events, perCPUBufferSizePages: 32})
- }
- for _, pm := range perfMaps {
- r, err := perf.NewReader(t.collection.Maps[pm.name], pm.perCPUBufferSizePages*os.Getpagesize())
- if err != nil {
- t.Close()
- return fmt.Errorf("failed to create ebpf reader: %w", err)
- }
- t.readers[pm.name] = r
- go runEventsReader(pm.name, r, ch, pm.typ)
- }
- for _, programSpec := range collectionSpec.Programs {
- program := t.collection.Programs[programSpec.Name]
- if t.disableL7Tracing {
- switch programSpec.Name {
- case "sys_enter_writev", "sys_enter_write", "sys_enter_sendto", "sys_enter_sendmsg":
- continue
- case "sys_enter_read", "sys_enter_readv", "sys_enter_recvfrom", "sys_enter_recvmsg":
- continue
- case "sys_exit_read", "sys_exit_readv", "sys_exit_recvfrom", "sys_exit_recvmsg":
- continue
- }
- }
- var l link.Link
- switch programSpec.Type {
- case ebpf.TracePoint:
- parts := strings.SplitN(programSpec.AttachTo, "/", 2)
- l, err = link.Tracepoint(parts[0], parts[1], program, nil)
- case ebpf.Kprobe:
- if strings.HasPrefix(programSpec.SectionName, "uprobe/") {
- t.uprobes[programSpec.Name] = program
- continue
- }
- l, err = link.Kprobe(programSpec.AttachTo, program, nil)
- }
- if err != nil {
- t.Close()
- return fmt.Errorf("failed to link program: %w", err)
- }
- t.links = append(t.links, l)
- }
- return nil
- }
- func (t EventType) String() string {
- switch t {
- case EventTypeProcessStart:
- return "process-start"
- case EventTypeProcessExit:
- return "process-exit"
- case EventTypeConnectionOpen:
- return "connection-open"
- case EventTypeConnectionClose:
- return "connection-close"
- case EventTypeConnectionError:
- return "connection-error"
- case EventTypeListenOpen:
- return "listen-open"
- case EventTypeListenClose:
- return "listen-close"
- case EventTypeFileOpen:
- return "file-open"
- case EventTypeTCPRetransmit:
- return "tcp-retransmit"
- case EventTypeL7Request:
- return "l7-request"
- }
- return "unknown: " + strconv.Itoa(int(t))
- }
- func (t EventReason) String() string {
- switch t {
- case EventReasonNone:
- return "none"
- case EventReasonOOMKill:
- return "oom-kill"
- }
- return "unknown: " + strconv.Itoa(int(t))
- }
- type procEvent struct {
- Type EventType
- Pid uint32
- Reason uint32
- }
- type tcpEvent struct {
- Fd uint64
- Timestamp uint64
- Type EventType
- Pid uint32
- SPort uint16
- DPort uint16
- SAddr [16]byte
- DAddr [16]byte
- }
- type fileEvent struct {
- Type EventType
- Pid uint32
- Fd uint64
- }
- type l7Event struct {
- Fd uint64
- ConnectionTimestamp uint64
- Pid uint32
- Status uint32
- Duration uint64
- Protocol uint8
- Method uint8
- Padding uint16
- StatementId uint32
- PayloadSize uint64
- }
- func runEventsReader(name string, r *perf.Reader, ch chan<- Event, typ perfMapType) {
- for {
- rec, err := r.Read()
- if err != nil {
- if errors.Is(err, perf.ErrClosed) {
- break
- }
- continue
- }
- if rec.LostSamples > 0 {
- klog.Errorln(name, "lost samples:", rec.LostSamples)
- continue
- }
- var event Event
- switch typ {
- case perfMapTypeL7Events:
- v := &l7Event{}
- reader := bytes.NewBuffer(rec.RawSample)
- if err := binary.Read(reader, binary.LittleEndian, v); err != nil {
- klog.Warningln("failed to read msg:", err)
- continue
- }
- payload := reader.Bytes()
- req := &l7.RequestData{
- Protocol: l7.Protocol(v.Protocol),
- Status: l7.Status(v.Status),
- Duration: time.Duration(v.Duration),
- Method: l7.Method(v.Method),
- StatementId: v.StatementId,
- }
- switch {
- case v.PayloadSize == 0:
- case v.PayloadSize > MaxPayloadSize:
- req.Payload = payload[:MaxPayloadSize]
- default:
- req.Payload = payload[:v.PayloadSize]
- }
- event = Event{Type: EventTypeL7Request, Pid: v.Pid, Fd: v.Fd, Timestamp: v.ConnectionTimestamp, L7Request: req}
- case perfMapTypeFileEvents:
- v := &fileEvent{}
- if err := binary.Read(bytes.NewBuffer(rec.RawSample), binary.LittleEndian, v); err != nil {
- klog.Warningln("failed to read msg:", err)
- continue
- }
- event = Event{Type: v.Type, Pid: v.Pid, Fd: v.Fd}
- case perfMapTypeProcEvents:
- v := &procEvent{}
- if err := binary.Read(bytes.NewBuffer(rec.RawSample), binary.LittleEndian, v); err != nil {
- klog.Warningln("failed to read msg:", err)
- continue
- }
- event = Event{Type: v.Type, Reason: EventReason(v.Reason), Pid: v.Pid}
- case perfMapTypeTCPEvents:
- v := &tcpEvent{}
- if err := binary.Read(bytes.NewBuffer(rec.RawSample), binary.LittleEndian, v); err != nil {
- klog.Warningln("failed to read msg:", err)
- continue
- }
- event = Event{
- Type: v.Type,
- Pid: v.Pid,
- SrcAddr: ipPort(v.SAddr, v.SPort),
- DstAddr: ipPort(v.DAddr, v.DPort),
- Fd: v.Fd,
- Timestamp: v.Timestamp,
- }
- default:
- continue
- }
- ch <- event
- }
- }
- func ipPort(ip [16]byte, port uint16) netaddr.IPPort {
- i, _ := netaddr.FromStdIP(ip[:])
- return netaddr.IPPortFrom(i, port)
- }
|