tracer.go 26 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948
  1. package ebpftracer
  2. import (
  3. "bytes"
  4. debugelf "debug/elf"
  5. "encoding/binary"
  6. "encoding/hex"
  7. "errors"
  8. "fmt"
  9. "os"
  10. "strconv"
  11. "strings"
  12. "time"
  13. "github.com/coroot/coroot-node-agent/utils"
  14. "github.com/coroot/coroot-node-agent/utils/try"
  15. "github.com/cilium/ebpf"
  16. "github.com/cilium/ebpf/link"
  17. "github.com/cilium/ebpf/perf"
  18. "github.com/coroot/coroot-node-agent/common"
  19. "github.com/coroot/coroot-node-agent/ebpftracer/l7"
  20. "github.com/coroot/coroot-node-agent/ebpftracer/tracer"
  21. "github.com/coroot/coroot-node-agent/proc"
  22. . "github.com/coroot/coroot-node-agent/utils/modelse"
  23. klog "github.com/sirupsen/logrus"
  24. "golang.org/x/sys/unix"
  25. "inet.af/netaddr"
  26. )
  27. /*
  28. #define TASK_COMM_LEN 16
  29. #define BURST_DATA_BUF_SIZE 8192 // For burst send buffer
  30. #include <linux/types.h>
  31. struct __tuple_t {
  32. __u8 daddr[16];
  33. __u8 rcv_saddr[16];
  34. __u8 addr_len;
  35. __u8 l4_protocol;
  36. __u16 dport;
  37. __u16 num;
  38. };
  39. struct __socket_data {
  40. __u32 pid;
  41. __u32 tgid;
  42. __u64 coroutine_id;
  43. __u8 source;
  44. __u8 comm[TASK_COMM_LEN];
  45. __u64 socket_id;
  46. struct __tuple_t tuple;
  47. __u32 extra_data;
  48. __u32 extra_data_count;
  49. __u32 tcp_seq;
  50. __u64 thread_trace_id;
  51. __u64 timestamp;
  52. __u8 direction: 1;
  53. __u8 msg_type: 7;
  54. __u64 syscall_len;
  55. __u64 data_seq;
  56. __u16 data_type;
  57. __u16 data_len;
  58. char data[BURST_DATA_BUF_SIZE];
  59. } __attribute__((packed));
  60. struct __socket_data_buffer {
  61. __u32 events_num;
  62. __u32 len;
  63. char data[32760];
  64. };
  65. */
  66. import "C"
  67. type SocketData C.struct___socket_data
  68. type SocketDataBuffer C.struct___socket_data_buffer
  // MaxPayloadSize is the upper bound, in bytes, applied to the payload
  // attached to an L7 request when it is decoded from a perf record.
  const MaxPayloadSize = 1024

  type (
  	// EventType identifies what kind of event is delivered to consumers.
  	EventType uint32
  	// EventReason carries an optional cause attached to a process event.
  	EventReason uint32
  )

  // Event type values. The numbers are spelled out explicitly because they
  // are also decoded straight from kernel-side records.
  const (
  	EventTypeProcessStart    = EventType(1)
  	EventTypeProcessExit     = EventType(2)
  	EventTypeConnectionOpen  = EventType(3)
  	EventTypeConnectionClose = EventType(4)
  	EventTypeConnectionError = EventType(5)
  	EventTypeListenOpen      = EventType(6)
  	EventTypeListenClose     = EventType(7)
  	EventTypeFileOpen        = EventType(8)
  	EventTypeTCPRetransmit   = EventType(9)
  	EventTypeL7Request       = EventType(10)
  	EventTypeFunEnt          = EventType(11)
  	EventTypeFunRet          = EventType(12)
  	EventTypeAcceptOpen      = EventType(13)
  	EventTypeAcceptClose     = EventType(14)
  )

  // Event reason values.
  const (
  	EventReasonNone    = EventReason(0)
  	EventReasonOOMKill = EventReason(1)
  )
  // TrafficStats holds the byte counters reported when a connection is closed.
  type TrafficStats struct {
  	BytesSent, BytesReceived uint64
  }
  94. type Event struct {
  95. StackEvent *StackEvent
  96. Type EventType
  97. Reason EventReason
  98. Pid uint32
  99. SrcAddr netaddr.IPPort
  100. DstAddr netaddr.IPPort
  101. Fd uint64
  102. Timestamp uint64
  103. Duration time.Duration
  104. L7Request *l7.RequestData
  105. TrafficStats *TrafficStats
  106. FirstReadTime uint64
  107. FirstWriteTime uint64
  108. NewReadTime uint64
  109. }
  // perfMapType selects how records read from a perf map are decoded.
  type perfMapType uint8

  const (
  	perfMapTypeProcEvents         = perfMapType(1)
  	perfMapTypeTCPEvents          = perfMapType(2)
  	perfMapTypeFileEvents         = perfMapType(3)
  	perfMapTypeL7Events           = perfMapType(4)
  	perfMapTypeSocketEvents       = perfMapType(5)
  	perfMapTypeEventQueue         = perfMapType(6)
  	perfMapTypePythonThreadEvents = perfMapType(7)
  )
  120. type Tracer struct {
  121. kernelVersion string
  122. disableL7Tracing bool
  123. disableE2ETracing bool
  124. disableStackTracing bool
  125. collection *ebpf.Collection
  126. collectionSpec *ebpf.CollectionSpec
  127. readers map[string]*perf.Reader
  128. links []link.Link
  129. uprobes map[string]*ebpf.Program
  130. Symbols []debugelf.Symbol
  131. Uprobes []tracer.Uprobe
  132. UprobesMap map[string]tracer.Uprobe
  133. }
  134. func NewTracer(kernelVersion string, disableL7Tracing, disableE2ETracing, disableStackTracing bool) *Tracer {
  135. if disableL7Tracing {
  136. klog.Infoln("L7 tracing is disabled")
  137. } else {
  138. klog.Infoln("L7 tracing is enabled")
  139. }
  140. if disableE2ETracing {
  141. klog.Infoln("e2e is disabled")
  142. } else {
  143. klog.Infoln("e2e is enabled")
  144. }
  145. if disableStackTracing {
  146. klog.Infoln("L7 stack is disabled")
  147. } else {
  148. klog.Infoln("L7 stack is enabled")
  149. }
  150. return &Tracer{
  151. kernelVersion: kernelVersion,
  152. disableL7Tracing: disableL7Tracing,
  153. disableE2ETracing: disableE2ETracing,
  154. disableStackTracing: disableStackTracing,
  155. readers: map[string]*perf.Reader{},
  156. uprobes: map[string]*ebpf.Program{},
  157. links: []link.Link{},
  158. }
  159. }
  160. func (t *Tracer) Run(events chan<- Event) error {
  161. if err := t.ebpf(events); err != nil {
  162. return err
  163. }
  164. if err := t.init(events); err != nil {
  165. return err
  166. }
  167. return nil
  168. }
  169. func (t *Tracer) Close() {
  170. for k, p := range t.uprobes {
  171. if p != nil {
  172. err := p.Close()
  173. klog.WithError(err).Infof("[close] uprobes %s", k)
  174. }
  175. }
  176. for _, l := range t.links {
  177. if l != nil {
  178. err := l.Close()
  179. klog.WithError(err).Infof("[close] links")
  180. }
  181. }
  182. for k, r := range t.readers {
  183. if r != nil {
  184. err := r.Close()
  185. klog.WithError(err).Infof("[close] readers %s", k)
  186. }
  187. }
  188. if t.collection != nil {
  189. t.collection.Close()
  190. }
  191. }
  192. func (t *Tracer) init(ch chan<- Event) error {
  193. pids, err := proc.ListPids()
  194. if err != nil {
  195. return fmt.Errorf("failed to list pids: %w", err)
  196. }
  197. for _, pid := range pids {
  198. ch <- Event{Type: EventTypeProcessStart, Pid: pid}
  199. }
  200. fds, sockets := readFds(pids)
  201. for _, fd := range fds {
  202. ch <- Event{Type: EventTypeFileOpen, Pid: fd.pid, Fd: fd.fd}
  203. }
  204. listens := map[uint64]bool{}
  205. for _, s := range sockets {
  206. if s.Listen {
  207. listens[uint64(s.pid)<<32|uint64(s.SAddr.Port())] = true
  208. }
  209. }
  210. ebpfConnectionsMap := t.collection.Maps["active_connections"]
  211. timestamp := uint64(time.Now().UnixNano())
  212. for _, s := range sockets {
  213. typ := EventTypeConnectionOpen
  214. if s.Listen {
  215. typ = EventTypeListenOpen
  216. //} else if listens[uint64(s.pid)<<32|uint64(s.SAddr.Port())] || s.DAddr.Port() > s.SAddr.Port() { // inbound
  217. } else if listens[uint64(s.pid)<<32|uint64(s.SAddr.Port())] { // 存在误判
  218. continue
  219. }
  220. ch <- Event{
  221. Type: typ,
  222. Pid: s.pid,
  223. Timestamp: timestamp,
  224. Fd: s.fd,
  225. SrcAddr: s.SAddr,
  226. DstAddr: s.DAddr,
  227. }
  228. if typ == EventTypeConnectionOpen {
  229. id := ConnectionId{FD: s.fd, PID: s.pid}
  230. sip := s.SAddr.IP()
  231. sipbytes := sip.As16()
  232. dip := s.DAddr.IP()
  233. dipbytes := dip.As16()
  234. conn := Connection{Timestamp: timestamp, Saddr: sipbytes, Sport: s.SAddr.Port(), Daddr: dipbytes, Dport: s.DAddr.Port()}
  235. if err := ebpfConnectionsMap.Update(id, conn, ebpf.UpdateNoExist); err != nil {
  236. klog.Warningln(err)
  237. }
  238. }
  239. }
  240. return nil
  241. }
  242. func (t *Tracer) ActiveConnectionsIterator() *ebpf.MapIterator {
  243. return t.collection.Maps["active_connections"].Iterate()
  244. }
  245. func (t *Tracer) ActiveAcceptsIterator() *ebpf.MapIterator {
  246. return t.collection.Maps["active_accepts"].Iterate()
  247. }
  // perfMap describes one perf event map to read from.
  type perfMap struct {
  	// name is the key of the map in the loaded collection.
  	name string
  	// perCPUBufferSizePages is multiplied by the OS page size to obtain the
  	// per-CPU buffer size passed to perf.NewReader.
  	perCPUBufferSizePages int
  	// typ selects the decoder used for records from this map.
  	typ perfMapType
  }
  // ebpf loads the eBPF object matching the running kernel, creates the
  // collection, starts one reader goroutine per available perf map and finally
  // attaches the programs via LinkEbpfProg.
  //
  // Decoded events are delivered on ch. An error is returned when no program
  // exists for the kernel version, when neither debugfs nor tracefs tracing
  // directories are present, or when loading, reader creation or linking fails.
  func (t *Tracer) ebpf(ch chan<- Event) error {
  	// The embedded program is selected by "v<major.minor>" of the kernel.
  	kv := "v" + common.KernelMajorMinor(t.kernelVersion)
  	path, prg, err := EbpfCode(kv)
  	klog.Infof("kv is [%s], kernel version: [%s] path: [%s]", kv, t.kernelVersion, path)
  	if len(prg) == 0 || err != nil {
  		return fmt.Errorf("kv is %s, unsupported kernel version: [%s] path: [%s] err:<%v>", kv, t.kernelVersion, path, err)
  	}
  	// At least one of the two tracing directories must exist.
  	_, debugFsErr := os.Stat("/sys/kernel/debug/tracing")
  	_, traceFsErr := os.Stat("/sys/kernel/tracing")
  	if debugFsErr != nil && traceFsErr != nil {
  		return fmt.Errorf("kernel tracing is not available: debugfs or tracefs must be mounted")
  	}
  	collectionSpec, err := ebpf.LoadCollectionSpecFromReader(bytes.NewReader(prg))
  	if err != nil {
  		return fmt.Errorf("failed to load collection spec: %w", err)
  	}
  	// Best effort: lift the locked-memory limit; a failure is deliberately ignored.
  	_ = unix.Setrlimit(unix.RLIMIT_MEMLOCK, &unix.Rlimit{Cur: unix.RLIM_INFINITY, Max: unix.RLIM_INFINITY})
  	// NOTE(review): PidFilter/MapInit adjust the spec and options before the
  	// collection is created; their exact effect is defined in package tracer.
  	tracer.PidFilter(collectionSpec)
  	opts := &ebpf.CollectionOptions{MapReplacements: make(map[string]*ebpf.Map)}
  	klog.Infof("[start] Look eBPF .maps")
  	for _, spec := range collectionSpec.Maps {
  		klog.Infoln(spec.Name)
  	}
  	klog.Infof("[end] Look eBPF .maps")
  	tracer.MapInit(collectionSpec, opts)
  	// TODO: multi-process support
  	// tracer.SetConstants(collectionSpec)
  	c, err := ebpf.NewCollectionWithOptions(collectionSpec, *opts)
  	if err != nil {
  		// Log the full verifier output when the kernel verifier rejected a program.
  		var verr *ebpf.VerifierError
  		if errors.As(err, &verr) {
  			klog.Errorf("----%+v", verr)
  		}
  		return fmt.Errorf("failed to load collection: %w", err)
  	}
  	tracer.Offset()
  	// From here on t.Close() is able to release the collection.
  	t.collectionSpec = collectionSpec
  	t.collection = c
  	perfMaps := []perfMap{
  		{name: "proc_events", typ: perfMapTypeProcEvents, perCPUBufferSizePages: 4},
  		{name: "tcp_listen_events", typ: perfMapTypeTCPEvents, perCPUBufferSizePages: 4},
  		{name: "tcp_connect_events", typ: perfMapTypeTCPEvents, perCPUBufferSizePages: 8},
  		{name: "tcp_accept_events", typ: perfMapTypeTCPEvents, perCPUBufferSizePages: 8},
  		{name: "tcp_retransmit_events", typ: perfMapTypeTCPEvents, perCPUBufferSizePages: 4},
  		{name: "file_events", typ: perfMapTypeFileEvents, perCPUBufferSizePages: 4},
  		{name: "event_queue", typ: perfMapTypeEventQueue, perCPUBufferSizePages: 32},
  		{name: "python_thread_events", typ: perfMapTypePythonThreadEvents, perCPUBufferSizePages: 4},
  	}
  	tracer.MapInsert(c)
  	// The L7 perf map is only read when L7 tracing is enabled.
  	if !t.DisableL7Tracing() {
  		perfMaps = append(perfMaps, perfMap{name: "l7_events", typ: perfMapTypeL7Events, perCPUBufferSizePages: 32})
  	}
  	perfMaps = append(perfMaps, perfMap{name: MAP_PERF_SOCKET_DATA_NAME, typ: perfMapTypeSocketEvents, perCPUBufferSizePages: 64})
  	klog.Infof("[start] Look eBPF perf_maps")
  	for _, pm := range perfMaps {
  		klog.Infoln(pm.name)
  		// Maps missing from the collection are skipped silently.
  		m, ok := t.collection.Maps[pm.name]
  		if ok {
  			r, err := perf.NewReader(m, pm.perCPUBufferSizePages*os.Getpagesize())
  			if err != nil {
  				// Release everything created so far, including earlier readers.
  				t.Close()
  				return fmt.Errorf("failed to create ebpf reader: %w", err)
  			}
  			t.readers[pm.name] = r
  			// Start the event listener for this map.
  			//go runEventsReader(pm.name, r, ch, pm.typ)
  			try.GoParams(runEventsReader, utils.CatchFn, pm.name, r, ch, pm.typ)
  		}
  	}
  	klog.Infof("[end] Look eBPF perf_maps")
  	klog.Infof("[start] Look eBPF specPrograms")
  	if err = t.LinkEbpfProg(); err != nil {
  		return err
  	}
  	klog.Infof("[end] Look eBPF specPrograms")
  	return nil
  }
  330. func (t *Tracer) LinkEbpfProg() error {
  331. klog.Infof("[start] Look eBPF specPrograms")
  332. var (
  333. l link.Link
  334. err error
  335. lastErr error
  336. )
  337. for _, programSpec := range t.collectionSpec.Programs {
  338. program := t.collection.Programs[programSpec.Name]
  339. klog.Infof("%s:[%s]", programSpec.SectionName, programSpec.Name)
  340. if t.DisableL7Tracing() {
  341. switch programSpec.Name {
  342. case "sys_enter_writev", "sys_enter_write", "sys_enter_sendto", "sys_enter_sendmsg", "sys_enter_sendmmsg":
  343. continue
  344. case "sys_enter_read", "sys_enter_readv", "sys_enter_recvfrom", "sys_enter_recvmsg":
  345. continue
  346. case "sys_exit_read", "sys_exit_readv", "sys_exit_recvfrom", "sys_exit_recvmsg":
  347. continue
  348. }
  349. }
  350. switch programSpec.Type {
  351. case ebpf.TracePoint:
  352. if strings.Contains(programSpec.SectionName, "prog") {
  353. continue
  354. }
  355. parts := strings.SplitN(programSpec.AttachTo, "/", 2)
  356. l, err = link.Tracepoint(parts[0], parts[1], program, nil)
  357. case ebpf.Kprobe:
  358. if strings.HasPrefix(programSpec.SectionName, "uprobe/") {
  359. t.uprobes[programSpec.Name] = program
  360. continue
  361. }
  362. if strings.HasPrefix(programSpec.SectionName, "kretprobe/") {
  363. l, err = link.Kretprobe(programSpec.AttachTo, program, nil)
  364. if err == nil {
  365. t.links = append(t.links, l)
  366. }
  367. continue
  368. }
  369. l, err = link.Kprobe(programSpec.AttachTo, program, nil)
  370. }
  371. if err != nil {
  372. lastErr = err
  373. t.Close()
  374. klog.Errorf("LinkEbpfProg failed to program[%s] link program: %s", programSpec.Name, err)
  375. //return fmt.Errorf("failed to link program: %w", err)
  376. } else {
  377. t.links = append(t.links, l)
  378. }
  379. }
  380. klog.Infof("[end] Look eBPF specPrograms")
  381. if lastErr != nil {
  382. return fmt.Errorf("failed to link program: %w", lastErr)
  383. }
  384. return nil
  385. }
  386. func (t *Tracer) UnlinkEbpfProg() error {
  387. var (
  388. lastErr error
  389. err error
  390. )
  391. /* 此处不应该处理 t.uprobes 中 ebpf-program
  392. for pName, p := range t.uprobes {
  393. if err = p.Close(); err != nil {
  394. lastErr = err
  395. klog.Errorf("UnlinkEbpfProg close program[%s] uprobe occurs error: %s", pName, err.Error())
  396. }
  397. }
  398. */
  399. for _, l := range t.links {
  400. if err = l.Close(); err != nil {
  401. lastErr = err
  402. klog.Errorf("UnlinkEbpfProg close link occurs error: %s", err.Error())
  403. }
  404. }
  405. return lastErr
  406. }
  407. func (t EventType) Int() int {
  408. return int(t)
  409. }
  410. func (t EventType) String() string {
  411. switch t {
  412. case EventTypeProcessStart:
  413. return "process-start"
  414. case EventTypeProcessExit:
  415. return "process-exit"
  416. case EventTypeConnectionOpen:
  417. return "connection-open"
  418. case EventTypeConnectionClose:
  419. return "connection-close"
  420. case EventTypeConnectionError:
  421. return "connection-error"
  422. case EventTypeListenOpen:
  423. return "listen-open"
  424. case EventTypeListenClose:
  425. return "listen-close"
  426. case EventTypeFileOpen:
  427. return "file-open"
  428. case EventTypeTCPRetransmit:
  429. return "tcp-retransmit"
  430. case EventTypeL7Request:
  431. return "l7-request"
  432. }
  433. return "unknown: " + strconv.Itoa(int(t))
  434. }
  435. func (t EventReason) String() string {
  436. switch t {
  437. case EventReasonNone:
  438. return "none"
  439. case EventReasonOOMKill:
  440. return "oom-kill"
  441. }
  442. return "unknown: " + strconv.Itoa(int(t))
  443. }
  444. type procEvent struct {
  445. Type EventType
  446. Pid uint32
  447. Reason uint32
  448. }
  449. type tcpEvent struct {
  450. Fd uint64
  451. Timestamp uint64
  452. Duration uint64
  453. FirstReadTime uint64
  454. FirstWriteTime uint64
  455. NewReadTime uint64
  456. Type EventType
  457. Pid uint32
  458. BytesSent uint64
  459. BytesReceived uint64
  460. SPort uint16
  461. DPort uint16
  462. SAddr [16]byte
  463. DAddr [16]byte
  464. }
  // fileEvent is the record layout decoded (little-endian, in field order)
  // from the file perf map.
  type fileEvent struct {
  	Type EventType
  	Pid  uint32
  	Fd   uint64
  }
  470. // struct l7_event in l7.c
  471. type l7Event struct {
  472. Fd uint64
  473. ConnectionTimestamp uint64
  474. Pid uint32
  475. Status uint32
  476. Duration uint64
  477. Protocol uint8
  478. Method uint8
  479. Padding uint16
  480. StatementId uint32
  481. PayloadSize uint64
  482. TraceId uint64
  483. StartAt uint64 // ns
  484. EndtAt uint64 // ns
  485. TraceStart uint32
  486. TraceEnd uint32
  487. TraceType uint32
  488. EventCount uint32
  489. Sport uint16
  490. Dport uint16
  491. SAddr HashByte16
  492. DAddr HashByte16
  493. ComponentSport uint16
  494. ComponentDport uint16
  495. IsTls uint16
  496. ComponentSAddr HashByte16
  497. ComponentDAddr HashByte16
  498. AssumedAppId HashByte
  499. SpanId HashByte
  500. TraceIdFrom HashByte16
  501. CalledId HashByte
  502. InstanceIdFrom HashByte
  503. AppIdFrom HashByte
  504. SpanIdFrom HashByte
  505. TypeFrom [1]byte
  506. RPCTarget [64]byte
  507. ErrorMsg HashByte128
  508. MQ struct {
  509. Topic [256]byte // MQ topic (e.g., Kafka topic)
  510. Key [256]byte // MQ key (e.g., Kafka message key)
  511. }
  512. }
  // SocketDataBufferddd is a pure-Go layout with the same fields as the C
  // struct __socket_data_buffer: two 32-bit counters followed by a
  // 32760-byte data area.
  type SocketDataBufferddd struct {
  	EventsNum, Len uint32
  	Data           [32760]byte
  }
  // TASK_COMM_LEN is the size of the comm field in socket data records; it has
  // the same value as the macro of that name in the cgo preamble.
  const TASK_COMM_LEN = 16

  // BURST_DATA_BUF_SIZE is the size of the data field in socket data records;
  // it has the same value as the macro of that name in the cgo preamble.
  const BURST_DATA_BUF_SIZE = 8192
  // Tuple is a pure-Go layout with the same fields, in the same order, as the
  // C struct __tuple_t.
  type Tuple struct {
  	Daddr, RcvSaddr     [16]uint8
  	AddrLen, L4Protocol uint8
  	Dport, Num          uint16
  }
  530. type SocketDatadddd struct {
  531. Pid uint32 // 表示线程号 如果'pid == tgid'表示一个进程, 否则是线程
  532. Tgid uint32 // 进程号
  533. CoroutineID uint64
  534. Source uint8
  535. Comm [TASK_COMM_LEN]byte
  536. SocketID uint64
  537. Tuple Tuple
  538. ExtraData uint32
  539. ExtraDataCount uint32
  540. TcpSeq uint32
  541. ThreadTraceID uint64
  542. Timestamp uint64
  543. Direction uint8
  544. MsgType uint8
  545. SyscallLen uint64
  546. DataSeq uint64
  547. DataType uint16
  548. DataLen uint16
  549. Data [BURST_DATA_BUF_SIZE]byte
  550. }
  // StackEvent is the record layout decoded (little-endian, in field order)
  // from the event_queue perf map. Field order must not change.
  type StackEvent struct {
  	Type, Pid, TraceId, Goid  uint64
  	Ip, Bp, CallerIp, CallerBp uint64
  	TimeNsStart, TimeNsEnd     uint64
  	// Nid uint64
  	// Fpid uint64
  	// Level uint64
  	Location              byte
  	ClassName, MethedName [100]byte
  }
  // StackFunEvent pairs a decoded StackEvent with a pointer to a tracer.Uprobe.
  // NOTE(review): presumably the uprobe that produced the event; the type is
  // not used in this file, so confirm against its callers.
  type StackFunEvent struct {
  	StackEvent StackEvent
  	Uprobe     *tracer.Uprobe
  }
  // pythonThreadEvent is the record layout decoded (little-endian, in field
  // order) from the python_thread_events perf map.
  type pythonThreadEvent struct {
  	Type EventType
  	Pid  uint32
  	// Duration is converted to a time.Duration as-is when the event is built.
  	Duration uint64
  }
  578. func runEventsReader(name string, r *perf.Reader, ch chan<- Event, typ perfMapType) {
  579. for {
  580. rec, err := r.Read()
  581. if err != nil {
  582. if errors.Is(err, perf.ErrClosed) {
  583. break
  584. }
  585. continue
  586. }
  587. if rec.LostSamples > 0 {
  588. klog.Errorln(name, "lost samples:", rec.LostSamples)
  589. continue
  590. }
  591. var event Event
  592. switch typ {
  593. case perfMapTypeSocketEvents:
  594. //fmt.Println("perfMapTypeSocketEvents")
  595. // 假设 rec.RawSample 包含数据,类型为 []byte
  596. //rawData := rec.RawSample
  597. //fmt.Println("perfMapTypeSocketEvents2")
  598. //
  599. //// 创建一个 SocketDataBuffer 结构体实例
  600. //var buffer SocketDataBuffer
  601. //
  602. //// 创建一个字节缓冲区,并将数据填充到其中
  603. //reader := bytes.NewReader(rawData)
  604. //fmt.Println("perfMapTypeSocketEvents3")
  605. //fmt.Println(len(rawData))
  606. //// 使用 binary.Read 函数读取数据并解析为 SocketDataBuffer 结构体实例
  607. //if err := binary.Read(reader, binary.LittleEndian, &buffer); err != nil {
  608. // fmt.Println(reader.Len())
  609. // fmt.Println("Failed to read data:", err)
  610. // continue
  611. //}
  612. //fmt.Println("perfMapTypeSocketEvents4")
  613. //
  614. //// 打印解析后的数据
  615. //fmt.Println("EventsNum:", buffer.EventsNum)
  616. //fmt.Println("Len:", buffer.Len)
  617. //
  618. //// 打印 char data 的内容
  619. //fmt.Printf("Data: %s\n", string(buffer.Data[:buffer.Len])) // 仅打印实际长度的数据
  620. //socketDataBuffer := rec.RawSample
  621. // 解析 __socket_data_buffer
  622. //buf := (*SocketDataBuffer)(unsafe.Pointer(&rec.RawSample[0])) //nolint:gosec
  623. //
  624. //// 获取 char data[32760];
  625. //socketData := (*SocketData)(unsafe.Pointer(&buf.data[0])) //nolint:gosec
  626. //// todo
  627. //fmt.Printf("socketData.DataType:%d \n", (socketData.data_type))
  628. //fmt.Printf("socketData.DataLen:%d \n", (socketData.data_len))
  629. //
  630. //// 解析C结构体中的data字段
  631. //dataSlice := C.GoBytes(unsafe.Pointer(&socketData.data[0]), C.int(socketData.data_len))
  632. //// 打印或处理包含的数据
  633. //fmt.Printf("socketData.Payload:%v \n", string(dataSlice))
  634. /*todo */
  635. //socketData := (*(*[128]byte)(unsafe.Pointer(&eventC.line)))
  636. //dataPtr := unsafe.Pointer(&buf.data[0])
  637. //socketData := (*SocketData)(dataPtr)
  638. //reader2 := bytes.NewBuffer(rec.RawSample)
  639. // 222222
  640. //fmt.Println("socketData.Pid:", socketData.pid)
  641. //fmt.Println("socketData.Tgid:", socketData.tgid)
  642. //fmt.Println("socketData.CoroutineID:", socketData.coroutine_id)
  643. //fmt.Println("socketData.Source:", socketData.source)
  644. //
  645. //fmt.Printf("socketData.Comm: %s \n", socketData.comm)
  646. //fmt.Printf("socketData.SocketID :%v \n", socketData.socket_id)
  647. //fmt.Println("socketData.Tuple:", socketData.Tuple)
  648. //fmt.Println("socketData.ExtraData:", socketData.ExtraData)
  649. //fmt.Println("socketData.ExtraDataCount:", socketData.ExtraDataCount)
  650. //fmt.Println("socketData.TCPSeq:", socketData.TcpSeq)
  651. //fmt.Println("socketData.ThreadTraceID:", socketData.ThreadTraceID)
  652. //fmt.Println("socketData.Timestamp:", socketData.Timestamp)
  653. //fmt.Println("socketData.Direction:", socketData.Direction)
  654. //fmt.Println("socketData.MsgType:", socketData.MsgType)
  655. //fmt.Println("socketData.SyscallLen:", socketData.SyscallLen)
  656. //fmt.Println("socketData.DataSeq:", socketData.DataSeq)
  657. //socketData := &SocketData{}
  658. //reader := bytes.NewBuffer(rec.RawSample)
  659. //if err := binary.Read(reader, binary.LittleEndian, v); err != nil {
  660. // klog.Warningln("failed1 to read msg:", err)
  661. // continue
  662. //}
  663. //
  664. //var data []byte
  665. //payload := reader.Bytes()
  666. //switch {
  667. //case v.Len == 0:
  668. //case v.Len > 32760:
  669. // data = payload[:32760]
  670. //default:
  671. // data = payload[:v.Len]
  672. //}
  673. //////data2 := data[:v.Len]
  674. ////fmt.Println("perfMapTypeSocketEvents")
  675. //fmt.Println(v.EventsNum)
  676. //fmt.Println(v.Len)
  677. //fmt.Println(string(data))
  678. //
  679. //var data2 SocketData
  680. //reader2 := bytes.NewBuffer(data)
  681. //if err := binary.Read(reader2, binary.LittleEndian, data2); err != nil {
  682. // klog.Warningln("failed2 to read msg:", err)
  683. // continue
  684. //}
  685. //
  686. //fmt.Println(data2.Pid)
  687. //fmt.Println(data2.Tgid)
  688. //fmt.Println(string(v.Data))
  689. //continue
  690. case perfMapTypeL7Events:
  691. v := &l7Event{}
  692. reader := bytes.NewBuffer(rec.RawSample)
  693. if err := binary.Read(reader, binary.LittleEndian, v); err != nil {
  694. klog.Warningln("failed to read msg:", err)
  695. continue
  696. }
  697. //fmt.Println("v.TraceIdFrom")
  698. //fmt.Println(v.TraceIdFrom)
  699. //a := hex.EncodeToString(v.TraceIdFrom[:])
  700. //for _, b := range v.AssumedAppId {
  701. // fmt.Printf("v.AssumedAppId- %02\n", b)
  702. //}
  703. //fmt.Println(a)
  704. payload := reader.Bytes()
  705. req := &l7.RequestData{
  706. Protocol: l7.Protocol(v.Protocol),
  707. Pid: v.Pid,
  708. Status: l7.Status(v.Status),
  709. Duration: time.Duration(v.Duration),
  710. Method: l7.Method(v.Method),
  711. StatementId: v.StatementId,
  712. TraceId: v.TraceId,
  713. TraceStart: v.TraceStart,
  714. TraceEnd: v.TraceEnd,
  715. TraceType: v.TraceType,
  716. EventCount: v.EventCount,
  717. AssumedAppId: hex.EncodeToString(v.AssumedAppId[:]),
  718. SpanId: hex.EncodeToString(v.SpanId[:]),
  719. StartAt: v.StartAt,
  720. EndAt: v.EndtAt,
  721. ComponentSAddr: ipPort(v.ComponentSAddr, v.ComponentSport),
  722. ComponentDAddr: ipPort(v.ComponentDAddr, v.ComponentDport),
  723. DestAddrString: utils.BytesToString(v.RPCTarget[:]),
  724. ErrorMsg: utils.BytesToString(v.ErrorMsg[:]),
  725. IsTls: v.IsTls > 0,
  726. MQTopic: utils.BytesToString(v.MQ.Topic[:]),
  727. MQKey: utils.BytesToString(v.MQ.Key[:]),
  728. }
  729. if req.Protocol == l7.ProtocolHTTP {
  730. klog.Debugf("runEventsReader ComponentSAddr.String %s", req.ComponentSAddr.String())
  731. klog.Debugf("runEventsReader ComponentDAddr.String %s", req.ComponentDAddr.String())
  732. }
  733. if v.TraceEnd == TRACE_STATUS {
  734. req.ParentSpanContext.TraceIdFrom = hex.EncodeToString(v.TraceIdFrom[:])
  735. req.ParentSpanContext.CalledId = hex.EncodeToString(v.CalledId[:])
  736. req.ParentSpanContext.InstanceIdFrom = hex.EncodeToString(v.InstanceIdFrom[:])
  737. req.ParentSpanContext.AppIdFrom = hex.EncodeToString(v.AppIdFrom[:])
  738. req.ParentSpanContext.SpanIdFrom = hex.EncodeToString(v.SpanIdFrom[:])
  739. req.ParentSpanContext.TypeFrom = hex.EncodeToString(v.TypeFrom[:])
  740. // klog.Debugf("req.ParentSpanContext.TraceIdFrom %s", req.ParentSpanContext.TraceIdFrom)
  741. // klog.Debugf("req.ParentSpanContext.TypeFrom %s", req.ParentSpanContext.TypeFrom)
  742. req.SAddr = ipPort(v.SAddr, v.Sport)
  743. req.DAddr = ipPort(v.DAddr, v.Dport)
  744. // klog.Debugf("runEventsReader SAddr.String %s", req.SAddr.String())
  745. // klog.Debugf("runEventsReader DAddr.String %s", req.DAddr.String())
  746. }
  747. switch {
  748. case v.PayloadSize == 0:
  749. case v.PayloadSize > MaxPayloadSize:
  750. req.Payload = payload[:MaxPayloadSize]
  751. default:
  752. req.Payload = payload[:v.PayloadSize]
  753. }
  754. //fmt.Println("==========")
  755. //fmt.Println("req.Payload:", string(req.Payload))
  756. //fmt.Println("==========")
  757. event = Event{Type: EventTypeL7Request, Pid: v.Pid, Fd: v.Fd, Timestamp: v.ConnectionTimestamp, L7Request: req}
  758. case perfMapTypeFileEvents:
  759. v := &fileEvent{}
  760. if err := binary.Read(bytes.NewBuffer(rec.RawSample), binary.LittleEndian, v); err != nil {
  761. klog.Warningln("failed to read msg:", err)
  762. continue
  763. }
  764. event = Event{Type: v.Type, Pid: v.Pid, Fd: v.Fd}
  765. case perfMapTypeProcEvents:
  766. v := &procEvent{}
  767. if err := binary.Read(bytes.NewBuffer(rec.RawSample), binary.LittleEndian, v); err != nil {
  768. klog.Warningln("failed to read msg:", err)
  769. continue
  770. }
  771. event = Event{Type: v.Type, Reason: EventReason(v.Reason), Pid: v.Pid}
  772. case perfMapTypeTCPEvents:
  773. v := &tcpEvent{}
  774. if err := binary.Read(bytes.NewBuffer(rec.RawSample), binary.LittleEndian, v); err != nil {
  775. klog.Warningln("failed to read msg:", err)
  776. continue
  777. }
  778. event = Event{
  779. Type: v.Type,
  780. Pid: v.Pid,
  781. SrcAddr: ipPort(v.SAddr, v.SPort),
  782. DstAddr: ipPort(v.DAddr, v.DPort),
  783. Fd: v.Fd,
  784. Timestamp: v.Timestamp,
  785. Duration: time.Duration(v.Duration),
  786. }
  787. if v.Type == EventTypeConnectionClose {
  788. event.TrafficStats = &TrafficStats{
  789. BytesSent: v.BytesSent,
  790. BytesReceived: v.BytesReceived,
  791. }
  792. }
  793. event.FirstReadTime = v.FirstReadTime
  794. event.FirstWriteTime = v.FirstWriteTime
  795. event.NewReadTime = v.NewReadTime
  796. if v.Type == EventTypeAcceptClose {
  797. event.TrafficStats = &TrafficStats{
  798. BytesSent: v.BytesSent,
  799. BytesReceived: v.BytesReceived,
  800. }
  801. }
  802. case perfMapTypePythonThreadEvents:
  803. v := &pythonThreadEvent{}
  804. if err := binary.Read(bytes.NewBuffer(rec.RawSample), binary.LittleEndian, v); err != nil {
  805. klog.Warningln("failed to read msg:", err)
  806. continue
  807. }
  808. event = Event{
  809. Type: v.Type,
  810. Pid: v.Pid,
  811. Duration: time.Duration(v.Duration),
  812. }
  813. case perfMapTypeEventQueue:
  814. v := &StackEvent{}
  815. if err := binary.Read(bytes.NewBuffer(rec.RawSample), binary.LittleEndian, v); err != nil {
  816. klog.Warningln("failed to read msg:", err)
  817. continue
  818. }
  819. event = Event{
  820. Type: EventTypeFunEnt,
  821. StackEvent: v,
  822. }
  823. default:
  824. continue
  825. }
  826. ch <- event
  827. }
  828. }
  829. func ipPort(ip [16]byte, port uint16) netaddr.IPPort {
  830. i, _ := netaddr.FromStdIP(ip[:])
  831. return netaddr.IPPortFrom(i, port)
  832. }
  833. func (t *Tracer) InitKProcInfo(pid uint32, appInfo *AppInfo) error {
  834. var err error
  835. var info EbpfProcInfo
  836. if appInfo.EBPFProcInfo == nil {
  837. info = EbpfProcInfo{
  838. InstanceId: appInfo.InstanceIdHash.HashtVal,
  839. AppId: appInfo.AppIdHash.HashtVal,
  840. CodeType: uint16(appInfo.CodeType),
  841. }
  842. } else {
  843. info = *appInfo.EBPFProcInfo
  844. info.AppId = appInfo.AppIdHash.HashtVal
  845. }
  846. _, err = tracer.UpdateProcInfoToMap(t.collection, pid, info)
  847. if err != nil {
  848. klog.Error("failed to update program info", err)
  849. }
  850. appInfo.EBPFProcInfo = &info
  851. return err
  852. }
  853. func (t *Tracer) DelKProcInfo(pid uint32) error {
  854. _, err := tracer.DelProcInfoFromMap(t.collection, pid)
  855. if err != nil {
  856. klog.WithField("pid", pid).Error("failed to delete proc info", err)
  857. }
  858. return err
  859. }
  860. // TODO check language
  861. func (t *Tracer) DisableL7Tracing() bool {
  862. return t.disableL7Tracing
  863. }
  864. func (t *Tracer) DisableE2ETracing() bool {
  865. return t.disableE2ETracing
  866. }
  867. func (t *Tracer) DisableStackTracing() bool {
  868. return t.disableStackTracing
  869. }