#!/usr/bin/python
# @lint-avoid-python-3-compatibility-imports
#
# tcpaccept Trace TCP accept()s.
#           For Linux, uses BCC, eBPF. Embedded C.
#
# USAGE: tcpaccept [-h] [-t] [-p PID]
#
# This uses dynamic tracing of the kernel inet_csk_accept() socket function
# (from tcp_prot.accept), and will need to be modified to match kernel changes.
#
# Copyright (c) 2015 Brendan Gregg.
# Licensed under the Apache License, Version 2.0 (the "License")
#
# 13-Oct-2015   Brendan Gregg   Created this.
# 14-Feb-2016      "      "     Switch to bpf_perf_output.

from __future__ import print_function
from bcc import BPF
from socket import inet_ntop, AF_INET, AF_INET6
from struct import pack
import argparse
import ctypes as ct

# arguments
examples = """examples:
    ./tcpaccept           # trace all TCP accept()s
    ./tcpaccept -t        # include timestamps
    ./tcpaccept -p 181    # only trace PID 181
"""
parser = argparse.ArgumentParser(
    description="Trace TCP accepts",
    formatter_class=argparse.RawDescriptionHelpFormatter,
    epilog=examples)
parser.add_argument("-t", "--timestamp", action="store_true",
    help="include timestamp on output")
# type=int: the PID is pasted into the generated C source further down, so
# reject anything that is not a number here rather than at BPF compile time.
parser.add_argument("-p", "--pid", type=int,
    help="trace this PID only")
# hidden option (suppressed from --help): print the BPF program text and exit
parser.add_argument("--ebpf", action="store_true",
    help=argparse.SUPPRESS)
args = parser.parse_args()
debug = 0   # set to non-zero to print the BPF program text before loading

# define BPF program
#
# Common prologue shared by both probe implementations: the per-event records
# and the perf output channels they are submitted on. The field order and
# widths of each struct must stay in sync with the ctypes mirrors (Data_ipv4 /
# Data_ipv6) that decode these records on the Python side.
bpf_text = """
#include <uapi/linux/ptrace.h>
#include <net/sock.h>
#include <bcc/proto.h>

// separate data structs for ipv4 and ipv6
struct ipv4_data_t {
    // XXX: switch some to u32's when supported
    u64 ts_us;
    u64 pid;
    u32 saddr;
    u32 daddr;
    u64 ip;
    u64 lport;
    char task[TASK_COMM_LEN];
};
BPF_PERF_OUTPUT(ipv4_events);

struct ipv6_data_t {
    u64 ts_us;
    u64 pid;
    unsigned __int128 saddr;
    unsigned __int128 daddr;
    u64 ip;
    u64 lport;
    char task[TASK_COMM_LEN];
};
BPF_PERF_OUTPUT(ipv6_events);
"""

#
# The following is the code for older kernels (Linux pre-4.16).
# It uses kprobes to instrument inet_csk_accept(). On Linux 4.16 and
# later, the sock:inet_sock_set_state tracepoint should be used instead, as
# is done by the code that follows this.
#
# FILTER is a placeholder that the "code substitutions" step replaces with
# the optional PID check (or with nothing) before the program is compiled.
#
bpf_text_kprobe = """
int kretprobe__inet_csk_accept(struct pt_regs *ctx)
{
    struct sock *newsk = (struct sock *)PT_REGS_RC(ctx);
    // upper 32 bits hold the process id (tgid); the lower 32 bits are the
    // thread id, which is not what -p PID or the PID column should use
    u32 pid = bpf_get_current_pid_tgid() >> 32;

    FILTER

    if (newsk == NULL)
        return 0;

    // check this is TCP
    u8 protocol = 0;
    // workaround for reading the sk_protocol bitfield:

    // Following comments added by Joe Yin:
    // Unfortunately, it cannot work since Linux 4.10,
    // because sk_wmem_queued no longer follows the sk_protocol bitfield;
    // the following member is sk_gso_max_segs.
    // So, we can use this:
    // bpf_probe_read(&protocol, 1, (void *)((u64)&newsk->sk_gso_max_segs) - 3);
    // In order to tell pre-4.10 and 4.10+ apart, introduce the variables
    // gso_max_segs_offset and sk_lingertime_offset: sk_lingertime is close
    // to sk_gso_max_segs, and the offset between the two members is 4.

    int gso_max_segs_offset = offsetof(struct sock, sk_gso_max_segs);
    int sk_lingertime_offset = offsetof(struct sock, sk_lingertime);

    if (sk_lingertime_offset - gso_max_segs_offset == 4)
        // 4.10+ with little endian
#if __BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__
        protocol = *(u8 *)((u64)&newsk->sk_gso_max_segs - 3);
    else
        // pre-4.10 with little endian
        protocol = *(u8 *)((u64)&newsk->sk_wmem_queued - 3);
#elif __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__
        // 4.10+ with big endian
        protocol = *(u8 *)((u64)&newsk->sk_gso_max_segs - 1);
    else
        // pre-4.10 with big endian
        protocol = *(u8 *)((u64)&newsk->sk_wmem_queued - 1);
#else
# error "Fix your compiler's __BYTE_ORDER__?!"
#endif

    if (protocol != IPPROTO_TCP)
        return 0;

    // pull in details
    u16 family = 0, lport = 0;
    family = newsk->__sk_common.skc_family;
    lport = newsk->__sk_common.skc_num;

    if (family == AF_INET) {
        struct ipv4_data_t data4 = {.pid = pid, .ip = 4};
        data4.ts_us = bpf_ktime_get_ns() / 1000;
        data4.saddr = newsk->__sk_common.skc_rcv_saddr;
        data4.daddr = newsk->__sk_common.skc_daddr;
        data4.lport = lport;
        bpf_get_current_comm(&data4.task, sizeof(data4.task));
        ipv4_events.perf_submit(ctx, &data4, sizeof(data4));

    } else if (family == AF_INET6) {
        struct ipv6_data_t data6 = {.pid = pid, .ip = 6};
        data6.ts_us = bpf_ktime_get_ns() / 1000;
        bpf_probe_read(&data6.saddr, sizeof(data6.saddr),
            &newsk->__sk_common.skc_v6_rcv_saddr.in6_u.u6_addr32);
        bpf_probe_read(&data6.daddr, sizeof(data6.daddr),
            &newsk->__sk_common.skc_v6_daddr.in6_u.u6_addr32);
        data6.lport = lport;
        bpf_get_current_comm(&data6.task, sizeof(data6.task));
        ipv6_events.perf_submit(ctx, &data6, sizeof(data6));
    }
    // else drop

    return 0;
}
"""

# Tracepoint-based implementation, attached to sock:inet_sock_set_state.
# FILTER is a placeholder that the "code substitutions" step replaces with
# the optional PID check (or with nothing) before the program is compiled.
#
# NOTE(review): this handler only checks the protocol and address family; it
# does not look at the old/new socket state, so it presumably reports every
# TCP state transition rather than only accepted connections - confirm
# against the tracepoint's semantics.
bpf_text_tracepoint = """
TRACEPOINT_PROBE(sock, inet_sock_set_state)
{
    if (args->protocol != IPPROTO_TCP)
        return 0;
    // upper 32 bits hold the process id (tgid); the lower 32 bits are the
    // thread id, which is not what -p PID or the PID column should use
    u32 pid = bpf_get_current_pid_tgid() >> 32;

    FILTER

    // pull in details
    u16 family = 0, lport = 0;
    family = args->family;
    lport = args->sport;

    if (family == AF_INET) {
        struct ipv4_data_t data4 = {.pid = pid, .ip = 4};
        data4.ts_us = bpf_ktime_get_ns() / 1000;
        __builtin_memcpy(&data4.saddr, args->saddr, sizeof(data4.saddr));
        __builtin_memcpy(&data4.daddr, args->daddr, sizeof(data4.daddr));
        data4.lport = lport;
        bpf_get_current_comm(&data4.task, sizeof(data4.task));
        ipv4_events.perf_submit(args, &data4, sizeof(data4));
    } else if (family == AF_INET6) {
        struct ipv6_data_t data6 = {.pid = pid, .ip = 6};
        data6.ts_us = bpf_ktime_get_ns() / 1000;
        __builtin_memcpy(&data6.saddr, args->saddr, sizeof(data6.saddr));
        __builtin_memcpy(&data6.daddr, args->daddr, sizeof(data6.daddr));
        data6.lport = lport;
        bpf_get_current_comm(&data6.task, sizeof(data6.task));
        ipv6_events.perf_submit(args, &data6, sizeof(data6));
    }
    // else drop

    return 0;
}
"""

# Pick the probe implementation: use the sock:inet_sock_set_state tracepoint
# when the running kernel exposes it, otherwise fall back to the kretprobe on
# inet_csk_accept(). Either one is appended to the shared struct definitions.
if BPF.tracepoint_exists("sock", "inet_sock_set_state"):
    bpf_text += bpf_text_tracepoint
else:
    bpf_text += bpf_text_kprobe


# code substitutions
# Replace every FILTER placeholder in the program text (if it contains one)
# with a PID check when -p was given, or remove the placeholder otherwise.
if args.pid:
    bpf_text = bpf_text.replace('FILTER',
        'if (pid != %s) { return 0; }' % args.pid)
else:
    bpf_text = bpf_text.replace('FILTER', '')
# Dump the final program text when debugging; with --ebpf, dump it and stop
# before anything is loaded into the kernel.
if debug or args.ebpf:
    print(bpf_text)
    if args.ebpf:
        exit()

# event data
TASK_COMM_LEN = 16      # linux/sched.h

class Data_ipv4(ct.Structure):
    """ctypes mirror of the BPF program's `struct ipv4_data_t`.

    Field order and widths must match the C struct exactly, because perf
    buffer records are reinterpreted in place through this layout.
    """
    _fields_ = [
        ("ts_us", ct.c_ulonglong),
        ("pid", ct.c_ulonglong),
        ("saddr", ct.c_uint),
        ("daddr", ct.c_uint),
        ("ip", ct.c_ulonglong),
        ("lport", ct.c_ulonglong),
        ("task", ct.c_char * TASK_COMM_LEN)
    ]

class Data_ipv6(ct.Structure):
    """ctypes mirror of the BPF program's `struct ipv6_data_t`.

    Each 128-bit address (`unsigned __int128` in the C struct) is exposed as
    an array of two 64-bit words. Field order and widths must match the C
    struct exactly, because perf buffer records are reinterpreted in place
    through this layout.
    """
    _fields_ = [
        ("ts_us", ct.c_ulonglong),
        ("pid", ct.c_ulonglong),
        ("saddr", (ct.c_ulonglong * 2)),
        ("daddr", (ct.c_ulonglong * 2)),
        ("ip", ct.c_ulonglong),
        ("lport", ct.c_ulonglong),
        ("task", ct.c_char * TASK_COMM_LEN)
    ]

# process event
def print_ipv4_event(cpu, data, size):
    """Perf buffer callback: print one IPv4 event as a row of the table.

    Columns are PID, COMM, IP, RADDR (the event's daddr), LADDR (the event's
    saddr) and LPORT, preceded by the elapsed time in seconds since the first
    printed event when -t/--timestamp was given.

    Args:
        cpu: unused.
        data: pointer to the raw event record, read as a Data_ipv4.
        size: unused.
    """
    global start_ts
    event = ct.cast(data, ct.POINTER(Data_ipv4)).contents
    if args.timestamp:
        # start_ts == 0 means "no event seen yet": latch the first timestamp
        # so that printed times are relative to it
        if start_ts == 0:
            start_ts = event.ts_us
        print("%-9.3f" % ((float(event.ts_us) - start_ts) / 1000000), end="")
    # 'replace': a command name is arbitrary bytes and need not be valid
    # UTF-8; never let one bad name raise inside the callback
    print("%-6d %-12.12s %-2d %-16s %-16s %-4d" % (event.pid,
        event.task.decode('utf-8', 'replace'), event.ip,
        inet_ntop(AF_INET, pack("I", event.daddr)),
        inet_ntop(AF_INET, pack("I", event.saddr)), event.lport))

def print_ipv6_event(cpu, data, size):
    """Perf buffer callback: print one IPv6 event as a row of the table.

    Columns are PID, COMM, IP, RADDR (the event's daddr), LADDR (the event's
    saddr) and LPORT, preceded by the elapsed time in seconds since the first
    printed event when -t/--timestamp was given.

    Args:
        cpu: unused.
        data: pointer to the raw event record, read as a Data_ipv6.
        size: unused.
    """
    global start_ts
    event = ct.cast(data, ct.POINTER(Data_ipv6)).contents
    if args.timestamp:
        # start_ts == 0 means "no event seen yet": latch the first timestamp
        # so that printed times are relative to it
        if start_ts == 0:
            start_ts = event.ts_us
        print("%-9.3f" % ((float(event.ts_us) - start_ts) / 1000000), end="")
    # 'replace': a command name is arbitrary bytes and need not be valid
    # UTF-8; never let one bad name raise inside the callback
    print("%-6d %-12.12s %-2d %-16s %-16s %-4d" % (event.pid,
        event.task.decode('utf-8', 'replace'), event.ip,
        inet_ntop(AF_INET6, event.daddr),
        inet_ntop(AF_INET6, event.saddr), event.lport))

# initialize BPF
b = BPF(text=bpf_text)

# header
if args.timestamp:
    print("%-9s" % ("TIME(s)"), end="")
print("%-6s %-12s %-2s %-16s %-16s %-4s" % ("PID", "COMM", "IP", "RADDR",
    "LADDR", "LPORT"))

# timestamp of the first printed event; 0 means none seen yet (the event
# callbacks latch it so that -t output is relative to the first event)
start_ts = 0

# read events
b["ipv4_events"].open_perf_buffer(print_ipv4_event)
b["ipv6_events"].open_perf_buffer(print_ipv6_event)
while 1:
    try:
        b.perf_buffer_poll()
    except KeyboardInterrupt:
        # Ctrl-C is the normal way to stop tracing: leave without a traceback
        exit()