1 /*-
2 * SPDX-License-Identifier: BSD-2-Clause
3 *
4 * Copyright (c) 2016-2020 Netflix, Inc.
5 *
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions
8 * are met:
9 * 1. Redistributions of source code must retain the above copyright
10 * notice, this list of conditions and the following disclaimer.
11 * 2. Redistributions in binary form must reproduce the above copyright
12 * notice, this list of conditions and the following disclaimer in the
13 * documentation and/or other materials provided with the distribution.
14 *
15 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
16 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
21 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25 * SUCH DAMAGE.
26 */
27
28 #ifndef __tcp_log_buf_h__
29 #define __tcp_log_buf_h__
30
31 #define TCP_LOG_REASON_LEN 32
32 #define TCP_LOG_TAG_LEN 32
33 #define TCP_LOG_BUF_VER (9)
34
35 /*
36 * Because the (struct tcp_log_buffer) includes 8-byte uint64_t's, it requires
37 * 8-byte alignment to work properly on all platforms. Therefore, we will
38 * enforce 8-byte alignment for all the structures that may appear by
39 * themselves (instead of being embedded in another structure) in a data
40 * stream.
41 */
42 #define ALIGN_TCP_LOG __aligned(8)
43
44 /* Information about the socketbuffer state. */
45 struct tcp_log_sockbuf
46 {
47 uint32_t tls_sb_acc; /* available chars (sb->sb_acc) */
48 uint32_t tls_sb_ccc; /* claimed chars (sb->sb_ccc) */
49 uint32_t tls_sb_spare; /* spare */
50 };
51
52 /* Optional, verbose information that may be appended to an event log. */
53 struct tcp_log_verbose
54 {
55 #define TCP_FUNC_LEN 32
56 char tlv_snd_frm[TCP_FUNC_LEN]; /* tcp_output() caller */
57 char tlv_trace_func[TCP_FUNC_LEN]; /* Function that
58 generated trace */
59 uint32_t tlv_trace_line; /* Line number that generated trace */
60 uint8_t _pad[4];
61 } ALIGN_TCP_LOG;
62
63 /* Internal RACK state variables. */
64 struct tcp_log_rack
65 {
66 uint32_t tlr_rack_rtt; /* rc_rack_rtt */
67 uint8_t tlr_state; /* Internal RACK state */
68 uint8_t _pad[3]; /* Padding */
69 };
70
71 struct tcp_log_bbr {
72 uint64_t cur_del_rate;
73 uint64_t delRate;
74 uint64_t rttProp;
75 uint64_t bw_inuse;
76 uint32_t inflight;
77 uint32_t applimited;
78 uint32_t delivered;
79 uint32_t timeStamp;
80 uint32_t epoch;
81 uint32_t lt_epoch;
82 uint32_t pkts_out;
83 uint32_t flex1;
84 uint32_t flex2;
85 uint32_t flex3;
86 uint32_t flex4;
87 uint32_t flex5;
88 uint32_t flex6;
89 uint32_t lost;
90 uint16_t pacing_gain;
91 uint16_t cwnd_gain;
92 uint16_t flex7;
93 uint8_t bbr_state;
94 uint8_t bbr_substate;
95 uint8_t inhpts;
96 uint8_t __spare;
97 uint8_t use_lt_bw;
98 uint8_t flex8;
99 uint32_t pkt_epoch;
100 };
101
102 /* shadows tcp_log_bbr struct element sizes */
103 struct tcp_log_raw {
104 uint64_t u64_flex[4];
105 uint32_t u32_flex[14];
106 uint16_t u16_flex[3];
107 uint8_t u8_flex[6];
108 uint32_t u32_flex2[1];
109 };
110
111 struct tcp_log_uint64 {
112 uint64_t u64_flex[13];
113 };
114
115 struct tcp_log_sendfile {
116 uint64_t offset;
117 uint64_t length;
118 uint32_t flags;
119 };
120
121 /*
122 * tcp_log_stackspecific is currently being used as "event specific" log
123 * info by all stacks (i.e. struct tcp_log_bbr is used for generic event
124 * logging). Until this is cleaned up more generically and throughout,
125 * allow events to use the same space in the union.
126 */
127 union tcp_log_stackspecific
128 {
129 struct tcp_log_rack u_rack;
130 struct tcp_log_bbr u_bbr;
131 struct tcp_log_sendfile u_sf;
132 struct tcp_log_raw u_raw; /* "raw" log access */
133 struct tcp_log_uint64 u64_raw; /* just u64's - used by process info */
134 };
135
136 typedef union tcp_log_stackspecific tcp_log_eventspecific_t;
137
138 struct tcp_log_buffer
139 {
140 /* Event basics */
141 struct timeval tlb_tv; /* Timestamp of trace */
142 uint32_t tlb_ticks; /* Timestamp of trace */
143 uint32_t tlb_sn; /* Serial number */
144 uint8_t tlb_stackid; /* Stack ID */
145 uint8_t tlb_eventid; /* Event ID */
146 uint16_t tlb_eventflags; /* Flags for the record */
147 #define TLB_FLAG_RXBUF 0x0001 /* Includes receive buffer info */
148 #define TLB_FLAG_TXBUF 0x0002 /* Includes send buffer info */
149 #define TLB_FLAG_HDR 0x0004 /* Includes a TCP header */
150 #define TLB_FLAG_VERBOSE 0x0008 /* Includes function/line numbers */
151 #define TLB_FLAG_STACKINFO 0x0010 /* Includes stack-specific info */
152 int tlb_errno; /* Event error (if any) */
153
154 /* Internal session state */
155 struct tcp_log_sockbuf tlb_rxbuf; /* Receive buffer */
156 struct tcp_log_sockbuf tlb_txbuf; /* Send buffer */
157
158 int tlb_state; /* TCPCB t_state */
159 uint32_t tlb_starttime; /* TCPCB t_starttime */
160 uint32_t tlb_iss; /* TCPCB iss */
161 uint32_t tlb_flags; /* TCPCB flags */
162 uint32_t tlb_snd_una; /* TCPCB snd_una */
163 uint32_t tlb_snd_max; /* TCPCB snd_max */
164 uint32_t tlb_snd_cwnd; /* TCPCB snd_cwnd */
165 uint32_t tlb_snd_nxt; /* TCPCB snd_nxt */
166 uint32_t tlb_snd_recover;/* TCPCB snd_recover */
167 uint32_t tlb_snd_wnd; /* TCPCB snd_wnd */
168 uint32_t tlb_snd_ssthresh; /* TCPCB snd_ssthresh */
169 uint32_t tlb_srtt; /* TCPCB t_srtt */
170 uint32_t tlb_rttvar; /* TCPCB t_rttvar */
171 uint32_t tlb_rcv_up; /* TCPCB rcv_up */
172 uint32_t tlb_rcv_adv; /* TCPCB rcv_adv */
173 uint32_t tlb_flags2; /* TCPCB t_flags2 */
174 uint32_t tlb_rcv_nxt; /* TCPCB rcv_nxt */
175 uint32_t tlb_rcv_wnd; /* TCPCB rcv_wnd */
176 uint32_t tlb_dupacks; /* TCPCB t_dupacks */
177 int tlb_segqlen; /* TCPCB segqlen */
178 int tlb_snd_numholes; /* TCPCB snd_numholes */
179 uint32_t tlb_flex1; /* Event specific information */
180 uint32_t tlb_flex2; /* Event specific information */
181 uint32_t tlb_fbyte_in; /* TCPCB first byte in time */
182 uint32_t tlb_fbyte_out; /* TCPCB first byte out time */
183 uint8_t tlb_snd_scale:4, /* TCPCB snd_scale */
184 tlb_rcv_scale:4; /* TCPCB rcv_scale */
185 uint8_t _pad[3]; /* Padding */
186 /* Per-stack info */
187 union tcp_log_stackspecific tlb_stackinfo;
188 #define tlb_rack tlb_stackinfo.u_rack
189
190 /* The packet */
191 uint32_t tlb_len; /* The packet's data length */
192 struct tcphdr tlb_th; /* The TCP header */
193 uint8_t tlb_opts[TCP_MAXOLEN]; /* The TCP options */
194
195 /* Verbose information (optional) */
196 struct tcp_log_verbose tlb_verbose[0];
197 } ALIGN_TCP_LOG;
198
199 enum tcp_log_events {
200 TCP_LOG_IN = 1, /* Incoming packet 1 */
201 TCP_LOG_OUT, /* Transmit (without other event) 2 */
202 TCP_LOG_RTO, /* Retransmit timeout 3 */
203 TCP_LOG_SB_WAKE, /* Awaken socket buffer 4 */
204 TCP_UNUSED_5, /* Detected bad retransmission 5 */
205 TCP_LOG_PRR, /* Doing PRR 6 */
206 TCP_UNUSED_7, /* Detected reorder 7 */
207 TCP_LOG_HPTS, /* Hpts sending a packet 8 */
208 BBR_LOG_BBRUPD, /* We updated BBR info 9 */
209 BBR_LOG_BBRSND, /* We did a slot calculation and sending is done 10 */
210 BBR_LOG_ACKCLEAR, /* A ack clears all outstanding 11 */
211 TCP_UNUSED_12, /* The tcb had a packet input to it 12 */
212 BBR_LOG_TIMERSTAR, /* Start a timer 13 */
213 BBR_LOG_TIMERCANC, /* Cancel a timer 14 */
214 BBR_LOG_ENTREC, /* Entered recovery 15 */
215 BBR_LOG_EXITREC, /* Exited recovery 16 */
216 BBR_LOG_CWND, /* Cwnd change 17 */
217 BBR_LOG_BWSAMP, /* LT B/W sample has been made 18 */
218 BBR_LOG_MSGSIZE, /* We received a EMSGSIZE error 19 */
219 BBR_LOG_BBRRTT, /* BBR RTT is updated 20 */
220 BBR_LOG_JUSTRET, /* We just returned out of output 21 */
221 BBR_LOG_STATE, /* A BBR state change occurred 22 */
222 BBR_LOG_PKT_EPOCH, /* A BBR packet epoch occurred 23 */
223 BBR_LOG_PERSIST, /* BBR changed to/from a persists 24 */
224 TCP_LOG_FLOWEND, /* End of a flow 25 */
225 BBR_LOG_RTO, /* BBR's timeout includes BBR info 26 */
226 BBR_LOG_DOSEG_DONE, /* hpts do_segment completes 27 */
227 BBR_LOG_EXIT_GAIN, /* hpts do_segment completes 28 */
228 BBR_LOG_THRESH_CALC, /* Doing threshold calculation 29 */
229 TCP_LOG_MAPCHG, /* Map Changes to the sendmap 30 */
230 TCP_LOG_USERSEND, /* User level sends data 31 */
231 BBR_RSM_CLEARED, /* RSM cleared of ACK flags 32 */
232 BBR_LOG_STATE_TARGET, /* Log of target at state 33 */
233 BBR_LOG_TIME_EPOCH, /* A timed based Epoch occurred 34 */
234 BBR_LOG_TO_PROCESS, /* A to was processed 35 */
235 BBR_LOG_BBRTSO, /* TSO update 36 */
236 BBR_LOG_HPTSDIAG, /* Hpts diag insert 37 */
237 BBR_LOG_LOWGAIN, /* Low gain accounting 38 */
238 BBR_LOG_PROGRESS, /* Progress timer event 39 */
239 TCP_LOG_SOCKET_OPT, /* A socket option is set 40 */
240 BBR_LOG_TIMERPREP, /* A BBR var to debug out TLP issues 41 */
241 BBR_LOG_ENOBUF_JMP, /* We had a enobuf jump 42 */
242 BBR_LOG_HPTSI_CALC, /* calc the hptsi time 43 */
243 BBR_LOG_RTT_SHRINKS, /* We had a log reduction of rttProp 44 */
244 BBR_LOG_BW_RED_EV, /* B/W reduction events 45 */
245 BBR_LOG_REDUCE, /* old bbr log reduce for 4.1 and earlier 46*/
246 TCP_LOG_RTT, /* A rtt (in useconds) is being sampled and applied to the srtt algo 47 */
247 BBR_LOG_SETTINGS_CHG, /* Settings changed for loss response 48 */
248 TCP_UNUSED_49, /* SRTT gaining -- now not used 49 */
249 TCP_LOG_REASS, /* Reassembly buffer logging 50 */
250 TCP_HDWR_PACE_SIZE, /* TCP pacing size set (rl and rack uses this) 51 */
251 BBR_LOG_HDWR_PACE, /* TCP Hardware pacing log 52 */
252 BBR_LOG_TSTMP_VAL, /* Temp debug timestamp validation 53 */
253 TCP_LOG_CONNEND, /* End of connection 54 */
254 TCP_LOG_LRO, /* LRO entry 55 */
255 TCP_SACK_FILTER_RES, /* Results of SACK Filter 56 */
256 TCP_UNUSED_57, /* Sack Attack Detection 57 */
257 TCP_TIMELY_WORK, /* Logs regarding Timely CC tweaks 58 */
258 TCP_UNUSED_59, /* User space event data 59 */
259 TCP_LOG_SENDFILE, /* sendfile() logging for TCP connections 60 */
260 TCP_LOG_REQ_T, /* logging of request tracking 61 */
261 TCP_LOG_ACCOUNTING, /* Log of TCP Accounting data 62 */
262 TCP_LOG_FSB, /* FSB information 63 */
263 RACK_DSACK_HANDLING, /* Handling of DSACK in rack for reordering window 64 */
264 TCP_HYSTART, /* TCP Hystart logging 65 */
265 TCP_CHG_QUERY, /* Change query during fnc_init() 66 */
266 TCP_RACK_LOG_COLLAPSE, /* Window collapse by peer 67 */
267 TCP_RACK_TP_TRIGGERED, /* A rack tracepoint is triggered 68 */
268 TCP_HYBRID_PACING_LOG, /* Hybrid pacing log 69 */
269 TCP_LOG_PRU, /* TCP protocol user request 70 */
270 TCP_UNUSED_71, /* old TCP Policer detectionn, not used 71 */
271 TCP_PCM_MEASURE, /* TCP Path Capacity Measurement 72 */
272 TCP_LOG_END /* End (keep at end) 73 */
273 };
274
275 enum tcp_log_states {
276 TCP_LOG_STATE_RATIO_OFF = -2, /* Log ratio evaluation yielded an OFF
277 result. Only used for tlb_logstate */
278 TCP_LOG_STATE_CLEAR = -1, /* Deactivate and clear tracing. Passed
279 to tcp_log_state_change() but never
280 stored in any logstate variable */
281 TCP_LOG_STATE_OFF = 0, /* Pause */
282
283 /* Positively numbered states represent active logging modes */
284 TCP_LOG_STATE_TAIL=1, /* Keep the trailing events */
285 TCP_LOG_STATE_HEAD=2, /* Keep the leading events */
286 TCP_LOG_STATE_HEAD_AUTO=3, /* Keep the leading events, and
287 automatically dump them to the
288 device */
289 TCP_LOG_STATE_CONTINUAL=4, /* Continually dump the data when full */
290 TCP_LOG_STATE_TAIL_AUTO=5, /* Keep the trailing events, and
291 automatically dump them when the
292 session ends */
293 TCP_LOG_VIA_BBPOINTS=6 /* Log only if the BB point has been configured */
294 };
295
296 /* Use this if we don't know whether the operation succeeded. */
297 #define ERRNO_UNK (-1)
298
299 /*
300 * If the user included dev/tcp_log/tcp_log_dev.h, then include our private
301 * headers. Otherwise, there is no reason to pollute all the files with an
302 * additional include.
303 *
304 * This structure is aligned to an 8-byte boundary to match the alignment
305 * requirements of (struct tcp_log_buffer).
306 */
307 #ifdef __tcp_log_dev_h__
308 struct tcp_log_header {
309 struct tcp_log_common_header tlh_common;
310 #define tlh_version tlh_common.tlch_version
311 #define tlh_type tlh_common.tlch_type
312 #define tlh_length tlh_common.tlch_length
313 struct in_endpoints tlh_ie;
314 struct timeval tlh_offset; /* Uptime -> UTC offset */
315 char tlh_id[TCP_LOG_ID_LEN];
316 char tlh_reason[TCP_LOG_REASON_LEN];
317 char tlh_tag[TCP_LOG_TAG_LEN];
318 uint8_t tlh_af;
319 uint8_t _pad[7];
320 } ALIGN_TCP_LOG;
321
322 #ifdef _KERNEL
323 struct tcp_log_dev_log_queue {
324 struct tcp_log_dev_queue tldl_common;
325 char tldl_id[TCP_LOG_ID_LEN];
326 char tldl_reason[TCP_LOG_REASON_LEN];
327 char tldl_tag[TCP_LOG_TAG_LEN];
328 struct in_endpoints tldl_ie;
329 struct tcp_log_stailq tldl_entries;
330 int tldl_count;
331 uint8_t tldl_af;
332 };
333 #endif /* _KERNEL */
334 #endif /* __tcp_log_dev_h__ */
335
336 /*
337 * Defined BBPOINTS that can be used
338 * with TCP_LOG_VIA_BBPOINTS.
339 */
340 #define TCP_BBPOINT_NONE 0
341 #define TCP_BBPOINT_REQ_LEVEL_LOGGING 1
342
343 /*********************/
344 /* TCP Trace points */
345 /*********************/
346 /*
347 * TCP trace points are interesting points within
348 * the TCP code that the author/debugger may want
349 * to have BB logging enabled if we hit that point.
350 * In order to enable a trace point you set the
351 * sysctl var net.inet.tcp.bb.tp.number to
352 * one of the numbers listed below. You also
353 * must make sure net.inet.tcp.bb.tp.bbmode is
354 * non-zero, the default is 4 for continuous tracing.
355 * You also set in the number of connections you want
356 * have get BB logs in net.inet.tcp.bb.tp.count.
357 *
358 * Count will decrement every time BB logging is assigned
359 * to a connection that hit your tracepoint.
360 *
361 * You can enable all trace points by setting the number
362 * to 0xffffffff. You can disable all trace points by
363 * setting number to zero (or count to 0).
364 *
365 * Below are the enumerated list of tracepoints that
366 * have currently been defined in the code. Add more
367 * as you add a call to rack_trace_point(rack, <name>);
368 * where <name> is defined below.
369 */
370 #define TCP_TP_HWENOBUF 0x00000001 /* When we are doing hardware pacing and hit enobufs */
371 #define TCP_TP_ENOBUF 0x00000002 /* When we hit enobufs with software pacing */
372 #define TCP_TP_COLLAPSED_WND 0x00000003 /* When a peer to collapses its rwnd on us */
373 #define TCP_TP_COLLAPSED_RXT 0x00000004 /* When we actually retransmit a collapsed window rsm */
374 #define TCP_TP_REQ_LOG_FAIL 0x00000005 /* We tried to allocate a Request log but had no space */
375 #define TCP_TP_RESET_RCV 0x00000006 /* Triggers when we receive a RST */
376 #define TCP_TP_POLICER_DET 0x00000007 /* When we detect a policer */
377 #define TCP_TP_EXCESS_RXT TCP_TP_POLICER_DET /* alias */
378 #define TCP_TP_SAD_TRIGGERED 0x00000008 /* Sack Attack Detection triggers */
379 #define TCP_TP_SAD_SUSPECT 0x0000000a /* A sack has supicious information in it */
380 #define TCP_TP_PACED_BOTTOM 0x0000000b /* We have paced at the bottom */
381
382 #ifdef _KERNEL
383
384 extern uint32_t tcp_trace_point_config;
385 extern uint32_t tcp_trace_point_bb_mode;
386 extern int32_t tcp_trace_point_count;
387
388 /*
389 * Returns true if any sort of BB logging is enabled,
390 * commonly used throughout the codebase.
391 */
392 static inline int
tcp_bblogging_on(struct tcpcb * tp)393 tcp_bblogging_on(struct tcpcb *tp)
394 {
395 if (tp->_t_logstate <= TCP_LOG_STATE_OFF)
396 return (0);
397 if (tp->_t_logstate == TCP_LOG_VIA_BBPOINTS)
398 return (0);
399 return (1);
400 }
401
402 /*
403 * Returns true if we match a specific bbpoint when
404 * in TCP_LOG_VIA_BBPOINTS, but also returns true
405 * for all the other logging states.
406 */
407 static inline int
tcp_bblogging_point_on(struct tcpcb * tp,uint8_t bbpoint)408 tcp_bblogging_point_on(struct tcpcb *tp, uint8_t bbpoint)
409 {
410 if (tp->_t_logstate <= TCP_LOG_STATE_OFF)
411 return (0);
412 if ((tp->_t_logstate == TCP_LOG_VIA_BBPOINTS) &&
413 (tp->_t_logpoint == bbpoint))
414 return (1);
415 else if (tp->_t_logstate == TCP_LOG_VIA_BBPOINTS)
416 return (0);
417 return (1);
418 }
419
420 static inline void
tcp_set_bblog_state(struct tcpcb * tp,uint8_t ls,uint8_t bbpoint)421 tcp_set_bblog_state(struct tcpcb *tp, uint8_t ls, uint8_t bbpoint)
422 {
423 if ((ls == TCP_LOG_VIA_BBPOINTS) &&
424 (tp->_t_logstate == TCP_LOG_STATE_OFF)){
425 /*
426 * We don't allow a BBPOINTS set to override
427 * other types of BB logging set by other means such
428 * as the bb_ratio/bb_state URL parameters. In other
429 * words BBlogging must be *off* in order to turn on
430 * a BBpoint.
431 */
432 tp->_t_logpoint = bbpoint;
433 tp->_t_logstate = ls;
434 } else if (ls < TCP_LOG_VIA_BBPOINTS) {
435 tp->_t_logpoint = TCP_BBPOINT_NONE;
436 tp->_t_logstate = ls;
437 }
438 }
439
440 static inline uint32_t
tcp_get_bblog_state(struct tcpcb * tp)441 tcp_get_bblog_state(struct tcpcb *tp)
442 {
443 return (tp->_t_logstate);
444 }
445
446 static inline void
tcp_trace_point(struct tcpcb * tp,int num)447 tcp_trace_point(struct tcpcb *tp, int num)
448 {
449 #ifdef TCP_BLACKBOX
450 if (((tcp_trace_point_config == num) ||
451 (tcp_trace_point_config == 0xffffffff)) &&
452 (tcp_trace_point_bb_mode != 0) &&
453 (tcp_trace_point_count > 0) &&
454 (tcp_bblogging_on(tp) == 0)) {
455 int res;
456 res = atomic_fetchadd_int(&tcp_trace_point_count, -1);
457 if (res > 0) {
458 tcp_set_bblog_state(tp, tcp_trace_point_bb_mode, TCP_BBPOINT_NONE);
459 } else {
460 /* Loss a race assure its zero now */
461 tcp_trace_point_count = 0;
462 }
463 }
464 #endif
465 }
466
467 #define TCP_LOG_BUF_DEFAULT_SESSION_LIMIT 5000
468 #define TCP_LOG_BUF_DEFAULT_GLOBAL_LIMIT 5000000
469
470 /*
471 * TCP_LOG_EVENT_VERBOSE: The same as TCP_LOG_EVENT, except it always
472 * tries to record verbose information.
473 */
474 #define TCP_LOG_EVENT_VERBOSE(tp, th, rxbuf, txbuf, eventid, errornum, len, stackinfo, th_hostorder, tv) \
475 do { \
476 if (tcp_bblogging_on(tp)) \
477 tcp_log_event(tp, th, rxbuf, txbuf, eventid, \
478 errornum, len, stackinfo, th_hostorder, \
479 tp->t_output_caller, __func__, __LINE__, tv);\
480 } while (0)
481
482 /*
483 * TCP_LOG_EVENT: This is a macro so we can capture function/line
484 * information when needed. You can use the macro when you are not
485 * doing a lot of prep in the stack specific information i.e. you
486 * don't add extras (stackinfo). If you are adding extras which
487 * means filling out a stack variable instead use the tcp_log_event()
488 * function but enclose the call to the log (and all the setup) in a
489 * if (tcp_bblogging_on(tp)) {
490 * ... setup and logging call ...
491 * }
492 *
493 * Always use the macro tcp_bblogging_on() since sometimes the defintions
494 * do change.
495 *
496 * BBlogging also supports the concept of a BBpoint. The idea behind this
497 * is that when you set a specific BBpoint on and turn the logging into
498 * the BBpoint mode (TCP_LOG_VIA_BBPOINTS) you will be defining very very
499 * few of these points to come out. The point is specific to a code you
500 * want tied to that one BB logging. This allows you to turn on a much broader
501 * scale set of limited logging on more connections without overwhelming the
502 * I/O system with too much BBlogs. This of course means you need to be quite
503 * careful on how many BBlogs go with each point, but you can have multiple points
504 * only one of which is active at a time.
505 *
506 * To define a point you add it above under the define for TCP_BBPOINT_NONE (which
507 * is the default i.e. no point is defined. You then, for your point use the
508 * tcp_bblogging_point_on(struct tcpcb *tp, uint8_t bbpoint) inline to enclose
509 * your call to tcp_log_event. Do not use one of the TCP_LOGGING macros else
510 * your point will never come out. You specify your defined point in the bbpoint
511 * side of the inline. An example of this you can find in rack where the
512 * TCP_BBPOINT_REQ_LEVEL_LOGGING is used. There a specific set of logs are generated
513 * for each request that tcp is tracking.
514 *
515 * When turning on BB logging use the inline:
516 * tcp_set_bblog_state(struct tcpcb *tp, uint8_t ls, uint8_t bbpoint)
517 * the ls field is the logging state TCP_LOG_STATE_CONTINUAL etc. The
518 * bbpoint field is ignored unless the ls field is set to TCP_LOG_VIA_BBPOINTS.
519 * Currently there is only a socket option that turns on the non-BBPOINT
520 * logging.
521 *
522 * Prototype:
523 * TCP_LOG_EVENT(struct tcpcb *tp, struct tcphdr *th, struct sockbuf *rxbuf,
524 * struct sockbuf *txbuf, uint8_t eventid, int errornum,
525 * union tcp_log_stackspecific *stackinfo)
526 *
527 * tp is mandatory and must be write locked.
528 * th is optional; if present, it will appear in the record.
529 * rxbuf and txbuf are optional; if present, they will appear in the record.
530 * eventid is mandatory.
531 * errornum is mandatory (it indicates the success or failure of the
532 * operation associated with the event).
533 * len indicates the length of the packet. If no packet, use 0.
534 * stackinfo is optional; if present, it will appear in the record.
535 */
536 struct tcpcb;
537 #ifdef TCP_LOG_FORCEVERBOSE
538 #define TCP_LOG_EVENT TCP_LOG_EVENT_VERBOSE
539 #else
540 #define TCP_LOG_EVENT(tp, th, rxbuf, txbuf, eventid, errornum, len, stackinfo, th_hostorder) \
541 do { \
542 if (tcp_log_verbose) \
543 TCP_LOG_EVENT_VERBOSE(tp, th, rxbuf, txbuf, \
544 eventid, errornum, len, stackinfo, \
545 th_hostorder, NULL); \
546 else if (tcp_bblogging_on(tp)) \
547 tcp_log_event(tp, th, rxbuf, txbuf, eventid, \
548 errornum, len, stackinfo, th_hostorder, \
549 NULL, NULL, 0, NULL); \
550 } while (0)
551 #endif /* TCP_LOG_FORCEVERBOSE */
552 #define TCP_LOG_EVENTP(tp, th, rxbuf, txbuf, eventid, errornum, len, stackinfo, th_hostorder, tv) \
553 do { \
554 if (tcp_bblogging_on(tp)) \
555 tcp_log_event(tp, th, rxbuf, txbuf, eventid, \
556 errornum, len, stackinfo, th_hostorder, \
557 NULL, NULL, 0, tv); \
558 } while (0)
559
560 #ifdef TCP_BLACKBOX
561 extern bool tcp_log_verbose;
562 void tcp_log_drain(struct tcpcb *tp);
563 int tcp_log_dump_tp_logbuf(struct tcpcb *tp, char *reason, int how, bool force);
564 void tcp_log_dump_tp_bucket_logbufs(struct tcpcb *tp, char *reason);
565 struct tcp_log_buffer *tcp_log_event(struct tcpcb *tp, struct tcphdr *th, struct sockbuf *rxbuf,
566 struct sockbuf *txbuf, uint8_t eventid, int errornum, uint32_t len,
567 union tcp_log_stackspecific *stackinfo, int th_hostorder,
568 const char *output_caller, const char *func, int line, const struct timeval *tv);
569 size_t tcp_log_get_id(struct tcpcb *tp, char *buf);
570 size_t tcp_log_get_tag(struct tcpcb *tp, char *buf);
571 u_int tcp_log_get_id_cnt(struct tcpcb *tp);
572 int tcp_log_getlogbuf(struct sockopt *sopt, struct tcpcb *tp);
573 void tcp_log_init(void);
574 int tcp_log_set_id(struct tcpcb *tp, char *id);
575 int tcp_log_set_tag(struct tcpcb *tp, char *tag);
576 int tcp_log_state_change(struct tcpcb *tp, int state);
577 void tcp_log_tcpcbinit(struct tcpcb *tp);
578 void tcp_log_tcpcbfini(struct tcpcb *tp);
579 void tcp_log_flowend(struct tcpcb *tp);
580 void tcp_log_sendfile(struct socket *so, off_t offset, size_t nbytes,
581 int flags);
582 int tcp_log_apply_ratio(struct tcpcb *tp, int ratio);
583 #else /* !TCP_BLACKBOX */
584 #define tcp_log_verbose (false)
585
586 static inline struct tcp_log_buffer *
tcp_log_event(struct tcpcb * tp,struct tcphdr * th,struct sockbuf * rxbuf,struct sockbuf * txbuf,uint8_t eventid,int errornum,uint32_t len,union tcp_log_stackspecific * stackinfo,int th_hostorder,const char * output_caller,const char * func,int line,const struct timeval * tv)587 tcp_log_event(struct tcpcb *tp, struct tcphdr *th, struct sockbuf *rxbuf,
588 struct sockbuf *txbuf, uint8_t eventid, int errornum, uint32_t len,
589 union tcp_log_stackspecific *stackinfo, int th_hostorder,
590 const char *output_caller, const char *func, int line,
591 const struct timeval *tv)
592 {
593
594 return (NULL);
595 }
596 #endif /* TCP_BLACKBOX */
597
598 #endif /* _KERNEL */
599 #endif /* __tcp_log_buf_h__ */
600