123197Smckusick /* 229156Smckusick * Copyright (c) 1982, 1986 Regents of the University of California. 332789Sbostic * All rights reserved. 423197Smckusick * 544492Sbostic * %sccs.include.redist.c% 632789Sbostic * 7*57433Sandrew * @(#)tcp_var.h 7.11 (Berkeley) 01/08/93 823197Smckusick */ 94808Swnj 104808Swnj /* 114808Swnj * Kernel variables for tcp. 124808Swnj */ 134808Swnj 144808Swnj /* 155166Swnj * Tcp control block, one per tcp; fields: 164808Swnj */ 174881Swnj struct tcpcb { 185076Swnj struct tcpiphdr *seg_next; /* sequencing queue */ 195076Swnj struct tcpiphdr *seg_prev; 205246Sroot short t_state; /* state of this connection */ 215092Swnj short t_timer[TCPT_NTIMERS]; /* tcp timers */ 225166Swnj short t_rxtshift; /* log(2) of rexmt exp. backoff */ 2332034Skarels short t_rxtcur; /* current retransmit value */ 2432099Skarels short t_dupacks; /* consecutive dup acks recd */ 2527068Skarels u_short t_maxseg; /* maximum segment size */ 265246Sroot char t_force; /* 1 if forcing out a byte */ 27*57433Sandrew u_short t_flags; 28*57433Sandrew #define TF_ACKNOW 0x0001 /* ack peer immediately */ 29*57433Sandrew #define TF_DELACK 0x0002 /* ack, but try to delay it */ 30*57433Sandrew #define TF_NODELAY 0x0004 /* don't delay packets to coalesce */ 31*57433Sandrew #define TF_NOOPT 0x0008 /* don't use tcp options */ 32*57433Sandrew #define TF_SENTFIN 0x0010 /* have sent FIN */ 33*57433Sandrew #define TF_REQ_SCALE 0x0020 /* have/will request window scaling */ 34*57433Sandrew #define TF_RCVD_SCALE 0x0040 /* other side has requested scaling */ 35*57433Sandrew #define TF_REQ_TSTMP 0x0080 /* have/will request timestamps */ 36*57433Sandrew #define TF_RCVD_TSTMP 0x0100 /* a timestamp was received in SYN */ 37*57433Sandrew #define TF_SACK_PERMIT 0x0200 /* other side said I could SACK */ 38*57433Sandrew 394881Swnj struct tcpiphdr *t_template; /* skeletal packet for transmit */ 405067Swnj struct inpcb *t_inpcb; /* back pointer to internet pcb */ 414808Swnj /* 425067Swnj * The following fields are used as in the protocol specification. 435067Swnj * See RFC783, Dec. 1981, page 21. 444808Swnj */ 455067Swnj /* send sequence variables */ 465067Swnj tcp_seq snd_una; /* send unacknowledged */ 475067Swnj tcp_seq snd_nxt; /* send next */ 485067Swnj tcp_seq snd_up; /* send urgent pointer */ 495067Swnj tcp_seq snd_wl1; /* window update seg seq number */ 505067Swnj tcp_seq snd_wl2; /* window update seg ack number */ 515067Swnj tcp_seq iss; /* initial send sequence number */ 52*57433Sandrew u_long snd_wnd; /* send window */ 535067Swnj /* receive sequence variables */ 54*57433Sandrew u_long rcv_wnd; /* receive window */ 555067Swnj tcp_seq rcv_nxt; /* receive next */ 565067Swnj tcp_seq rcv_up; /* receive urgent pointer */ 575067Swnj tcp_seq irs; /* initial receive sequence number */ 585067Swnj /* 595067Swnj * Additional variables for this implementation. 605067Swnj */ 615076Swnj /* receive variables */ 625076Swnj tcp_seq rcv_adv; /* advertised window */ 635067Swnj /* retransmit variables */ 6444376Skarels tcp_seq snd_max; /* highest sequence number sent; 6517359Skarels * used to recognize retransmits 6617359Skarels */ 6732099Skarels /* congestion control (for slow start, source quench, retransmit after loss) */ 68*57433Sandrew u_long snd_cwnd; /* congestion-controlled window */ 69*57433Sandrew u_long snd_ssthresh; /* snd_cwnd size threshhold for 7032099Skarels * for slow start exponential to 7144376Skarels * linear switch 7244376Skarels */ 7331726Skarels /* 7444376Skarels * transmit timing stuff. See below for scale of srtt and rttvar. 7532099Skarels * "Variance" is actually smoothed difference. 7631726Skarels */ 775166Swnj short t_idle; /* inactivity time */ 785166Swnj short t_rtt; /* round trip time */ 795166Swnj tcp_seq t_rtseq; /* sequence number being timed */ 8031726Skarels short t_srtt; /* smoothed round-trip time */ 8131726Skarels short t_rttvar; /* variance in round-trip time */ 8244376Skarels u_short t_rttmin; /* minimum rtt allowed */ 83*57433Sandrew u_long max_sndwnd; /* largest window peer has offered */ 8444376Skarels 855443Swnj /* out-of-band data */ 865443Swnj char t_oobflags; /* have some */ 875550Swnj char t_iobc; /* input character */ 885443Swnj #define TCPOOB_HAVEDATA 0x01 8924822Skarels #define TCPOOB_HADDATA 0x02 9044376Skarels short t_softerror; /* possible error not yet reported */ 91*57433Sandrew 92*57433Sandrew /* RFC 1323 variables */ 93*57433Sandrew u_char snd_scale; /* window scaling for send window */ 94*57433Sandrew u_char rcv_scale; /* window scaling for recv window */ 95*57433Sandrew u_char request_r_scale; /* pending window scaling */ 96*57433Sandrew u_char requested_s_scale; 97*57433Sandrew u_long ts_recent; /* timestamp echo data */ 98*57433Sandrew u_long ts_recent_age; /* when last updated */ 99*57433Sandrew tcp_seq last_ack_sent; 1005067Swnj }; 1014808Swnj 1024881Swnj #define intotcpcb(ip) ((struct tcpcb *)(ip)->inp_ppcb) 1034881Swnj #define sototcpcb(so) (intotcpcb(sotoinpcb(so))) 1044881Swnj 10530527Skarels /* 10644376Skarels * The smoothed round-trip time and estimated variance 10744376Skarels * are stored as fixed point numbers scaled by the values below. 10844376Skarels * For convenience, these scales are also used in smoothing the average 10944376Skarels * (smoothed = (1/scale)sample + ((scale-1)/scale)smoothed). 11044376Skarels * With these scales, srtt has 3 bits to the right of the binary point, 11144376Skarels * and thus an "ALPHA" of 0.875. rttvar has 2 bits to the right of the 11244376Skarels * binary point, and is smoothed with an ALPHA of 0.75. 11344376Skarels */ 11444376Skarels #define TCP_RTT_SCALE 8 /* multiplier for srtt; 3 bits frac. */ 11544376Skarels #define TCP_RTT_SHIFT 3 /* shift for srtt; 3 bits frac. */ 11644376Skarels #define TCP_RTTVAR_SCALE 4 /* multiplier for rttvar; 2 bits */ 11744376Skarels #define TCP_RTTVAR_SHIFT 2 /* multiplier for rttvar; 2 bits */ 11844376Skarels 11944376Skarels /* 12044376Skarels * The initial retransmission should happen at rtt + 4 * rttvar. 12144376Skarels * Because of the way we do the smoothing, srtt and rttvar 12244376Skarels * will each average +1/2 tick of bias. When we compute 12344376Skarels * the retransmit timer, we want 1/2 tick of rounding and 12444376Skarels * 1 extra tick because of +-1/2 tick uncertainty in the 12544376Skarels * firing of the timer. The bias will give us exactly the 12644376Skarels * 1.5 tick we need. But, because the bias is 12744376Skarels * statistical, we have to test that we don't drop below 12844376Skarels * the minimum feasible timer (which is 2 ticks). 12944376Skarels * This macro assumes that the value of TCP_RTTVAR_SCALE 13044376Skarels * is the same as the multiplier for rttvar. 13144376Skarels */ 13244376Skarels #define TCP_REXMTVAL(tp) \ 13344376Skarels (((tp)->t_srtt >> TCP_RTT_SHIFT) + (tp)->t_rttvar) 13444376Skarels 13544376Skarels /* XXX 13644376Skarels * We want to avoid doing m_pullup on incoming packets but that 13744376Skarels * means avoiding dtom on the tcp reassembly code. That in turn means 13844376Skarels * keeping an mbuf pointer in the reassembly queue (since we might 13944376Skarels * have a cluster). As a quick hack, the source & destination 14044376Skarels * port numbers (which are no longer needed once we've located the 14144376Skarels * tcpcb) are overlayed with an mbuf pointer. 14244376Skarels */ 14344376Skarels #define REASS_MBUF(ti) (*(struct mbuf **)&((ti)->ti_t)) 14444376Skarels 14544376Skarels /* 14630527Skarels * TCP statistics. 14730527Skarels * Many of these should be kept per connection, 14830527Skarels * but that's inconvenient at the moment. 14930527Skarels */ 1504926Swnj struct tcpstat { 15130527Skarels u_long tcps_connattempt; /* connections initiated */ 15230527Skarels u_long tcps_accepts; /* connections accepted */ 15330527Skarels u_long tcps_connects; /* connections established */ 15430527Skarels u_long tcps_drops; /* connections dropped */ 15530527Skarels u_long tcps_conndrops; /* embryonic connections dropped */ 15630527Skarels u_long tcps_closed; /* conn. closed (includes drops) */ 15730527Skarels u_long tcps_segstimed; /* segs where we tried to get rtt */ 15830527Skarels u_long tcps_rttupdated; /* times we succeeded */ 15930527Skarels u_long tcps_delack; /* delayed acks sent */ 16030527Skarels u_long tcps_timeoutdrop; /* conn. dropped in rxmt timeout */ 16130527Skarels u_long tcps_rexmttimeo; /* retransmit timeouts */ 16230527Skarels u_long tcps_persisttimeo; /* persist timeouts */ 16330527Skarels u_long tcps_keeptimeo; /* keepalive timeouts */ 16430527Skarels u_long tcps_keepprobe; /* keepalive probes sent */ 16530527Skarels u_long tcps_keepdrops; /* connections dropped in keepalive */ 16630527Skarels 16730527Skarels u_long tcps_sndtotal; /* total packets sent */ 16830527Skarels u_long tcps_sndpack; /* data packets sent */ 16930527Skarels u_long tcps_sndbyte; /* data bytes sent */ 17030527Skarels u_long tcps_sndrexmitpack; /* data packets retransmitted */ 17130527Skarels u_long tcps_sndrexmitbyte; /* data bytes retransmitted */ 17230527Skarels u_long tcps_sndacks; /* ack-only packets sent */ 17330527Skarels u_long tcps_sndprobe; /* window probes sent */ 17430527Skarels u_long tcps_sndurg; /* packets sent with URG only */ 17530527Skarels u_long tcps_sndwinup; /* window update-only packets sent */ 17630527Skarels u_long tcps_sndctrl; /* control (SYN|FIN|RST) packets sent */ 17730527Skarels 17830527Skarels u_long tcps_rcvtotal; /* total packets received */ 17930527Skarels u_long tcps_rcvpack; /* packets received in sequence */ 18030527Skarels u_long tcps_rcvbyte; /* bytes received in sequence */ 18130527Skarels u_long tcps_rcvbadsum; /* packets received with ccksum errs */ 18230527Skarels u_long tcps_rcvbadoff; /* packets received with bad offset */ 18330527Skarels u_long tcps_rcvshort; /* packets received too short */ 18430527Skarels u_long tcps_rcvduppack; /* duplicate-only packets received */ 18530527Skarels u_long tcps_rcvdupbyte; /* duplicate-only bytes received */ 18630527Skarels u_long tcps_rcvpartduppack; /* packets with some duplicate data */ 18730527Skarels u_long tcps_rcvpartdupbyte; /* dup. bytes in part-dup. packets */ 18830527Skarels u_long tcps_rcvoopack; /* out-of-order packets received */ 18930527Skarels u_long tcps_rcvoobyte; /* out-of-order bytes received */ 19030527Skarels u_long tcps_rcvpackafterwin; /* packets with data after window */ 19130527Skarels u_long tcps_rcvbyteafterwin; /* bytes rcvd after window */ 19230527Skarels u_long tcps_rcvafterclose; /* packets rcvd after "close" */ 19330527Skarels u_long tcps_rcvwinprobe; /* rcvd window probe packets */ 19430527Skarels u_long tcps_rcvdupack; /* rcvd duplicate acks */ 19530527Skarels u_long tcps_rcvacktoomuch; /* rcvd acks for unsent data */ 19630527Skarels u_long tcps_rcvackpack; /* rcvd ack packets */ 19730527Skarels u_long tcps_rcvackbyte; /* bytes acked by rcvd acks */ 19830527Skarels u_long tcps_rcvwinupd; /* rcvd window update packets */ 199*57433Sandrew u_long tcps_pawsdrop; /* segments dropped due to PAWS */ 2004926Swnj }; 2014926Swnj 2024808Swnj #ifdef KERNEL 2035067Swnj struct inpcb tcb; /* head of queue of active tcpcb's */ 2045067Swnj struct tcpstat tcpstat; /* tcp statistics */ 205*57433Sandrew u_long tcp_now; /* for RFC 1323 timestamps */ 2064881Swnj struct tcpiphdr *tcp_template(); 20710398Ssam struct tcpcb *tcp_close(), *tcp_drop(); 20810398Ssam struct tcpcb *tcp_timers(), *tcp_disconnect(), *tcp_usrclosed(); 2094808Swnj #endif 210