天天看点

tcp tso

根据Linux的协议栈,在发送tcp数据时,最终会调用如下函数:

文件 net/ipv4/tcp.c 

int tcp_sendmsg(struct kiocb *iocb, struct sock *sk, struct msghdr *msg, size_t size)

在此函数中,要根据mss来将大数据拆分成小封包发送到网络上。

mss是通过如下函数获取的:

mss_now = tcp_send_mss(sk, &size_goal, flags);

/*
 * Compute the two sizes used by the send path for socket sk.
 *
 * Returns the value of tcp_current_mss(sk) and, through *size_goal,
 * stores the value of tcp_xmit_size_goal() for that mss.
 * The third argument passed to tcp_xmit_size_goal() is non-zero only
 * when MSG_OOB is NOT set in flags.
 */
static int tcp_send_mss(struct sock *sk, int *size_goal, int flags)

{

         int mss_now;

         mss_now = tcp_current_mss(sk);

         /* large_allowed == !(flags & MSG_OOB): a large goal is not requested for MSG_OOB sends */
         *size_goal = tcp_xmit_size_goal(sk, mss_now, !(flags & MSG_OOB));

         return mss_now;

}

tcp_current_mss返回TCP连接建立时协商的MSS,并考虑协商的TCP选项。

tcp_xmit_size_goal考虑网卡是否支持gso:如果网卡支持gso,则基于网卡的gso max size(减去各层协议头长度)计算发送目标大小size_goal,该值通过tcp_send_mss的size_goal参数返回,而不是作为mss返回。

/*
 * Excerpt: compute the transmit size goal for socket sk.
 *
 * In the visible code, when large_allowed is non-zero and
 * sk_can_gso(sk) is true, the goal is derived from sk->sk_gso_max_size
 * minus the header lengths below. The function returns the larger of
 * xmit_size_goal and mss_now.
 *
 * NOTE(review): the "…" lines are elisions made by the article; the
 * declarations of xmit_size_goal and tp, and the closing brace of the
 * if-block, are presumably in the elided parts — confirm against the
 * kernel source.
 */
static unsigned int tcp_xmit_size_goal(struct sock *sk, u32 mss_now,

                                            int large_allowed)

{

         …

if (large_allowed && sk_can_gso(sk)) {

                   /* start from (gso max size - 1) and subtract the network, extension and TCP header lengths */
                   xmit_size_goal = ((sk->sk_gso_max_size - 1) -

                                      inet_csk(sk)->icsk_af_ops->net_header_len -

                                      inet_csk(sk)->icsk_ext_hdr_len -

                                      tp->tcp_header_len);

         …

         /* the returned goal is never smaller than mss_now */
         return max(xmit_size_goal, mss_now);

}

socket创建时对gso的设置:

/*
 * Set up the socket's route capability bits (sk->sk_route_caps) from
 * the device behind the route entry dst, and record GSO-related state.
 *
 * sk:  socket whose sk_route_caps / sk_gso_max_size are updated
 * dst: route entry; its dev->features and dev->gso_max_size are read
 */
void sk_setup_caps(struct sock *sk, struct dst_entry *dst)

{

         __sk_dst_set(sk, dst);

         /* start from the feature bits of the output device */
         sk->sk_route_caps = dst->dev->features;

         /* if the device has NETIF_F_GSO, also enable the NETIF_F_GSO_SOFTWARE bits */
         if (sk->sk_route_caps & NETIF_F_GSO)

                   sk->sk_route_caps |= NETIF_F_GSO_SOFTWARE;

         /* drop every capability listed in sk_route_nocaps */
         sk->sk_route_caps &= ~sk->sk_route_nocaps;

         if (sk_can_gso(sk)) {

                   if (dst->header_len) {

                            /* non-zero dst->header_len: clear all NETIF_F_GSO_MASK bits */
                            sk->sk_route_caps &= ~NETIF_F_GSO_MASK;

                   } else {

                            /* GSO stays enabled: also set SG and HW_CSUM, and copy the device's gso_max_size */
                            sk->sk_route_caps |= NETIF_F_SG | NETIF_F_HW_CSUM;

                            sk->sk_gso_max_size = dst->dev->gso_max_size;

                   }

         }

}

//完整的看一下gso对tcp发包过程的影响

/*
 * Excerpt of tcp_sendmsg() showing where the GSO-aware sizes and the
 * scatter-gather flag are obtained, and how copied data is attached to
 * the skb as page fragments.
 *
 * NOTE(review): "..." / "......" are elisions made by the article. The
 * locals used here (sk, mss_now, size_goal, flags, sg, merge, skb, i,
 * page, off, copy) are declared in the elided parts; sk is presumably
 * derived from the sock parameter — confirm against the kernel source.
 */
int tcp_sendmsg(struct kiocb *iocb, struct socket *sock, struct msghdr *msg,

                   size_t size)

{

         mss_now = tcp_send_mss(sk, &size_goal, flags); // mss after taking GSO into account

         /* non-zero when the route capabilities include NETIF_F_SG */
         sg = sk->sk_route_caps & NETIF_F_SG;

   ...

if (merge) {

          /* merge case: grow the previous fragment (index i - 1) by copy bytes */
          skb_shinfo(skb)->frags[i - 1].size +=      copy;

   } else {

          skb_fill_page_desc(skb, i, page, off, copy); // sets up how the skb data is stored

          /* call get_page() on the page; when TCP_PAGE(sk) is unset, do so only if off + copy < PAGE_SIZE */
          if (TCP_PAGE(sk)) {

               get_page(page);

          } else if (off + copy < PAGE_SIZE) {

                get_page(page);

                /* remember the page on the socket — presumably so later writes can reuse it; verify */
                TCP_PAGE(sk) = page;

          }

    }

......

}

//填充tcp数据分片结构:

/*
 * Fill page-fragment descriptor i of an skb.
 *
 * NOTE(review): the parameter list is abbreviated to "()" in the
 * article; judging from the call site skb_fill_page_desc(skb, i, page,
 * off, copy) the parameters are presumably (skb, i, page, off, size) —
 * confirm against the kernel source.
 */
skb_fill_page_desc()

{

         /* descriptor slot i in the skb's shared info */
         skb_frag_t *frag = &skb_shinfo(skb)->frags[i];

         frag->page                  = page;

         frag->page_offset    = off;

         frag->size                    = size;

         /* fragment count becomes i + 1, i.e. slot i is now the last used fragment */
         skb_shinfo(skb)->nr_frags = i + 1;

}

继续阅读