net: Consistent skb timestamping

author Eric Dumazet <eric.dumazet@gmail.com>

Sun, 16 May 2010 06:57:10 +0000 (23:57 -0700)

committer David S. Miller <davem@davemloft.net>

Sun, 16 May 2010 06:57:10 +0000 (23:57 -0700)
author Eric Dumazet <eric.dumazet@gmail.com>
Sun, 16 May 2010 06:57:10 +0000 (23:57 -0700)
committer David S. Miller <davem@davemloft.net>
Sun, 16 May 2010 06:57:10 +0000 (23:57 -0700)
diff --git a/Documentation/sysctl/net.txt b/Documentation/sysctl/net.txt

index df38ef046f8d1372ef2ff0d45debb7b15c04f64c..cbd05ffc606baa1ca06c59ca0c2ab19cac6c8e62 100644 (file)
--- a/Documentation/sysctl/net.txt
+++ b/Documentation/sysctl/net.txt
@@ -84,6 +84,16 @@ netdev_max_backlog
  Maximum number  of  packets,  queued  on  the  INPUT  side, when the interface
  receives packets faster than kernel can process them.
  
  Maximum number  of  packets,  queued  on  the  INPUT  side, when the interface
  receives packets faster than kernel can process them.
  
+netdev_tstamp_prequeue
+----------------------
+
+If set to 0, RX packet timestamps can be sampled after RPS processing, when
+the target CPU processes packets. This may delay timestamps slightly, but
+allows the load to be distributed across several CPUs.
+
+If set to 1 (default), timestamps are sampled as soon as possible, before
+queueing.
+
  optmem_max
  ----------
  
  optmem_max
  ----------
  
diff --git a/include/linux/netdevice.h b/include/linux/netdevice.h

index 69022d47d6f2ee5848af3f2211e0c3f2007633c1..c1b2341897c25681191f64bf99024c59531937ac 100644 (file)
--- a/include/linux/netdevice.h
+++ b/include/linux/netdevice.h
@@ -2100,6 +2100,7 @@ extern const struct net_device_stats *dev_get_stats(struct net_device *dev);
  extern void            dev_txq_stats_fold(const struct net_device *dev, struct net_device_stats *stats);
  
  extern int             netdev_max_backlog;
  extern void            dev_txq_stats_fold(const struct net_device *dev, struct net_device_stats *stats);
  
  extern int             netdev_max_backlog;
+extern int             netdev_tstamp_prequeue;
  extern int             weight_p;
  extern int             netdev_set_master(struct net_device *dev, struct net_device *master);
  extern int skb_checksum_help(struct sk_buff *skb);
  extern int             weight_p;
  extern int             netdev_set_master(struct net_device *dev, struct net_device *master);
  extern int skb_checksum_help(struct sk_buff *skb);
diff --git a/net/core/dev.c b/net/core/dev.c

index 5cbba0927a8e57eec79f062bd93e0fb0137a1dfe..988e42912e722c07739cf82f2f5b04c1310cd7c2 100644 (file)
--- a/net/core/dev.c
+++ b/net/core/dev.c
@@ -1454,7 +1454,7 @@ void net_disable_timestamp(void)
  }
  EXPORT_SYMBOL(net_disable_timestamp);
  
  }
  EXPORT_SYMBOL(net_disable_timestamp);
  
-static inline void net_timestamp(struct sk_buff *skb)
+static inline void net_timestamp_set(struct sk_buff *skb)
  {
         if (atomic_read(&netstamp_needed))
                 __net_timestamp(skb);
  {
         if (atomic_read(&netstamp_needed))
                 __net_timestamp(skb);
@@ -1462,6 +1462,12 @@ static inline void net_timestamp(struct sk_buff *skb)
                 skb->tstamp.tv64 = 0;
  }
  
                 skb->tstamp.tv64 = 0;
  }
  
+static inline void net_timestamp_check(struct sk_buff *skb)
+{
+       if (!skb->tstamp.tv64 && atomic_read(&netstamp_needed))
+               __net_timestamp(skb);
+}
+
  /**
   * dev_forward_skb - loopback an skb to another netif
   *
  /**
   * dev_forward_skb - loopback an skb to another netif
   *
@@ -1508,9 +1514,9 @@ static void dev_queue_xmit_nit(struct sk_buff *skb, struct net_device *dev)
  
  #ifdef CONFIG_NET_CLS_ACT
         if (!(skb->tstamp.tv64 && (G_TC_FROM(skb->tc_verd) & AT_INGRESS)))
  
  #ifdef CONFIG_NET_CLS_ACT
         if (!(skb->tstamp.tv64 && (G_TC_FROM(skb->tc_verd) & AT_INGRESS)))
-               net_timestamp(skb);
+               net_timestamp_set(skb);
  #else
  #else
-       net_timestamp(skb);
+       net_timestamp_set(skb);
  #endif
  
         rcu_read_lock();
  #endif
  
         rcu_read_lock();
@@ -2201,6 +2207,7 @@ EXPORT_SYMBOL(dev_queue_xmit);
    =======================================================================*/
  
  int netdev_max_backlog __read_mostly = 1000;
    =======================================================================*/
  
  int netdev_max_backlog __read_mostly = 1000;
+int netdev_tstamp_prequeue __read_mostly = 1;
  int netdev_budget __read_mostly = 300;
  int weight_p __read_mostly = 64;            /* old backlog weight */
  
  int netdev_budget __read_mostly = 300;
  int weight_p __read_mostly = 64;            /* old backlog weight */
  
@@ -2465,8 +2472,8 @@ int netif_rx(struct sk_buff *skb)
         if (netpoll_rx(skb))
                 return NET_RX_DROP;
  
         if (netpoll_rx(skb))
                 return NET_RX_DROP;
  
-       if (!skb->tstamp.tv64)
-               net_timestamp(skb);
+       if (netdev_tstamp_prequeue)
+               net_timestamp_check(skb);
  
  #ifdef CONFIG_RPS
         {
  
  #ifdef CONFIG_RPS
         {
@@ -2791,8 +2798,8 @@ static int __netif_receive_skb(struct sk_buff *skb)
         int ret = NET_RX_DROP;
         __be16 type;
  
         int ret = NET_RX_DROP;
         __be16 type;
  
-       if (!skb->tstamp.tv64)
-               net_timestamp(skb);
+       if (!netdev_tstamp_prequeue)
+               net_timestamp_check(skb);
  
         if (vlan_tx_tag_present(skb) && vlan_hwaccel_do_receive(skb))
                 return NET_RX_SUCCESS;
  
         if (vlan_tx_tag_present(skb) && vlan_hwaccel_do_receive(skb))
                 return NET_RX_SUCCESS;
@@ -2910,23 +2917,28 @@ out:
   */
  int netif_receive_skb(struct sk_buff *skb)
  {
   */
  int netif_receive_skb(struct sk_buff *skb)
  {
+       if (netdev_tstamp_prequeue)
+               net_timestamp_check(skb);
+
  #ifdef CONFIG_RPS
  #ifdef CONFIG_RPS
-       struct rps_dev_flow voidflow, *rflow = &voidflow;
-       int cpu, ret;
+       {
+               struct rps_dev_flow voidflow, *rflow = &voidflow;
+               int cpu, ret;
  
  
-       rcu_read_lock();
+               rcu_read_lock();
+
+               cpu = get_rps_cpu(skb->dev, skb, &rflow);
  
  
-       cpu = get_rps_cpu(skb->dev, skb, &rflow);
+               if (cpu >= 0) {
+                       ret = enqueue_to_backlog(skb, cpu, &rflow->last_qtail);
+                       rcu_read_unlock();
+               } else {
+                       rcu_read_unlock();
+                       ret = __netif_receive_skb(skb);
+               }
  
  
-       if (cpu >= 0) {
-               ret = enqueue_to_backlog(skb, cpu, &rflow->last_qtail);
-               rcu_read_unlock();
-       } else {
-               rcu_read_unlock();
-               ret = __netif_receive_skb(skb);
+               return ret;
         }
         }
-
-       return ret;
  #else
         return __netif_receive_skb(skb);
  #endif
  #else
         return __netif_receive_skb(skb);
  #endif
diff --git a/net/core/sysctl_net_core.c b/net/core/sysctl_net_core.c

index dcc7d25996ab32f3687b148100107a1b0f1e0ec6..01eee5d984be4b6d838357a56e0211508d0e31ba 100644 (file)
--- a/net/core/sysctl_net_core.c
+++ b/net/core/sysctl_net_core.c
@@ -121,6 +121,13 @@ static struct ctl_table net_core_table[] = {
                 .mode           = 0644,
                 .proc_handler   = proc_dointvec
         },
                 .mode           = 0644,
                 .proc_handler   = proc_dointvec
         },
+       {
+               .procname       = "netdev_tstamp_prequeue",
+               .data           = &netdev_tstamp_prequeue,
+               .maxlen         = sizeof(int),
+               .mode           = 0644,
+               .proc_handler   = proc_dointvec
+       },
         {
                 .procname       = "message_cost",
                 .data           = &net_ratelimit_state.interval,
         {
                 .procname       = "message_cost",
                 .data           = &net_ratelimit_state.interval,
author	Eric Dumazet <eric.dumazet@gmail.com>
	Sun, 16 May 2010 06:57:10 +0000 (23:57 -0700)
committer	David S. Miller <davem@davemloft.net>
	Sun, 16 May 2010 06:57:10 +0000 (23:57 -0700)
Documentation/sysctl/net.txt		patch | blob | history
include/linux/netdevice.h		patch | blob | history
net/core/dev.c		patch | blob | history
net/core/sysctl_net_core.c		patch | blob | history