xen-netback: disable rogue vif in kthread context
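The gist of the change: xenvif_fatal_tx_err() can be reached from a context that must not sleep (the comment added in the last hunk notes the interface cannot be disabled in softirq context), so instead of calling xenvif_carrier_off() directly it now only sets vif->disabled and kicks the rx kthread, which takes the carrier down the next time it wakes. As a rough illustration of that defer-to-worker pattern, here is a small self-contained userspace sketch using pthreads; it is an analogy only, not netback code, and the names fatal_tx_err, vif_worker and the flag variables are made up for the example.

/* Userspace analogue of the defer-to-kthread pattern (illustrative only). */
#include <pthread.h>
#include <stdbool.h>
#include <stdio.h>

static pthread_mutex_t lock = PTHREAD_MUTEX_INITIALIZER;
static pthread_cond_t wq = PTHREAD_COND_INITIALIZER;
static bool disabled;      /* analogue of vif->disabled */
static bool should_stop;   /* analogue of kthread_should_stop() */

/* Error path: runs where we must not sleep, so only flag and wake the worker. */
static void fatal_tx_err(void)
{
	pthread_mutex_lock(&lock);
	disabled = true;
	pthread_cond_signal(&wq);          /* analogue of xenvif_kick_thread() */
	pthread_mutex_unlock(&lock);
}

/* Worker thread: the only place that performs the actual teardown. */
static void *vif_worker(void *arg)
{
	(void)arg;
	pthread_mutex_lock(&lock);
	for (;;) {
		while (!disabled && !should_stop)  /* analogue of wait_event_interruptible() */
			pthread_cond_wait(&wq, &lock);
		if (disabled) {
			/* work that may sleep goes here, cf. xenvif_carrier_off() */
			printf("carrier off: interface disabled\n");
			disabled = false;
		}
		if (should_stop)
			break;
	}
	pthread_mutex_unlock(&lock);
	return NULL;
}

int main(void)
{
	pthread_t tid;

	pthread_create(&tid, NULL, vif_worker, NULL);
	fatal_tx_err();                    /* pretend a malformed request was seen */

	pthread_mutex_lock(&lock);
	should_stop = true;
	pthread_cond_signal(&wq);
	pthread_mutex_unlock(&lock);
	pthread_join(tid, NULL);
	return 0;
}

The patch itself follows the same shape: the error path sets vif->disabled and calls xenvif_kick_thread(), and the rx kthread checks the flag (plus netif_carrier_ok()) after its wait_event_interruptible() before calling xenvif_carrier_off().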
[firefly-linux-kernel-4.4.55.git] drivers/net/xen-netback/netback.c
index 5d2dd1d54173040f82ccafedf713ca8b3d930422..3f021e054ba1cc004dacde3f82df06a4e90e03a2 100644
@@ -56,7 +56,7 @@ bool separate_tx_rx_irq = 1;
 module_param(separate_tx_rx_irq, bool, 0644);
 
 /* When guest ring is filled up, qdisc queues the packets for us, but we have
- * to timeout them, otherwise other guests' packets can get stucked there
+ * to timeout them, otherwise other guests' packets can get stuck there
  */
 unsigned int rx_drain_timeout_msecs = 10000;
 module_param(rx_drain_timeout_msecs, uint, 0444);
@@ -99,6 +99,9 @@ static inline unsigned long idx_to_kaddr(struct xenvif *vif,
        return (unsigned long)pfn_to_kaddr(idx_to_pfn(vif, idx));
 }
 
+#define callback_param(vif, pending_idx) \
+       (vif->pending_tx_info[pending_idx].callback_struct)
+
 /* Find the containing VIF's structure from a pointer in pending_tx_info array
  */
 static inline struct xenvif* ubuf_to_vif(struct ubuf_info *ubuf)
@@ -188,8 +191,8 @@ static bool start_new_rx_buffer(int offset, unsigned long size, int head)
         * into multiple copies tend to give large frags their
         * own buffers as before.
         */
-       if ((offset + size > MAX_BUFFER_OFFSET) &&
-           (size <= MAX_BUFFER_OFFSET) && offset && !head)
+       BUG_ON(size > MAX_BUFFER_OFFSET);
+       if ((offset + size > MAX_BUFFER_OFFSET) && offset && !head)
                return true;
 
        return false;
@@ -508,6 +511,8 @@ static void xenvif_rx_action(struct xenvif *vif)
 
        while ((skb = skb_dequeue(&vif->rx_queue)) != NULL) {
                RING_IDX max_slots_needed;
+               RING_IDX old_req_cons;
+               RING_IDX ring_slots_used;
                int i;
 
                /* We need a cheap worse case estimate for the number of
@@ -519,9 +524,28 @@ static void xenvif_rx_action(struct xenvif *vif)
                                                PAGE_SIZE);
                for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
                        unsigned int size;
+                       unsigned int offset;
+
                        size = skb_frag_size(&skb_shinfo(skb)->frags[i]);
-                       max_slots_needed += DIV_ROUND_UP(size, PAGE_SIZE);
+                       offset = skb_shinfo(skb)->frags[i].page_offset;
+
+                       /* For a worse-case estimate we need to factor in
+                        * the fragment page offset as this will affect the
+                        * number of times xenvif_gop_frag_copy() will
+                        * call start_new_rx_buffer().
+                        */
+                       max_slots_needed += DIV_ROUND_UP(offset + size,
+                                                        PAGE_SIZE);
                }
+
+               /* To avoid the estimate becoming too pessimal for some
+                * frontends that limit posted rx requests, cap the estimate
+                * at MAX_SKB_FRAGS.
+                */
+               if (max_slots_needed > MAX_SKB_FRAGS)
+                       max_slots_needed = MAX_SKB_FRAGS;
+
+               /* We may need one more slot for GSO metadata */
                if (skb_is_gso(skb) &&
                   (skb_shinfo(skb)->gso_type & SKB_GSO_TCPV4 ||
                    skb_shinfo(skb)->gso_type & SKB_GSO_TCPV6))
@@ -536,8 +560,11 @@ static void xenvif_rx_action(struct xenvif *vif)
                } else
                        vif->rx_last_skb_slots = 0;
 
+               old_req_cons = vif->rx.req_cons;
                XENVIF_RX_CB(skb)->meta_slots_used = xenvif_gop_skb(skb, &npo);
-               BUG_ON(XENVIF_RX_CB(skb)->meta_slots_used > max_slots_needed);
+               ring_slots_used = vif->rx.req_cons - old_req_cons;
+
+               BUG_ON(ring_slots_used > max_slots_needed);
 
                __skb_queue_tail(&rxq, skb);
        }
@@ -684,7 +711,8 @@ static void xenvif_tx_err(struct xenvif *vif,
 static void xenvif_fatal_tx_err(struct xenvif *vif)
 {
        netdev_err(vif->dev, "fatal error; disabling device\n");
-       xenvif_carrier_off(vif);
+       vif->disabled = true;
+       xenvif_kick_thread(vif);
 }
 
 static int xenvif_count_requests(struct xenvif *vif,
@@ -1020,12 +1048,12 @@ static void xenvif_fill_frags(struct xenvif *vif, struct sk_buff *skb)
                /* If this is not the first frag, chain it to the previous*/
                if (unlikely(prev_pending_idx == INVALID_PENDING_IDX))
                        skb_shinfo(skb)->destructor_arg =
-                               &vif->pending_tx_info[pending_idx].callback_struct;
+                               &callback_param(vif, pending_idx);
                else if (likely(pending_idx != prev_pending_idx))
-                       vif->pending_tx_info[prev_pending_idx].callback_struct.ctx =
-                               &(vif->pending_tx_info[pending_idx].callback_struct);
+                       callback_param(vif, prev_pending_idx).ctx =
+                               &callback_param(vif, pending_idx);
 
-               vif->pending_tx_info[pending_idx].callback_struct.ctx = NULL;
+               callback_param(vif, pending_idx).ctx = NULL;
                prev_pending_idx = pending_idx;
 
                txp = &vif->pending_tx_info[pending_idx].req;
@@ -1185,7 +1213,7 @@ static unsigned xenvif_tx_build_gops(struct xenvif *vif, int budget)
                                   vif->tx.sring->req_prod, vif->tx.req_cons,
                                   XEN_NETIF_TX_RING_SIZE);
                        xenvif_fatal_tx_err(vif);
-                       continue;
+                       break;
                }
 
                work_to_do = RING_HAS_UNCONSUMED_REQUESTS(&vif->tx);
@@ -1395,13 +1423,13 @@ static int xenvif_tx_submit(struct xenvif *vif)
                memcpy(skb->data,
                       (void *)(idx_to_kaddr(vif, pending_idx)|txp->offset),
                       data_len);
-               vif->pending_tx_info[pending_idx].callback_struct.ctx = NULL;
+               callback_param(vif, pending_idx).ctx = NULL;
                if (data_len < txp->size) {
                        /* Append the packet payload as a fragment. */
                        txp->offset += data_len;
                        txp->size -= data_len;
                        skb_shinfo(skb)->destructor_arg =
-                               &vif->pending_tx_info[pending_idx].callback_struct;
+                               &callback_param(vif, pending_idx);
                } else {
                        /* Schedule a response immediately. */
                        xenvif_idx_unmap(vif, pending_idx);
@@ -1545,7 +1573,6 @@ static inline void xenvif_tx_dealloc_action(struct xenvif *vif)
                                            idx_to_kaddr(vif, pending_idx),
                                            GNTMAP_host_map,
                                            vif->grant_tx_handle[pending_idx]);
-                       /* Btw. already unmapped? */
                        xenvif_grant_handle_reset(vif, pending_idx);
                        ++gop;
                }
@@ -1678,12 +1705,20 @@ void xenvif_idx_unmap(struct xenvif *vif, u16 pending_idx)
                            idx_to_kaddr(vif, pending_idx),
                            GNTMAP_host_map,
                            vif->grant_tx_handle[pending_idx]);
-       /* Btw. already unmapped? */
        xenvif_grant_handle_reset(vif, pending_idx);
 
        ret = gnttab_unmap_refs(&tx_unmap_op, NULL,
                                &vif->mmap_pages[pending_idx], 1);
-       BUG_ON(ret);
+       if (ret) {
+               netdev_err(vif->dev,
+                          "Unmap fail: ret: %d pending_idx: %d host_addr: %llx handle: %x status: %d\n",
+                          ret,
+                          pending_idx,
+                          tx_unmap_op.host_addr,
+                          tx_unmap_op.handle,
+                          tx_unmap_op.status);
+               BUG();
+       }
 
        xenvif_idx_release(vif, pending_idx, XEN_NETIF_RSP_OKAY);
 }
@@ -1774,7 +1809,18 @@ int xenvif_kthread_guest_rx(void *data)
        while (!kthread_should_stop()) {
                wait_event_interruptible(vif->wq,
                                         rx_work_todo(vif) ||
+                                        vif->disabled ||
                                         kthread_should_stop());
+
+               /* This frontend is found to be rogue; disable it in
+                * kthread context. Currently this is only set when
+                * netback finds that the frontend sent a malformed
+                * packet, but we cannot disable the interface in
+                * softirq context, so we defer it here.
+                */
+               if (unlikely(vif->disabled && netif_carrier_ok(vif->dev)))
+                       xenvif_carrier_off(vif);
+
                if (kthread_should_stop())
                        break;