經過一個月的學習,對pf_ring DNA的內核部分有了一些認識,本文側重pf_ring對ixgbe的改動分析。
先說一說接收流程吧。接收流程(原文此處有一張流程圖,摘錄時已丟失)如下:
其中,硬中斷處理函數是ixgbe_msix_clean_rings( );軟中斷處理函數是net_rx_action( )。
pf_ring對ixgbe的改動主要在ixgbe_poll()和ixgbe_clean_rx_irq()中。
在ixgbe_poll( )中遍歷每個隊列並輪詢處理數據包,代碼如下。
/*
 * NAPI poll callback for one interrupt vector: reclaims completed TX work
 * and drains RX packets for every ring attached to this q_vector, within
 * the given budget.
 *
 * Returns `budget` to stay in polling mode (work remains), or 0 when all
 * work is done — in which case NAPI is completed and, if the device is
 * up, the queue interrupt is re-enabled.
 */
int ixgbe_poll(struct napi_struct *napi, int budget)
{
	struct ixgbe_q_vector *q_vector =
		container_of(napi, struct ixgbe_q_vector, napi);
	struct ixgbe_adapter *adapter = q_vector->adapter;
	struct ixgbe_ring *ring;
	int per_ring_budget;
	bool clean_complete = true;

#if defined(CONFIG_DCA) || defined(CONFIG_DCA_MODULE)
	/* Direct Cache Access, when configured. (The original author notes
	 * no measurable performance gain was observed from it.) */
	if (adapter->flags & IXGBE_FLAG_DCA_ENABLED)
		ixgbe_update_dca(q_vector);
#endif

	/* Reclaim resources consumed by completed transmissions */
	ixgbe_for_each_ring(ring, q_vector->tx)
		clean_complete &= ixgbe_clean_tx_irq(q_vector, ring);

#ifdef CONFIG_NET_RX_BUSY_POLL
	if (!ixgbe_qv_lock_napi(q_vector))
		return budget;
#endif

	/* attempt to distribute budget to each queue fairly, but don't allow
	 * the budget to go below 1 because we'll exit polling */
	if (q_vector->rx.count > 1)
		per_ring_budget = max(budget/q_vector->rx.count, 1);
	else
		per_ring_budget = budget; /* default budget is 64; with a
					   * single RX ring this branch runs */

	/* Walk every RX ring of this vector; a ring is "complete" when it
	 * processed fewer packets than its per-ring budget.
	 * (ixgbe_for_each_ring expands to:
	 *  for (ring = (q_vector->rx).ring; ring != NULL; ring = ring->next)) */
	ixgbe_for_each_ring(ring, q_vector->rx)
		clean_complete &= (ixgbe_clean_rx_irq(q_vector, ring,
				   per_ring_budget) < per_ring_budget);

#ifdef CONFIG_NET_RX_BUSY_POLL
	ixgbe_qv_unlock_napi(q_vector);
#endif

#ifndef HAVE_NETDEV_NAPI_LIST
	if (!netif_running(adapter->netdev))
		clean_complete = true;
#endif

	/* If all work not completed, return budget and keep polling */
	if (!clean_complete)
		return budget;

	/* all work done, exit the polling mode */
	napi_complete(napi);			/* mark this NAPI cycle finished */
	if (adapter->rx_itr_setting == 1)
		ixgbe_set_itr(q_vector);	/* adapt interrupt throttle rate */
	if (!test_bit(__IXGBE_DOWN, &adapter->state))	/* device is up */
		ixgbe_irq_enable_queues(adapter, ((u64)1 << q_vector->v_idx));	/* re-enable this queue's interrupt */

	return 0;
}
pf_ring的修改只有一處:
/* PF_RING's only change inside ixgbe_poll(): the interrupt re-enable is
 * skipped when DNA is active, i.e. in DNA mode the queue interrupt is
 * never re-enabled from here. */
#ifdef ENABLE_DNA
	if(!adapter->dna.dna_enabled)	/* DNA not enabled on this adapter */
#endif
		if (!test_bit(__IXGBE_DOWN, &adapter->state))	/* device is up */
			ixgbe_irq_enable_queues(adapter, ((u64)1 << q_vector->v_idx));	/* re-enable this queue's interrupt */
ixgbe_clean_rx_irq( )函數的代碼如下:
/*
 * Pull completed descriptors off the RX ring, turn the ring-buffer
 * contents into sk_buffs and hand them to the network stack.
 * Returns the number of packets processed; the caller (ixgbe_poll)
 * compares it against `budget` to decide whether to keep polling.
 */
static int ixgbe_clean_rx_irq(struct ixgbe_q_vector *q_vector,
			      struct ixgbe_ring *rx_ring,
			      int budget)
{
	unsigned int total_rx_bytes = 0, total_rx_packets = 0;
#ifdef IXGBE_FCOE
	int ddp_bytes = 0;
#endif /* IXGBE_FCOE */
	/* Number of used descriptors that may be given back to hardware.
	 * (The original author observed this printing 0, i.e. descriptors
	 * were under heavy pressure.) */
	u16 cleaned_count = ixgbe_desc_unused(rx_ring);

	do {
		union ixgbe_adv_rx_desc *rx_desc;	/* hardware descriptor */
		struct sk_buff *skb;			/* socket buffer */

		/* return some buffers to hardware, one at a time is too slow */
		if (cleaned_count >= IXGBE_RX_BUFFER_WRITE) {	/* >= 16 */
			/* replace consumed descriptors; advances next_to_use */
			ixgbe_alloc_rx_buffers(rx_ring, cleaned_count);
			cleaned_count = 0;
		}

		/* next_to_clean indexes the first descriptor the NIC may have
		 * finished with, i.e. the next candidate to pass up the stack */
		rx_desc = IXGBE_RX_DESC(rx_ring, rx_ring->next_to_clean);

		/* Descriptor Done bit clear: hardware has not finished this
		 * slot yet, so stop the whole loop. We only proceed on DD=1. */
		if (!ixgbe_test_staterr(rx_desc, IXGBE_RXD_STAT_DD))
			break;

		/*
		 * This memory barrier is needed to keep us from reading
		 * any other fields out of the rx_desc until we know the
		 * RXD_STAT_DD bit is set
		 */
		rmb();

		/* retrieve a buffer from the ring (allocates the skb) */
		skb = ixgbe_fetch_rx_buffer(rx_ring, rx_desc);

		/* exit if we failed to retrieve a buffer */
		if (!skb)
			break;

		cleaned_count++;

		/* place incomplete frames back on ring for completion.
		 * Returns false when EOP is set; it also bumps next_to_clean,
		 * which selects the rx_desc of the next iteration. On EOP=0
		 * we skip the rest of this iteration. */
		if (ixgbe_is_non_eop(rx_ring, rx_desc, skb))
			continue;

		/* verify the packet layout is correct; on a bad header the
		 * helper frees the skb and returns true */
		if (ixgbe_cleanup_headers(rx_ring, rx_desc, skb))
			continue;

		/* probably a little skewed due to removing CRC */
		total_rx_bytes += skb->len;

		/* populate checksum, timestamp, VLAN, and protocol */
		ixgbe_process_skb_fields(rx_ring, rx_desc, skb);

#ifdef IXGBE_FCOE
		/* if ddp, not passing to ULD unless for FCP_RSP or error */
		if (ixgbe_rx_is_fcoe(rx_ring, rx_desc)) {
			ddp_bytes = ixgbe_fcoe_ddp(q_vector->adapter,
						   rx_desc, skb);
			if (!ddp_bytes) {
				dev_kfree_skb_any(skb);
#ifndef NETIF_F_GRO
				netdev_ring(rx_ring)->last_rx = jiffies;
#endif
				continue;
			}
		}

#endif /* IXGBE_FCOE */
#ifdef CONFIG_NET_RX_BUSY_POLL
		skb_mark_napi_id(skb, &q_vector->napi);
#endif
		/* hand the skb to the stack (netif_receive_skb path) */
		ixgbe_rx_skb(q_vector, rx_ring, rx_desc, skb);

		/* update budget accounting */
		total_rx_packets++;
	} while (likely(total_rx_packets < budget));	/* budget reached? */

#ifdef IXGBE_FCOE
	/* include DDPed FCoE data */
	if (ddp_bytes > 0) {
		unsigned int mss;

		mss = netdev_ring(rx_ring)->mtu - sizeof(struct fcoe_hdr) -
			sizeof(struct fc_frame_header) -
			sizeof(struct fcoe_crc_eof);
		if (mss > 512)
			mss &= ~511;
		total_rx_bytes += ddp_bytes;
		total_rx_packets += DIV_ROUND_UP(ddp_bytes, mss);
	}

#endif /* IXGBE_FCOE */
	u64_stats_update_begin(&rx_ring->syncp);
	rx_ring->stats.packets += total_rx_packets;
	rx_ring->stats.bytes += total_rx_bytes;
	u64_stats_update_end(&rx_ring->syncp);
	q_vector->rx.total_packets += total_rx_packets;
	q_vector->rx.total_bytes += total_rx_bytes;

	/* cleaned_count descriptors are now free for the NIC to reuse:
	 * allocate pages and set up their streaming DMA mappings */
	if (cleaned_count)
		ixgbe_alloc_rx_buffers(rx_ring, cleaned_count);

#ifndef IXGBE_NO_LRO
	ixgbe_lro_flush_all(q_vector);

#endif /* IXGBE_NO_LRO */
	return total_rx_packets;
}
而pf_ring對ixgbe_clean_rx_irq( )函數的改動非常大:
/*
 * PF_RING's patched entry point: identical to the stock function except
 * for the ENABLE_DNA hook at the top, which diverts the whole RX cleanup
 * to PF_RING DNA's own routine when DNA is enabled.
 */
static int ixgbe_clean_rx_irq(struct ixgbe_q_vector *q_vector,
			      struct ixgbe_ring *rx_ring,
			      int budget)
{
	unsigned int total_rx_bytes = 0, total_rx_packets = 0;
#ifdef IXGBE_FCOE
	int ddp_bytes = 0;
#endif /* IXGBE_FCOE */
	u16 cleaned_count = ixgbe_desc_unused(rx_ring);

#ifdef ENABLE_DNA
	struct ixgbe_adapter *adapter = q_vector->adapter;

	/* Abandon Intel's stock processing and call PF_RING DNA's own
	 * cleanup function instead */
	if(adapter->dna.dna_enabled)
		return(dna_ixgbe_clean_rx_irq(q_vector, rx_ring, budget));
#endif
	..........................	/* rest identical to the stock driver (elided in the article) */
}
再來秀一秀dna_ixgbe_clean_rx_irq()函數吧:
/*
 * PF_RING DNA replacement for ixgbe_clean_rx_irq(). The kernel no longer
 * consumes packets here — a userland application maps the ring directly.
 * This handler only:
 *  - wakes up a sleeping userland reader when a packet has arrived
 *    (queue_in_use case), and
 *  - on 82598 hardware only, performs descriptor housekeeping for queues
 *    with no userland reader, restoring DMA addresses from the shadow
 *    descriptor table and advancing the RDT tail register.
 */
static bool dna_ixgbe_clean_rx_irq(struct ixgbe_q_vector *q_vector,
				   struct ixgbe_ring *rx_ring, int budget) {
	union ixgbe_adv_rx_desc *rx_desc, *shadow_rx_desc, *next_rx_desc;
	u32 staterr;
	u16 i, num_laps = 0, last_cleaned_idx;
	struct ixgbe_adapter *adapter = q_vector->adapter;
	struct ixgbe_hw *hw = &adapter->hw;
	unsigned int total_rx_packets = 0;

	/* start from the tail (RDT) register */
	last_cleaned_idx = i = IXGBE_READ_REG(hw, IXGBE_RDT(rx_ring->reg_idx));
	if(++i == rx_ring->count)
		i = 0;

	rx_ring->next_to_clean = i;

	//i = IXGBE_READ_REG(hw, IXGBE_RDT(rx_ring->reg_idx));
	rx_desc = IXGBE_RX_DESC(rx_ring, i);			/* fetch the descriptor */
	staterr = le32_to_cpu(rx_desc->wb.upper.status_error);	/* descriptor status */

	if(rx_ring->dna.queue_in_use) {	/* a userland app owns this RX queue */
		/*
		  A userland application is using the queue so it's not time to
		  mess up with indexes but just to wakeup apps (if waiting)
		*/

		/* trick for applications calling poll/select directly (indexes not in sync of one position at most) */
		if (!(staterr & IXGBE_RXD_STAT_DD)) {
			u16 next_i = i;
			if(++next_i == rx_ring->count) next_i = 0;
			next_rx_desc = IXGBE_RX_DESC(rx_ring, next_i);
			staterr = le32_to_cpu(next_rx_desc->wb.upper.status_error);
		}

		if(staterr & IXGBE_RXD_STAT_DD) {
			if(unlikely(enable_debug))
				printk(KERN_INFO "DNA: got a packet [index=%d]!\n", i);

			/* wake the reader blocked in poll/select, if any */
			if(waitqueue_active(&rx_ring->dna.rx_tx.rx.packet_waitqueue)) {
				wake_up_interruptible(&rx_ring->dna.rx_tx.rx.packet_waitqueue);
				rx_ring->dna.rx_tx.rx.interrupt_received = 1;

				if(unlikely(enable_debug))
					printk("%s(%s): woken up ring=%d, [slot=%d] XXX\n",
					       __FUNCTION__, rx_ring->netdev->name,
					       rx_ring->reg_idx, i);
			}
		}

		// goto dump_stats;
		return(!!budget);
	}

	/* Only 82598 needs kernel housekeeping (82599 does not need that thanks
	   to the drop bit), as the drop flag does not seem to work.
	   On non-82598 MACs we return here; 82599 packets are consumed
	   entirely through the userland mapping handled above. */
	if(adapter->hw.mac.type != ixgbe_mac_82598EB)
		return(!!budget);

	if( /* staterr || */ enable_debug) {
		printk("[DNA] %s(): %s@%d [used=%d][idx=%d][next_to_use=%u][#unused=%d][staterr=%d][full=%d][pkt_ptr=%llu]\n", __FUNCTION__,
		       rx_ring->netdev->name, rx_ring->queue_index,
		       rx_ring->dna.queue_in_use, i, rx_ring->next_to_use,
		       ixgbe_desc_unused(rx_ring), staterr, dna_ixgbe_rx_dump(rx_ring), rx_desc->read.pkt_addr);
	}

	/*
	  This RX queue is not in use (no userland program attached)

	  IMPORTANT
	  We need to poll queues not in use as otherwise they will stop the operations
	  also on queues where there is an application running that consumes the packets
	*/
	while(staterr & IXGBE_RXD_STAT_DD) {	/* walk every Descriptor-Done slot */
		/* the shadow descriptor table sits right after the real one */
		shadow_rx_desc = IXGBE_RX_DESC(rx_ring, i+rx_ring->count);
		rx_desc->wb.upper.status_error = 0, last_cleaned_idx = i;
		/* restore the packet/header DMA addresses from the shadow copy */
		rx_desc->read.hdr_addr = shadow_rx_desc->read.hdr_addr, rx_desc->read.pkt_addr = shadow_rx_desc->read.pkt_addr;

		rmb();	/* memory barrier: keep the descriptor writes ordered */

		// REMOVE BELOW
		// ixgbe_release_rx_desc(rx_ring, i); /* Not needed */

		i++, num_laps++, budget--;
		if(i == rx_ring->count)	/* ring wrap-around */
			i = 0;

		rx_desc = IXGBE_RX_DESC(rx_ring, i);	/* next descriptor */
		prefetch(rx_desc);			/* prefetch it */
		staterr = le32_to_cpu(rx_desc->wb.upper.status_error);

		if(budget == 0) break;
	}

	/* NOTE(review): total_rx_packets is never incremented in this
	 * function, so these two additions are no-ops kept over from the
	 * stock driver */
	rx_ring->stats.packets += total_rx_packets;
	// rx_ring->stats.bytes += total_rx_bytes;
	q_vector->rx.total_packets += total_rx_packets;
	// q_vector->rx.total_bytes += total_rx_bytes;

	/* Update the tail register with the last cleaned slot */
	rx_ring->next_to_clean = i, IXGBE_WRITE_REG(&adapter->hw, IXGBE_RDT(rx_ring->reg_idx), last_cleaned_idx);

	if(unlikely(enable_debug)) {	/* debug-only census of the whole ring */
		int j=0, full = 0, other = 0, null_dma = 0;
		struct ixgbe_rx_buffer *bi;

		for(j=0; j<rx_ring->count; j++) {
			rx_desc = IXGBE_RX_DESC(rx_ring, j);
			prefetch(rx_desc);
			staterr = le32_to_cpu(rx_desc->wb.upper.status_error);

			/* NOTE(review): indexes with i, not the loop variable
			 * j — looks like a bug in this debug census; verify
			 * against upstream PF_RING */
			bi = &rx_ring->rx_buffer_info[i];

			if(staterr & IXGBE_RXD_STAT_DD)
				full++;		/* Descriptor Done */
			else if(staterr)
				other++;	/* some other status bit */

			if(bi->dma == 0) null_dma++;
		}

		printk("[DNA] %s(): %s@%d [laps=%d][budget=%d][full=%d/other=%d][next_to_clean=%u][next_to_use=%d][#unused=%d][null_dma=%d]\n",
		       __FUNCTION__,
		       rx_ring->netdev->name, rx_ring->queue_index,
		       num_laps, budget, full, other,
		       rx_ring->next_to_clean, rx_ring->next_to_use,
		       ixgbe_desc_unused(rx_ring), null_dma);
	}

	return(!!budget);
}
其實,還有個很重要的函數ixgbe_alloc_rx_buffers( ),主要用來分配DMA page映射網卡的FIFO,代碼如下。
/*
 * Refill `cleaned_count` RX descriptors: allocate receive buffers (pages,
 * or 2048-byte skbs when packet split is disabled), create their streaming
 * DMA mappings, write the DMA addresses into the descriptors, and publish
 * the new tail via ixgbe_release_rx_desc().
 */
void ixgbe_alloc_rx_buffers(struct ixgbe_ring *rx_ring, u16 cleaned_count)
{
	union ixgbe_adv_rx_desc *rx_desc;
	struct ixgbe_rx_buffer *bi;
	/* next_to_use marks the first descriptor available for a new buffer;
	 * slots from here onward may be DMA-mapped and handed to hardware */
	u16 i = rx_ring->next_to_use;

	/* nothing to do */
	if (!cleaned_count)		/* no buffers need replacing */
		return;

	rx_desc = IXGBE_RX_DESC(rx_ring, i);	/* i-th descriptor */
	bi = &rx_ring->rx_buffer_info[i];	/* i-th buffer slot */
	/* bias i negative (u16 wraps) so the wrap test below is a cheap !i */
	i -= rx_ring->count;

	do {
#ifdef CONFIG_IXGBE_DISABLE_PACKET_SPLIT
		/* packet split disabled: allocate rx_buf_len (2048 bytes)
		 * and create a streaming mapping */
		if (!ixgbe_alloc_mapped_skb(rx_ring, bi))
#else
		/* default (packet split allowed): map a page, possibly
		 * from highmem */
		if (!ixgbe_alloc_mapped_page(rx_ring, bi))
#endif
			break;

		/*
		 * Refresh the desc even if buffer_addrs didn't change
		 * because each write-back erases this info.
		 */
#ifdef CONFIG_IXGBE_DISABLE_PACKET_SPLIT
		rx_desc->read.pkt_addr = cpu_to_le64(bi->dma);
#else
		/* default: point pkt_addr into the mapped page */
		rx_desc->read.pkt_addr = cpu_to_le64(bi->dma + bi->page_offset);
#endif

		rx_desc++;	/* next descriptor */
		bi++;		/* next buffer slot */
		i++;		/* next index (still negative-biased) */
		if (unlikely(!i)) {	/* wrapped: restart at slot 0 */
			rx_desc = IXGBE_RX_DESC(rx_ring, 0);
			bi = rx_ring->rx_buffer_info;	/* back to start */
			i -= rx_ring->count;		/* re-bias */
		}

		/* clear the hdr_addr for the next_to_use descriptor */
		rx_desc->read.hdr_addr = 0;

		cleaned_count--;	/* one fewer slot to refill */
	} while (cleaned_count);

	i += rx_ring->count;	/* undo the negative bias */

	if (rx_ring->next_to_use != i)	/* anything actually refilled? */
		ixgbe_release_rx_desc(rx_ring, i);	/* updates next_to_use and next_to_alloc */
}
而pf_ring也采用了它自己的函數dna_ixgbe_alloc_rx_buffers:
/* PF_RING's hook at the top of ixgbe_alloc_rx_buffers(): when DNA is
 * enabled, abandon Intel's allocator and use PF_RING DNA's own memory
 * scheme instead. */
#ifdef ENABLE_DNA
	struct ixgbe_adapter *adapter = netdev_priv(rx_ring->netdev);

	if(adapter->dna.dna_enabled) {
		if(rx_ring->netdev)
			dna_ixgbe_alloc_rx_buffers(rx_ring);
		return;
	}
#endif
/*
 * PF_RING DNA replacement for ixgbe_alloc_rx_buffers(): allocates the
 * ring's packet memory in large contiguous chunks, DMA-maps every slot,
 * duplicates the descriptor table into a "shadow" copy, sets up the
 * matching TX ring memory, and finally registers everything with the
 * PF_RING module so userland can map it. Runs once per ring (guarded by
 * dna.memory_allocated).
 */
void dna_ixgbe_alloc_rx_buffers(struct ixgbe_ring *rx_ring) {
	union ixgbe_adv_rx_desc *rx_desc, *shadow_rx_desc;
	struct ixgbe_rx_buffer *bi;
	u16 i;
	struct ixgbe_adapter *adapter = netdev_priv(rx_ring->netdev);
	struct ixgbe_hw *hw = &adapter->hw;
	u16 cache_line_size;
	struct ixgbe_ring *tx_ring = adapter->tx_ring[rx_ring->queue_index];
	struct pfring_hooks *hook = (struct pfring_hooks*)rx_ring->netdev->pfring_ptr;
	mem_ring_info rx_info = {0};
	mem_ring_info tx_info = {0};
	int num_slots_per_page;

	/* Check if the memory has been already allocated */
	if(rx_ring->dna.memory_allocated) return;

	/* nothing to do or no valid netdev defined */
	if (!netdev_ring(rx_ring)) return;

	if (!hook) {
		printk("[DNA] WARNING The PF_RING module is NOT loaded.\n");
		printk("[DNA] WARNING Please load it, before loading this module\n");
		return;
	}

	init_waitqueue_head(&rx_ring->dna.rx_tx.rx.packet_waitqueue);

	/* Read the PCI cache line size so packet slots can be aligned on it;
	 * fall back to 64 when the register reads 0 */
	cache_line_size = cpu_to_le16(IXGBE_READ_PCIE_WORD(hw, IXGBE_PCI_DEVICE_CACHE_LINE_SIZE));
	cache_line_size &= 0x00FF;
	cache_line_size *= PCI_DEVICE_CACHE_LINE_SIZE_BYTES;
	if(cache_line_size == 0) cache_line_size = 64;

	if(unlikely(enable_debug))
		printk("%s(): pci cache line size %d\n",__FUNCTION__, cache_line_size);

	/* Example figures from the article: slot length 1600, 8192 slots,
	 * chunk size 4096<<5 = 131072 bytes */
	rx_ring->dna.packet_slot_len  = ALIGN(rx_ring->rx_buf_len, cache_line_size);
	rx_ring->dna.packet_num_slots = rx_ring->count;
	rx_ring->dna.tot_packet_memory = PAGE_SIZE << DNA_MAX_CHUNK_ORDER;

	/* e.g. 131072/1600 = 81 slots per chunk */
	num_slots_per_page = rx_ring->dna.tot_packet_memory / rx_ring->dna.packet_slot_len;
	/* e.g. (8192+81-1)/81 = 102 chunks */
	rx_ring->dna.num_memory_pages = (rx_ring->dna.packet_num_slots + num_slots_per_page-1) / num_slots_per_page;

	/* Packet Split disabled in DNA mode */
	//if (ring_is_ps_enabled(rx_ring)) {
	/* data will be put in this buffer */
	/* Original function allocates PAGE_SIZE/2 for this buffer */
	//  rx_ring->dna.packet_slot_len += PAGE_SIZE/2;
	//}

	if(unlikely(enable_debug))
		printk("%s(): RX dna.packet_slot_len=%d tot_packet_memory=%d num_memory_pages=%u num_slots_per_page=%d\n",
		       __FUNCTION__,
		       rx_ring->dna.packet_slot_len,
		       rx_ring->dna.tot_packet_memory,
		       rx_ring->dna.num_memory_pages,
		       num_slots_per_page);

	/* Allocate every packet-memory chunk on this q_vector's NUMA node */
	for(i=0; i<rx_ring->dna.num_memory_pages; i++) {
		rx_ring->dna.rx_tx.rx.packet_memory[i] =
			alloc_contiguous_memory(&rx_ring->dna.tot_packet_memory,	/* chunk size */
						&rx_ring->dna.mem_order,		/* returns page order */
						rx_ring->q_vector->numa_node);		/* NUMA placement */

		if (rx_ring->dna.rx_tx.rx.packet_memory[i] == 0) {	/* allocation failed */
			printk("\n\n%s() ERROR: not enough memory for RX DMA ring!!\n\n\n",
			       __FUNCTION__);
			return;
		}

		if(unlikely(enable_debug))
			printk("[DNA] %s(): Successfully allocated RX %u@%u bytes at 0x%08lx [slot_len=%d]\n",
			       __FUNCTION__, rx_ring->dna.tot_packet_memory, i,
			       rx_ring->dna.rx_tx.rx.packet_memory[i],
			       rx_ring->dna.packet_slot_len);
	}

	if(unlikely(enable_debug))
		printk("[DNA] %s(): %s@%d ptr=%p memory allocated on node %d\n",
		       __FUNCTION__, rx_ring->netdev->name, rx_ring->queue_index,
		       rx_ring, rx_ring->q_vector->numa_node);

	/* DMA-map each of the rx_ring->count slots and mirror its
	 * descriptor into the shadow table */
	for(i=0; i < rx_ring->count; i++) {
		u_int offset, page_index;
		char *pkt;

		page_index = i / num_slots_per_page;	/* which chunk */
		offset = (i % num_slots_per_page) * rx_ring->dna.packet_slot_len;
		pkt = (char *)(rx_ring->dna.rx_tx.rx.packet_memory[page_index] + offset);	/* DMA buffer address */

		/*
		  if(unlikely(enable_debug))
		  printk("[DNA] %s(): Successfully remapped RX %u@%u bytes at 0x%08lx [slot_len=%d][page_index=%u][offset=%u]\n",
		  __FUNCTION__, rx_ring->dna.tot_packet_memory, i,
		  rx_ring->dna.rx_tx.rx.packet_memory[i],
		  rx_ring->dna.packet_slot_len, page_index, offset);
		*/

		bi = &rx_ring->rx_buffer_info[i];
		bi->skb = NULL;
		rx_desc = IXGBE_RX_DESC(rx_ring, i);

		if(unlikely(enable_debug))
			printk("%s(): Mapping RX slot %d of %d [pktaddr=%p][rx_desc=%p][offset=%u]\n",
			       __FUNCTION__, i, rx_ring->dna.packet_num_slots,
			       pkt, rx_desc, offset);

		/* streaming DMA mapping of the slot.
		 * NOTE(review): the original author questions why the mapping
		 * is created only once — presumably because DNA recycles the
		 * same buffers for the ring's lifetime; confirm against the
		 * PF_RING DNA design docs */
		bi->dma = pci_map_single(to_pci_dev(rx_ring->dev), pkt,
					 rx_ring->dna.packet_slot_len,	/* e.g. 1600 */
					 PCI_DMA_BIDIRECTIONAL /* PCI_DMA_FROMDEVICE */ );

		/* Packet Split disabled in DNA mode */
		//if (!ring_is_ps_enabled(rx_ring)) {
		rx_desc->read.hdr_addr = 0;
		rx_desc->read.pkt_addr = cpu_to_le64(bi->dma);
		//} else {
		//  rx_desc->read.hdr_addr = cpu_to_le64(bi->dma);
		//  rx_desc->read.pkt_addr = cpu_to_le64(bi->dma + rx_ring->dna.packet_slot_len);
		//}

		rx_desc->wb.upper.status_error = 0;

		/* the shadow descriptor table sits right after the real one;
		 * copy the freshly initialized descriptor into it */
		shadow_rx_desc = IXGBE_RX_DESC(rx_ring, i + rx_ring->count);
		memcpy(shadow_rx_desc, rx_desc, sizeof(union ixgbe_adv_rx_desc));

		if(unlikely(enable_debug)) {
			print_adv_rx_descr(rx_desc);
			print_adv_rx_descr(shadow_rx_desc);
		}

		ixgbe_release_rx_desc(rx_ring, i);
	} /* for */

	/* Shadow */
	rx_desc = IXGBE_RX_DESC(rx_ring, 0);

	/* Resetting index
	   rx_ring->next_to_use = the last slot where the next incoming packets can be copied (tail) */
	ixgbe_release_rx_desc(rx_ring, rx_ring->count-1);

	/* rx_ring->next_to_clean = the slot where the next incoming packet will be read (head) */
	rx_ring->next_to_clean = 0;

	/* Register with PF_RING */

	if(unlikely(enable_debug))
		printk("[DNA] next_to_clean=%u/next_to_use=%u [register=%d]\n",
		       rx_ring->next_to_clean, rx_ring->next_to_use,
		       IXGBE_READ_REG(hw, IXGBE_RDT(rx_ring->reg_idx)));

	/* Allocate TX memory with the same geometry as RX */
	tx_ring->dna.tot_packet_memory = rx_ring->dna.tot_packet_memory;
	tx_ring->dna.packet_slot_len   = rx_ring->dna.packet_slot_len;
	tx_ring->dna.packet_num_slots  = tx_ring->count;
	tx_ring->dna.mem_order         = rx_ring->dna.mem_order;
	tx_ring->dna.num_memory_pages  = (tx_ring->dna.packet_num_slots + num_slots_per_page-1) / num_slots_per_page;

	dna_ixgbe_alloc_tx_buffers(tx_ring, hook);

	rx_info.packet_memory_num_chunks    = rx_ring->dna.num_memory_pages;
	rx_info.packet_memory_chunk_len     = rx_ring->dna.tot_packet_memory;
	rx_info.packet_memory_num_slots     = rx_ring->dna.packet_num_slots;
	rx_info.packet_memory_slot_len      = rx_ring->dna.packet_slot_len;
	rx_info.descr_packet_memory_tot_len = 2 * rx_ring->size;

	tx_info.packet_memory_num_chunks    = tx_ring->dna.num_memory_pages;
	tx_info.packet_memory_chunk_len     = tx_ring->dna.tot_packet_memory;
	tx_info.packet_memory_num_slots     = tx_ring->dna.packet_num_slots;
	tx_info.packet_memory_slot_len      = tx_ring->dna.packet_slot_len;
	tx_info.descr_packet_memory_tot_len = 2 * tx_ring->size;

	/* Hand every piece of driver state to the PF_RING module via the
	 * dna_device_handler hook */
	hook->ring_dna_device_handler(add_device_mapping,
				      dna_v1,
				      &rx_info,
				      &tx_info,
				      rx_ring->dna.rx_tx.rx.packet_memory,	/* RX packet memory */
				      rx_ring->desc, /* Packet descriptors (RX) */
				      tx_ring->dna.rx_tx.tx.packet_memory,	/* TX packet memory */
				      tx_ring->desc, /* Packet descriptors (TX) */
				      (void*)rx_ring->netdev->mem_start,	/* NIC device memory */
				      rx_ring->netdev->mem_end - rx_ring->netdev->mem_start,
				      rx_ring->queue_index, /* Channel Id */
				      rx_ring->netdev,
				      rx_ring->dev, /* for DMA mapping */
				      dna_model(hw),
				      rx_ring->netdev->dev_addr,
				      &rx_ring->dna.rx_tx.rx.packet_waitqueue,
				      &rx_ring->dna.rx_tx.rx.interrupt_received,
				      (void*)rx_ring,
				      (void*)tx_ring,
				      wait_packet_function_ptr,
				      notify_function_ptr);

	rx_ring->dna.memory_allocated = 1;	/* never run this setup again */

	if(unlikely(enable_debug))
		printk("[DNA] ixgbe: %s: Enabled DNA on queue %d [RX][size=%u][count=%d] [TX][size=%u][count=%d]\n",
		       rx_ring->netdev->name, rx_ring->queue_index,
		       rx_ring->size, rx_ring->count,
		       tx_ring->size, tx_ring->count);

#if 0
	if(adapter->hw.mac.type != ixgbe_mac_82598EB)
		ixgbe_irq_disable_queues(rx_ring->q_vector->adapter,
					 ((u64)1 << rx_ring->queue_index));
#endif
}