tx_buff = &tx_pool->tx_buff[index];
                adapter->netdev->stats.tx_packets--;
                adapter->netdev->stats.tx_bytes -= tx_buff->skb->len;
-               adapter->tx_stats_buffers[queue_num].packets--;
+               adapter->tx_stats_buffers[queue_num].batched_packets--;
                adapter->tx_stats_buffers[queue_num].bytes -=
                                                tx_buff->skb->len;
                dev_kfree_skb_any(tx_buff->skb);
        unsigned int tx_map_failed = 0;
        union sub_crq indir_arr[16];
        unsigned int tx_dropped = 0;
-       unsigned int tx_packets = 0;
+       unsigned int tx_dpackets = 0;
+       unsigned int tx_bpackets = 0;
        unsigned int tx_bytes = 0;
        dma_addr_t data_dma_addr;
        struct netdev_queue *txq;
                if (lpar_rc != H_SUCCESS)
                        goto tx_err;
 
+               tx_dpackets++;
                goto early_exit;
        }
 
                        goto tx_err;
        }
 
+       tx_bpackets++;
+
 early_exit:
        if (atomic_add_return(num_entries, &tx_scrq->used)
                                        >= adapter->req_tx_entries_per_subcrq) {
                netif_stop_subqueue(netdev, queue_num);
        }
 
-       tx_packets++;
        tx_bytes += skb->len;
        txq_trans_cond_update(txq);
        ret = NETDEV_TX_OK;
        rcu_read_unlock();
        netdev->stats.tx_dropped += tx_dropped;
        netdev->stats.tx_bytes += tx_bytes;
-       netdev->stats.tx_packets += tx_packets;
+       netdev->stats.tx_packets += tx_bpackets + tx_dpackets;
        adapter->tx_send_failed += tx_send_failed;
        adapter->tx_map_failed += tx_map_failed;
-       adapter->tx_stats_buffers[queue_num].packets += tx_packets;
+       adapter->tx_stats_buffers[queue_num].batched_packets += tx_bpackets;
+       adapter->tx_stats_buffers[queue_num].direct_packets += tx_dpackets;
        adapter->tx_stats_buffers[queue_num].bytes += tx_bytes;
        adapter->tx_stats_buffers[queue_num].dropped_packets += tx_dropped;
 
                memcpy(data, ibmvnic_stats[i].name, ETH_GSTRING_LEN);
 
        for (i = 0; i < adapter->req_tx_queues; i++) {
-               snprintf(data, ETH_GSTRING_LEN, "tx%d_packets", i);
+               snprintf(data, ETH_GSTRING_LEN, "tx%d_batched_packets", i);
+               data += ETH_GSTRING_LEN;
+
+               snprintf(data, ETH_GSTRING_LEN, "tx%d_direct_packets", i);
                data += ETH_GSTRING_LEN;
 
                snprintf(data, ETH_GSTRING_LEN, "tx%d_bytes", i);
                                      (adapter, ibmvnic_stats[i].offset));
 
        for (j = 0; j < adapter->req_tx_queues; j++) {
-               data[i] = adapter->tx_stats_buffers[j].packets;
+               data[i] = adapter->tx_stats_buffers[j].batched_packets;
+               i++;
+               data[i] = adapter->tx_stats_buffers[j].direct_packets;
                i++;
                data[i] = adapter->tx_stats_buffers[j].bytes;
                i++;