mlx5en: Optimise away duplicate UAR pointers.

This change also reduces the size of the mlx5e_sq structure so that the last
queue_state element will fit into the previous cacheline and then the mlx5e_sq
structure becomes one cacheline less for amd64.

Sponsored by:	Mellanox Technologies
MFC after:	1 week
This commit is contained in:
Hans Petter Selasky 2016-09-16 11:40:45 +00:00
parent 28f22ccea3
commit 5eadc44ceb
2 changed files with 3 additions and 7 deletions

View File

@ -528,8 +528,7 @@ struct mlx5e_sq {
/* read only */ /* read only */
struct mlx5_wq_cyc wq; struct mlx5_wq_cyc wq;
void __iomem *uar_map; struct mlx5_uar uar;
void __iomem *uar_bf_map;
struct ifnet *ifp; struct ifnet *ifp;
u32 sqn; u32 sqn;
u32 bf_buf_size; u32 bf_buf_size;
@ -538,7 +537,6 @@ struct mlx5e_sq {
/* control path */ /* control path */
struct mlx5_wq_ctrl wq_ctrl; struct mlx5_wq_ctrl wq_ctrl;
struct mlx5_uar uar;
struct mlx5e_priv *priv; struct mlx5e_priv *priv;
int tc; int tc;
unsigned int queue_state; unsigned int queue_state;
@ -780,13 +778,13 @@ mlx5e_tx_notify_hw(struct mlx5e_sq *sq, u32 *wqe, int bf_sz)
wmb(); wmb();
if (bf_sz) { if (bf_sz) {
__iowrite64_copy(sq->uar_bf_map + ofst, wqe, bf_sz); __iowrite64_copy(sq->uar.bf_map + ofst, wqe, bf_sz);
/* flush the write-combining mapped buffer */ /* flush the write-combining mapped buffer */
wmb(); wmb();
} else { } else {
mlx5_write64(wqe, sq->uar_map + ofst, NULL); mlx5_write64(wqe, sq->uar.map + ofst, NULL);
} }
sq->bf_offset ^= sq->bf_buf_size; sq->bf_offset ^= sq->bf_buf_size;

View File

@ -956,8 +956,6 @@ mlx5e_create_sq(struct mlx5e_channel *c,
goto err_unmap_free_uar; goto err_unmap_free_uar;
sq->wq.db = &sq->wq.db[MLX5_SND_DBR]; sq->wq.db = &sq->wq.db[MLX5_SND_DBR];
sq->uar_map = sq->uar.map;
sq->uar_bf_map = sq->uar.bf_map;
sq->bf_buf_size = (1 << MLX5_CAP_GEN(mdev, log_bf_reg_size)) / 2; sq->bf_buf_size = (1 << MLX5_CAP_GEN(mdev, log_bf_reg_size)) / 2;
err = mlx5e_alloc_sq_db(sq); err = mlx5e_alloc_sq_db(sq);