mirror of
https://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
synced 2025-01-01 18:53:30 +00:00
net/smc: Use percpu ref for wr tx reference
The refcount wr_tx_refcnt may cause cache thrashing problems among cores, and we can use a percpu ref to mitigate this issue here. We gain some performance improvement with percpu ref on our customized smc-r version. Applying cache alignment may also mitigate this problem, but it seems more reasonable to use percpu ref here. We can also replace wr_reg_refcnt with one percpu reference like wr_tx_refcnt. redis-benchmark on smc-r with atomic wr_tx_refcnt: SET: 525707.06 requests per second, p50=0.087 msec; GET: 554877.38 requests per second, p50=0.087 msec. redis-benchmark on the percpu_ref version: SET: 540482.06 requests per second, p50=0.087 msec; GET: 570711.12 requests per second, p50=0.079 msec. Cases are like "redis-benchmark -h x.x.x.x -q -t set,get -P 1 -n 5000000 -c 50 -d 10 --threads 4". Signed-off-by: Kai Shen <KaiShen@linux.alibaba.com> Reviewed-by: Tony Lu <tonylu@linux.alibaba.com> Signed-off-by: David S. Miller <davem@davemloft.net>
This commit is contained in:
parent
d27d367d3b
commit
79a22238b4
@ -106,7 +106,10 @@ struct smc_link {
|
|||||||
unsigned long *wr_tx_mask; /* bit mask of used indexes */
|
unsigned long *wr_tx_mask; /* bit mask of used indexes */
|
||||||
u32 wr_tx_cnt; /* number of WR send buffers */
|
u32 wr_tx_cnt; /* number of WR send buffers */
|
||||||
wait_queue_head_t wr_tx_wait; /* wait for free WR send buf */
|
wait_queue_head_t wr_tx_wait; /* wait for free WR send buf */
|
||||||
atomic_t wr_tx_refcnt; /* tx refs to link */
|
struct {
|
||||||
|
struct percpu_ref wr_tx_refs;
|
||||||
|
} ____cacheline_aligned_in_smp;
|
||||||
|
struct completion tx_ref_comp;
|
||||||
|
|
||||||
struct smc_wr_buf *wr_rx_bufs; /* WR recv payload buffers */
|
struct smc_wr_buf *wr_rx_bufs; /* WR recv payload buffers */
|
||||||
struct ib_recv_wr *wr_rx_ibs; /* WR recv meta data */
|
struct ib_recv_wr *wr_rx_ibs; /* WR recv meta data */
|
||||||
@ -122,7 +125,10 @@ struct smc_link {
|
|||||||
|
|
||||||
struct ib_reg_wr wr_reg; /* WR register memory region */
|
struct ib_reg_wr wr_reg; /* WR register memory region */
|
||||||
wait_queue_head_t wr_reg_wait; /* wait for wr_reg result */
|
wait_queue_head_t wr_reg_wait; /* wait for wr_reg result */
|
||||||
atomic_t wr_reg_refcnt; /* reg refs to link */
|
struct {
|
||||||
|
struct percpu_ref wr_reg_refs;
|
||||||
|
} ____cacheline_aligned_in_smp;
|
||||||
|
struct completion reg_ref_comp;
|
||||||
enum smc_wr_reg_state wr_reg_state; /* state of wr_reg request */
|
enum smc_wr_reg_state wr_reg_state; /* state of wr_reg request */
|
||||||
|
|
||||||
u8 gid[SMC_GID_SIZE];/* gid matching used vlan id*/
|
u8 gid[SMC_GID_SIZE];/* gid matching used vlan id*/
|
||||||
|
@ -377,12 +377,11 @@ int smc_wr_reg_send(struct smc_link *link, struct ib_mr *mr)
|
|||||||
if (rc)
|
if (rc)
|
||||||
return rc;
|
return rc;
|
||||||
|
|
||||||
atomic_inc(&link->wr_reg_refcnt);
|
percpu_ref_get(&link->wr_reg_refs);
|
||||||
rc = wait_event_interruptible_timeout(link->wr_reg_wait,
|
rc = wait_event_interruptible_timeout(link->wr_reg_wait,
|
||||||
(link->wr_reg_state != POSTED),
|
(link->wr_reg_state != POSTED),
|
||||||
SMC_WR_REG_MR_WAIT_TIME);
|
SMC_WR_REG_MR_WAIT_TIME);
|
||||||
if (atomic_dec_and_test(&link->wr_reg_refcnt))
|
percpu_ref_put(&link->wr_reg_refs);
|
||||||
wake_up_all(&link->wr_reg_wait);
|
|
||||||
if (!rc) {
|
if (!rc) {
|
||||||
/* timeout - terminate link */
|
/* timeout - terminate link */
|
||||||
smcr_link_down_cond_sched(link);
|
smcr_link_down_cond_sched(link);
|
||||||
@ -647,8 +646,10 @@ void smc_wr_free_link(struct smc_link *lnk)
|
|||||||
smc_wr_wakeup_tx_wait(lnk);
|
smc_wr_wakeup_tx_wait(lnk);
|
||||||
|
|
||||||
smc_wr_tx_wait_no_pending_sends(lnk);
|
smc_wr_tx_wait_no_pending_sends(lnk);
|
||||||
wait_event(lnk->wr_reg_wait, (!atomic_read(&lnk->wr_reg_refcnt)));
|
percpu_ref_kill(&lnk->wr_reg_refs);
|
||||||
wait_event(lnk->wr_tx_wait, (!atomic_read(&lnk->wr_tx_refcnt)));
|
wait_for_completion(&lnk->reg_ref_comp);
|
||||||
|
percpu_ref_kill(&lnk->wr_tx_refs);
|
||||||
|
wait_for_completion(&lnk->tx_ref_comp);
|
||||||
|
|
||||||
if (lnk->wr_rx_dma_addr) {
|
if (lnk->wr_rx_dma_addr) {
|
||||||
ib_dma_unmap_single(ibdev, lnk->wr_rx_dma_addr,
|
ib_dma_unmap_single(ibdev, lnk->wr_rx_dma_addr,
|
||||||
@ -847,6 +848,20 @@ void smc_wr_add_dev(struct smc_ib_device *smcibdev)
|
|||||||
tasklet_setup(&smcibdev->send_tasklet, smc_wr_tx_tasklet_fn);
|
tasklet_setup(&smcibdev->send_tasklet, smc_wr_tx_tasklet_fn);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static void smcr_wr_tx_refs_free(struct percpu_ref *ref)
|
||||||
|
{
|
||||||
|
struct smc_link *lnk = container_of(ref, struct smc_link, wr_tx_refs);
|
||||||
|
|
||||||
|
complete(&lnk->tx_ref_comp);
|
||||||
|
}
|
||||||
|
|
||||||
|
static void smcr_wr_reg_refs_free(struct percpu_ref *ref)
|
||||||
|
{
|
||||||
|
struct smc_link *lnk = container_of(ref, struct smc_link, wr_reg_refs);
|
||||||
|
|
||||||
|
complete(&lnk->reg_ref_comp);
|
||||||
|
}
|
||||||
|
|
||||||
int smc_wr_create_link(struct smc_link *lnk)
|
int smc_wr_create_link(struct smc_link *lnk)
|
||||||
{
|
{
|
||||||
struct ib_device *ibdev = lnk->smcibdev->ibdev;
|
struct ib_device *ibdev = lnk->smcibdev->ibdev;
|
||||||
@ -890,9 +905,15 @@ int smc_wr_create_link(struct smc_link *lnk)
|
|||||||
smc_wr_init_sge(lnk);
|
smc_wr_init_sge(lnk);
|
||||||
bitmap_zero(lnk->wr_tx_mask, SMC_WR_BUF_CNT);
|
bitmap_zero(lnk->wr_tx_mask, SMC_WR_BUF_CNT);
|
||||||
init_waitqueue_head(&lnk->wr_tx_wait);
|
init_waitqueue_head(&lnk->wr_tx_wait);
|
||||||
atomic_set(&lnk->wr_tx_refcnt, 0);
|
rc = percpu_ref_init(&lnk->wr_tx_refs, smcr_wr_tx_refs_free, 0, GFP_KERNEL);
|
||||||
|
if (rc)
|
||||||
|
goto dma_unmap;
|
||||||
|
init_completion(&lnk->tx_ref_comp);
|
||||||
init_waitqueue_head(&lnk->wr_reg_wait);
|
init_waitqueue_head(&lnk->wr_reg_wait);
|
||||||
atomic_set(&lnk->wr_reg_refcnt, 0);
|
rc = percpu_ref_init(&lnk->wr_reg_refs, smcr_wr_reg_refs_free, 0, GFP_KERNEL);
|
||||||
|
if (rc)
|
||||||
|
goto dma_unmap;
|
||||||
|
init_completion(&lnk->reg_ref_comp);
|
||||||
init_waitqueue_head(&lnk->wr_rx_empty_wait);
|
init_waitqueue_head(&lnk->wr_rx_empty_wait);
|
||||||
return rc;
|
return rc;
|
||||||
|
|
||||||
|
@ -63,14 +63,13 @@ static inline bool smc_wr_tx_link_hold(struct smc_link *link)
|
|||||||
{
|
{
|
||||||
if (!smc_link_sendable(link))
|
if (!smc_link_sendable(link))
|
||||||
return false;
|
return false;
|
||||||
atomic_inc(&link->wr_tx_refcnt);
|
percpu_ref_get(&link->wr_tx_refs);
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
|
||||||
static inline void smc_wr_tx_link_put(struct smc_link *link)
|
static inline void smc_wr_tx_link_put(struct smc_link *link)
|
||||||
{
|
{
|
||||||
if (atomic_dec_and_test(&link->wr_tx_refcnt))
|
percpu_ref_put(&link->wr_tx_refs);
|
||||||
wake_up_all(&link->wr_tx_wait);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
static inline void smc_wr_drain_cq(struct smc_link *lnk)
|
static inline void smc_wr_drain_cq(struct smc_link *lnk)
|
||||||
|
Loading…
Reference in New Issue
Block a user