linux-rdma.vger.kernel.org archive mirror
 help / color / mirror / Atom feed
* [PATCH V3] IB/mlx4: Use vmalloc for WR buffers when needed
@ 2015-10-08  5:27 Wengang Wang
       [not found] ` <1444282024-11425-1-git-send-email-wen.gang.wang-QHcLZuEGTsvQT0dZR+AlfA@public.gmane.org>
  0 siblings, 1 reply; 3+ messages in thread
From: Wengang Wang @ 2015-10-08  5:27 UTC (permalink / raw)
  To: linux-rdma-u79uwXL29TY76Z2rM5mHXA; +Cc: wen.gang.wang-QHcLZuEGTsvQT0dZR+AlfA

There are several hits that WR buffer allocation(kmalloc) failed.
It failed at order 3 and/or 4 contigous pages allocation. At the same time
there are actually 100MB+ free memory but well fragmented.
So try vmalloc when kmalloc failed.

Signed-off-by: Wengang Wang <wen.gang.wang-QHcLZuEGTsvQT0dZR+AlfA@public.gmane.org>
Acked-by: Or Gerlitz <ogerlitz-VPRAkNaXOzVWk0Htik3J/w@public.gmane.org>
---
 drivers/infiniband/hw/mlx4/qp.c  | 19 +++++++++++++------
 drivers/infiniband/hw/mlx4/srq.c | 11 ++++++++---
 2 files changed, 21 insertions(+), 9 deletions(-)

diff --git a/drivers/infiniband/hw/mlx4/qp.c b/drivers/infiniband/hw/mlx4/qp.c
index 4ad9be3..3ccbd3a 100644
--- a/drivers/infiniband/hw/mlx4/qp.c
+++ b/drivers/infiniband/hw/mlx4/qp.c
@@ -34,6 +34,7 @@
 #include <linux/log2.h>
 #include <linux/slab.h>
 #include <linux/netdevice.h>
+#include <linux/vmalloc.h>
 
 #include <rdma/ib_cache.h>
 #include <rdma/ib_pack.h>
@@ -786,8 +787,14 @@ static int create_qp_common(struct mlx4_ib_dev *dev, struct ib_pd *pd,
 		if (err)
 			goto err_mtt;
 
-		qp->sq.wrid  = kmalloc(qp->sq.wqe_cnt * sizeof (u64), gfp);
-		qp->rq.wrid  = kmalloc(qp->rq.wqe_cnt * sizeof (u64), gfp);
+		qp->sq.wrid = kmalloc(qp->sq.wqe_cnt * sizeof(u64), gfp);
+		if (!qp->sq.wrid)
+			qp->sq.wrid = __vmalloc(qp->sq.wqe_cnt * sizeof(u64),
+						gfp, PAGE_KERNEL);
+		qp->rq.wrid = kmalloc(qp->rq.wqe_cnt * sizeof(u64), gfp);
+		if (!qp->rq.wrid)
+			qp->rq.wrid = __vmalloc(qp->rq.wqe_cnt * sizeof(u64),
+						gfp, PAGE_KERNEL);
 		if (!qp->sq.wrid || !qp->rq.wrid) {
 			err = -ENOMEM;
 			goto err_wrid;
@@ -874,8 +881,8 @@ err_wrid:
 		if (qp_has_rq(init_attr))
 			mlx4_ib_db_unmap_user(to_mucontext(pd->uobject->context), &qp->db);
 	} else {
-		kfree(qp->sq.wrid);
-		kfree(qp->rq.wrid);
+		kvfree(qp->sq.wrid);
+		kvfree(qp->rq.wrid);
 	}
 
 err_mtt:
@@ -1050,8 +1057,8 @@ static void destroy_qp_common(struct mlx4_ib_dev *dev, struct mlx4_ib_qp *qp,
 					      &qp->db);
 		ib_umem_release(qp->umem);
 	} else {
-		kfree(qp->sq.wrid);
-		kfree(qp->rq.wrid);
+		kvfree(qp->sq.wrid);
+		kvfree(qp->rq.wrid);
 		if (qp->mlx4_ib_qp_type & (MLX4_IB_QPT_PROXY_SMI_OWNER |
 		    MLX4_IB_QPT_PROXY_SMI | MLX4_IB_QPT_PROXY_GSI))
 			free_proxy_bufs(&dev->ib_dev, qp);
diff --git a/drivers/infiniband/hw/mlx4/srq.c b/drivers/infiniband/hw/mlx4/srq.c
index dce5dfe..8d133c4 100644
--- a/drivers/infiniband/hw/mlx4/srq.c
+++ b/drivers/infiniband/hw/mlx4/srq.c
@@ -34,6 +34,7 @@
 #include <linux/mlx4/qp.h>
 #include <linux/mlx4/srq.h>
 #include <linux/slab.h>
+#include <linux/vmalloc.h>
 
 #include "mlx4_ib.h"
 #include "user.h"
@@ -172,8 +173,12 @@ struct ib_srq *mlx4_ib_create_srq(struct ib_pd *pd,
 
 		srq->wrid = kmalloc(srq->msrq.max * sizeof (u64), GFP_KERNEL);
 		if (!srq->wrid) {
-			err = -ENOMEM;
-			goto err_mtt;
+			srq->wrid = __vmalloc(srq->msrq.max * sizeof(u64),
+					      GFP_KERNEL, PAGE_KERNEL);
+			if (!srq->wrid) {
+				err = -ENOMEM;
+				goto err_mtt;
+			}
 		}
 	}
 
@@ -204,7 +209,7 @@ err_wrid:
 	if (pd->uobject)
 		mlx4_ib_db_unmap_user(to_mucontext(pd->uobject->context), &srq->db);
 	else
-		kfree(srq->wrid);
+		kvfree(srq->wrid);
 
 err_mtt:
 	mlx4_mtt_cleanup(dev->dev, &srq->mtt);
-- 
2.1.0

--
To unsubscribe from this list: send the line "unsubscribe linux-rdma" in
the body of a message to majordomo-u79uwXL29TY76Z2rM5mHXA@public.gmane.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

^ permalink raw reply related	[flat|nested] 3+ messages in thread

* Re: [PATCH V3] IB/mlx4: Use vmalloc for WR buffers when needed
       [not found] ` <1444282024-11425-1-git-send-email-wen.gang.wang-QHcLZuEGTsvQT0dZR+AlfA@public.gmane.org>
@ 2015-12-11 20:28   ` Matthew Finlay
       [not found]     ` <17CFA44C-D58F-49C0-B3CE-95D38C08E16B-VPRAkNaXOzVWk0Htik3J/w@public.gmane.org>
  0 siblings, 1 reply; 3+ messages in thread
From: Matthew Finlay @ 2015-12-11 20:28 UTC (permalink / raw)
  To: Wengang Wang, linux-rdma-u79uwXL29TY76Z2rM5mHXA

Hi Wengang,

I was going through your patch set here, and it seems that you missed changing kfree to kvfree in mlx4_ib_destroy_srq().  In the current code if the srq wrid is allocated using vmalloc, then on cleanup we will use kfree, which is a bug.

Thanks,
-matt




On 10/7/15, 10:27 PM, "linux-rdma-owner@vger.kernel.org on behalf of Wengang Wang" <linux-rdma-owner@vger.kernel.org on behalf of wen.gang.wang@oracle.com> wrote:

>There are several hits that WR buffer allocation(kmalloc) failed.
>It failed at order 3 and/or 4 contigous pages allocation. At the same time
>there are actually 100MB+ free memory but well fragmented.
>So try vmalloc when kmalloc failed.
>
>Signed-off-by: Wengang Wang <wen.gang.wang@oracle.com>
>Acked-by: Or Gerlitz <ogerlitz@mellanox.com>
>---
> drivers/infiniband/hw/mlx4/qp.c  | 19 +++++++++++++------
> drivers/infiniband/hw/mlx4/srq.c | 11 ++++++++---
> 2 files changed, 21 insertions(+), 9 deletions(-)
>
>diff --git a/drivers/infiniband/hw/mlx4/qp.c b/drivers/infiniband/hw/mlx4/qp.c
>index 4ad9be3..3ccbd3a 100644
>--- a/drivers/infiniband/hw/mlx4/qp.c
>+++ b/drivers/infiniband/hw/mlx4/qp.c
>@@ -34,6 +34,7 @@
> #include <linux/log2.h>
> #include <linux/slab.h>
> #include <linux/netdevice.h>
>+#include <linux/vmalloc.h>
> 
> #include <rdma/ib_cache.h>
> #include <rdma/ib_pack.h>
>@@ -786,8 +787,14 @@ static int create_qp_common(struct mlx4_ib_dev *dev, struct ib_pd *pd,
> 		if (err)
> 			goto err_mtt;
> 
>-		qp->sq.wrid  = kmalloc(qp->sq.wqe_cnt * sizeof (u64), gfp);
>-		qp->rq.wrid  = kmalloc(qp->rq.wqe_cnt * sizeof (u64), gfp);
>+		qp->sq.wrid = kmalloc(qp->sq.wqe_cnt * sizeof(u64), gfp);
>+		if (!qp->sq.wrid)
>+			qp->sq.wrid = __vmalloc(qp->sq.wqe_cnt * sizeof(u64),
>+						gfp, PAGE_KERNEL);
>+		qp->rq.wrid = kmalloc(qp->rq.wqe_cnt * sizeof(u64), gfp);
>+		if (!qp->rq.wrid)
>+			qp->rq.wrid = __vmalloc(qp->rq.wqe_cnt * sizeof(u64),
>+						gfp, PAGE_KERNEL);
> 		if (!qp->sq.wrid || !qp->rq.wrid) {
> 			err = -ENOMEM;
> 			goto err_wrid;
>@@ -874,8 +881,8 @@ err_wrid:
> 		if (qp_has_rq(init_attr))
> 			mlx4_ib_db_unmap_user(to_mucontext(pd->uobject->context), &qp->db);
> 	} else {
>-		kfree(qp->sq.wrid);
>-		kfree(qp->rq.wrid);
>+		kvfree(qp->sq.wrid);
>+		kvfree(qp->rq.wrid);
> 	}
> 
> err_mtt:
>@@ -1050,8 +1057,8 @@ static void destroy_qp_common(struct mlx4_ib_dev *dev, struct mlx4_ib_qp *qp,
> 					      &qp->db);
> 		ib_umem_release(qp->umem);
> 	} else {
>-		kfree(qp->sq.wrid);
>-		kfree(qp->rq.wrid);
>+		kvfree(qp->sq.wrid);
>+		kvfree(qp->rq.wrid);
> 		if (qp->mlx4_ib_qp_type & (MLX4_IB_QPT_PROXY_SMI_OWNER |
> 		    MLX4_IB_QPT_PROXY_SMI | MLX4_IB_QPT_PROXY_GSI))
> 			free_proxy_bufs(&dev->ib_dev, qp);
>diff --git a/drivers/infiniband/hw/mlx4/srq.c b/drivers/infiniband/hw/mlx4/srq.c
>index dce5dfe..8d133c4 100644
>--- a/drivers/infiniband/hw/mlx4/srq.c
>+++ b/drivers/infiniband/hw/mlx4/srq.c
>@@ -34,6 +34,7 @@
> #include <linux/mlx4/qp.h>
> #include <linux/mlx4/srq.h>
> #include <linux/slab.h>
>+#include <linux/vmalloc.h>
> 
> #include "mlx4_ib.h"
> #include "user.h"
>@@ -172,8 +173,12 @@ struct ib_srq *mlx4_ib_create_srq(struct ib_pd *pd,
> 
> 		srq->wrid = kmalloc(srq->msrq.max * sizeof (u64), GFP_KERNEL);
> 		if (!srq->wrid) {
>-			err = -ENOMEM;
>-			goto err_mtt;
>+			srq->wrid = __vmalloc(srq->msrq.max * sizeof(u64),
>+					      GFP_KERNEL, PAGE_KERNEL);
>+			if (!srq->wrid) {
>+				err = -ENOMEM;
>+				goto err_mtt;
>+			}
> 		}
> 	}
> 
>@@ -204,7 +209,7 @@ err_wrid:
> 	if (pd->uobject)
> 		mlx4_ib_db_unmap_user(to_mucontext(pd->uobject->context), &srq->db);
> 	else
>-		kfree(srq->wrid);
>+		kvfree(srq->wrid);
> 
> err_mtt:
> 	mlx4_mtt_cleanup(dev->dev, &srq->mtt);
>-- 
>2.1.0
>
>--
>To unsubscribe from this list: send the line "unsubscribe linux-rdma" in
>the body of a message to majordomo@vger.kernel.org
>More majordomo info at  http://vger.kernel.org/majordomo-info.html

^ permalink raw reply	[flat|nested] 3+ messages in thread

* Re: [PATCH V3] IB/mlx4: Use vmalloc for WR buffers when needed
       [not found]     ` <17CFA44C-D58F-49C0-B3CE-95D38C08E16B-VPRAkNaXOzVWk0Htik3J/w@public.gmane.org>
@ 2015-12-17  2:39       ` Wengang Wang
  0 siblings, 0 replies; 3+ messages in thread
From: Wengang Wang @ 2015-12-17  2:39 UTC (permalink / raw)
  To: Matthew Finlay, linux-rdma-u79uwXL29TY76Z2rM5mHXA

Hi Matt,

Yes, you are right.
Since the patch is already merged in, I am going to make a separated 
patch for that.

thanks,
wengang

在 2015年12月12日 04:28, Matthew Finlay 写道:
> Hi Wengang,
>
> I was going through your patch set here, and it seems that you missed changing kfree to kvfree in mlx4_ib_destroy_srq().  In the current code if the srq wrid is allocated using vmalloc, then on cleanup we will use kfree, which is a bug.
>
> Thanks,
> -matt
>
>
>
>
> On 10/7/15, 10:27 PM, "linux-rdma-owner-u79uwXL29TY76Z2rM5mHXA@public.gmane.org on behalf of Wengang Wang" <linux-rdma-owner-u79uwXL29TY76Z2rM5mHXA@public.gmane.org on behalf of wen.gang.wang-QHcLZuEGTsvQT0dZR+AlfA@public.gmane.org> wrote:
>
>> There are several hits that WR buffer allocation(kmalloc) failed.
>> It failed at order 3 and/or 4 contigous pages allocation. At the same time
>> there are actually 100MB+ free memory but well fragmented.
>> So try vmalloc when kmalloc failed.
>>
>> Signed-off-by: Wengang Wang <wen.gang.wang-QHcLZuEGTsvQT0dZR+AlfA@public.gmane.org>
>> Acked-by: Or Gerlitz <ogerlitz-VPRAkNaXOzVWk0Htik3J/w@public.gmane.org>
>> ---
>> drivers/infiniband/hw/mlx4/qp.c  | 19 +++++++++++++------
>> drivers/infiniband/hw/mlx4/srq.c | 11 ++++++++---
>> 2 files changed, 21 insertions(+), 9 deletions(-)
>>
>> diff --git a/drivers/infiniband/hw/mlx4/qp.c b/drivers/infiniband/hw/mlx4/qp.c
>> index 4ad9be3..3ccbd3a 100644
>> --- a/drivers/infiniband/hw/mlx4/qp.c
>> +++ b/drivers/infiniband/hw/mlx4/qp.c
>> @@ -34,6 +34,7 @@
>> #include <linux/log2.h>
>> #include <linux/slab.h>
>> #include <linux/netdevice.h>
>> +#include <linux/vmalloc.h>
>>
>> #include <rdma/ib_cache.h>
>> #include <rdma/ib_pack.h>
>> @@ -786,8 +787,14 @@ static int create_qp_common(struct mlx4_ib_dev *dev, struct ib_pd *pd,
>> 		if (err)
>> 			goto err_mtt;
>>
>> -		qp->sq.wrid  = kmalloc(qp->sq.wqe_cnt * sizeof (u64), gfp);
>> -		qp->rq.wrid  = kmalloc(qp->rq.wqe_cnt * sizeof (u64), gfp);
>> +		qp->sq.wrid = kmalloc(qp->sq.wqe_cnt * sizeof(u64), gfp);
>> +		if (!qp->sq.wrid)
>> +			qp->sq.wrid = __vmalloc(qp->sq.wqe_cnt * sizeof(u64),
>> +						gfp, PAGE_KERNEL);
>> +		qp->rq.wrid = kmalloc(qp->rq.wqe_cnt * sizeof(u64), gfp);
>> +		if (!qp->rq.wrid)
>> +			qp->rq.wrid = __vmalloc(qp->rq.wqe_cnt * sizeof(u64),
>> +						gfp, PAGE_KERNEL);
>> 		if (!qp->sq.wrid || !qp->rq.wrid) {
>> 			err = -ENOMEM;
>> 			goto err_wrid;
>> @@ -874,8 +881,8 @@ err_wrid:
>> 		if (qp_has_rq(init_attr))
>> 			mlx4_ib_db_unmap_user(to_mucontext(pd->uobject->context), &qp->db);
>> 	} else {
>> -		kfree(qp->sq.wrid);
>> -		kfree(qp->rq.wrid);
>> +		kvfree(qp->sq.wrid);
>> +		kvfree(qp->rq.wrid);
>> 	}
>>
>> err_mtt:
>> @@ -1050,8 +1057,8 @@ static void destroy_qp_common(struct mlx4_ib_dev *dev, struct mlx4_ib_qp *qp,
>> 					      &qp->db);
>> 		ib_umem_release(qp->umem);
>> 	} else {
>> -		kfree(qp->sq.wrid);
>> -		kfree(qp->rq.wrid);
>> +		kvfree(qp->sq.wrid);
>> +		kvfree(qp->rq.wrid);
>> 		if (qp->mlx4_ib_qp_type & (MLX4_IB_QPT_PROXY_SMI_OWNER |
>> 		    MLX4_IB_QPT_PROXY_SMI | MLX4_IB_QPT_PROXY_GSI))
>> 			free_proxy_bufs(&dev->ib_dev, qp);
>> diff --git a/drivers/infiniband/hw/mlx4/srq.c b/drivers/infiniband/hw/mlx4/srq.c
>> index dce5dfe..8d133c4 100644
>> --- a/drivers/infiniband/hw/mlx4/srq.c
>> +++ b/drivers/infiniband/hw/mlx4/srq.c
>> @@ -34,6 +34,7 @@
>> #include <linux/mlx4/qp.h>
>> #include <linux/mlx4/srq.h>
>> #include <linux/slab.h>
>> +#include <linux/vmalloc.h>
>>
>> #include "mlx4_ib.h"
>> #include "user.h"
>> @@ -172,8 +173,12 @@ struct ib_srq *mlx4_ib_create_srq(struct ib_pd *pd,
>>
>> 		srq->wrid = kmalloc(srq->msrq.max * sizeof (u64), GFP_KERNEL);
>> 		if (!srq->wrid) {
>> -			err = -ENOMEM;
>> -			goto err_mtt;
>> +			srq->wrid = __vmalloc(srq->msrq.max * sizeof(u64),
>> +					      GFP_KERNEL, PAGE_KERNEL);
>> +			if (!srq->wrid) {
>> +				err = -ENOMEM;
>> +				goto err_mtt;
>> +			}
>> 		}
>> 	}
>>
>> @@ -204,7 +209,7 @@ err_wrid:
>> 	if (pd->uobject)
>> 		mlx4_ib_db_unmap_user(to_mucontext(pd->uobject->context), &srq->db);
>> 	else
>> -		kfree(srq->wrid);
>> +		kvfree(srq->wrid);
>>
>> err_mtt:
>> 	mlx4_mtt_cleanup(dev->dev, &srq->mtt);
>> -- 
>> 2.1.0
>>
>> --
>> To unsubscribe from this list: send the line "unsubscribe linux-rdma" in
>> the body of a message to majordomo-u79uwXL29TY76Z2rM5mHXA@public.gmane.org
>> More majordomo info at  http://vger.kernel.org/majordomo-info.html
> N�����r��y���b�X��ǧv�^�)޺{.n�+����{��ٚ�{ay�\x1dʇڙ�,j\a��f���h���z�\x1e�w���\f���j:+v���w�j�m����\a����zZ+�����ݢj"��!tml=

--
To unsubscribe from this list: send the line "unsubscribe linux-rdma" in
the body of a message to majordomo-u79uwXL29TY76Z2rM5mHXA@public.gmane.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

^ permalink raw reply	[flat|nested] 3+ messages in thread

end of thread, other threads:[~2015-12-17  2:39 UTC | newest]

Thread overview: 3+ messages (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2015-10-08  5:27 [PATCH V3] IB/mlx4: Use vmalloc for WR buffers when needed Wengang Wang
     [not found] ` <1444282024-11425-1-git-send-email-wen.gang.wang-QHcLZuEGTsvQT0dZR+AlfA@public.gmane.org>
2015-12-11 20:28   ` Matthew Finlay
     [not found]     ` <17CFA44C-D58F-49C0-B3CE-95D38C08E16B-VPRAkNaXOzVWk0Htik3J/w@public.gmane.org>
2015-12-17  2:39       ` Wengang Wang

This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).