From: Hillf Danton <hdanton@sina.com>
To: Mina Almasry <almasrymina@google.com>
Cc: mike.kravetz@oracle.com, shuah@kernel.org, rientjes@google.com,
shakeelb@google.com, gthelen@google.com,
akpm@linux-foundation.org, khalid.aziz@oracle.com,
linux-kernel@vger.kernel.org, linux-mm@kvack.org,
linux-kselftest@vger.kernel.org
Subject: Re: [RFC PATCH v2 1/5] hugetlb_cgroup: Add hugetlb_cgroup reservation counter
Date: Thu, 15 Aug 2019 11:53:52 +0800 [thread overview]
Message-ID: <20190815035352.14952-1-hdanton@sina.com> (raw)
In-Reply-To: <20190808231340.53601-1-almasrymina@google.com>
On Thu, 8 Aug 2019 16:13:36 -0700 Mina Almasry wrote:
>
> These counters will track hugetlb reservations rather than hugetlb
> memory faulted in. This patch only adds the counter, following patches
> add the charging and uncharging of the counter.
> ---
!?!
> include/linux/hugetlb.h | 2 +-
> mm/hugetlb_cgroup.c | 86 +++++++++++++++++++++++++++++++++++++----
> 2 files changed, 80 insertions(+), 8 deletions(-)
>
> diff --git a/include/linux/hugetlb.h b/include/linux/hugetlb.h
> index edfca42783192..6777b3013345d 100644
> --- a/include/linux/hugetlb.h
> +++ b/include/linux/hugetlb.h
> @@ -340,7 +340,7 @@ struct hstate {
> unsigned int surplus_huge_pages_node[MAX_NUMNODES];
> #ifdef CONFIG_CGROUP_HUGETLB
> /* cgroup control files */
> - struct cftype cgroup_files[5];
> + struct cftype cgroup_files[9];
Move that enum into this header file and replace the numbers with symbolic
names to ease both reading and maintenance.
> #endif
> char name[HSTATE_NAME_LEN];
> };
> diff --git a/mm/hugetlb_cgroup.c b/mm/hugetlb_cgroup.c
> index 68c2f2f3c05b7..708103663988a 100644
> --- a/mm/hugetlb_cgroup.c
> +++ b/mm/hugetlb_cgroup.c
> @@ -25,6 +25,10 @@ struct hugetlb_cgroup {
> * the counter to account for hugepages from hugetlb.
> */
> struct page_counter hugepage[HUGE_MAX_HSTATE];
> + /*
> + * the counter to account for hugepage reservations from hugetlb.
> + */
> + struct page_counter reserved_hugepage[HUGE_MAX_HSTATE];
> };
>
> #define MEMFILE_PRIVATE(x, val) (((x) << 16) | (val))
> @@ -33,6 +37,15 @@ struct hugetlb_cgroup {
>
> static struct hugetlb_cgroup *root_h_cgroup __read_mostly;
>
> +static inline
> +struct page_counter *get_counter(struct hugetlb_cgroup *h_cg, int idx,
> + bool reserved)
s/get_/hugetlb_cgroup_get_/ so that the name is not too generic.
> +{
> + if (reserved)
> + return &h_cg->reserved_hugepage[idx];
> + return &h_cg->hugepage[idx];
> +}
> +
> static inline
> struct hugetlb_cgroup *hugetlb_cgroup_from_css(struct cgroup_subsys_state *s)
> {
> @@ -256,28 +269,42 @@ void hugetlb_cgroup_uncharge_cgroup(int idx, unsigned long nr_pages,
>
> enum {
> RES_USAGE,
> + RES_RESERVATION_USAGE,
> RES_LIMIT,
> + RES_RESERVATION_LIMIT,
> RES_MAX_USAGE,
> + RES_RESERVATION_MAX_USAGE,
> RES_FAILCNT,
> + RES_RESERVATION_FAILCNT,
> };
>
> static u64 hugetlb_cgroup_read_u64(struct cgroup_subsys_state *css,
> struct cftype *cft)
> {
> struct page_counter *counter;
> + struct page_counter *reserved_counter;
> struct hugetlb_cgroup *h_cg = hugetlb_cgroup_from_css(css);
>
> counter = &h_cg->hugepage[MEMFILE_IDX(cft->private)];
> + reserved_counter = &h_cg->reserved_hugepage[MEMFILE_IDX(cft->private)];
>
> switch (MEMFILE_ATTR(cft->private)) {
> case RES_USAGE:
> return (u64)page_counter_read(counter) * PAGE_SIZE;
> + case RES_RESERVATION_USAGE:
> + return (u64)page_counter_read(reserved_counter) * PAGE_SIZE;
> case RES_LIMIT:
> return (u64)counter->max * PAGE_SIZE;
> + case RES_RESERVATION_LIMIT:
> + return (u64)reserved_counter->max * PAGE_SIZE;
> case RES_MAX_USAGE:
> return (u64)counter->watermark * PAGE_SIZE;
> + case RES_RESERVATION_MAX_USAGE:
> + return (u64)reserved_counter->watermark * PAGE_SIZE;
> case RES_FAILCNT:
> return counter->failcnt;
> + case RES_RESERVATION_FAILCNT:
> + return reserved_counter->failcnt;
> default:
> BUG();
> }
> @@ -291,6 +318,7 @@ static ssize_t hugetlb_cgroup_write(struct kernfs_open_file *of,
> int ret, idx;
> unsigned long nr_pages;
> struct hugetlb_cgroup *h_cg = hugetlb_cgroup_from_css(of_css(of));
> + bool reserved = false;
>
> if (hugetlb_cgroup_is_root(h_cg)) /* Can't set limit on root */
> return -EINVAL;
> @@ -303,10 +331,16 @@ static ssize_t hugetlb_cgroup_write(struct kernfs_open_file *of,
> idx = MEMFILE_IDX(of_cft(of)->private);
> nr_pages = round_down(nr_pages, 1 << huge_page_order(&hstates[idx]));
>
> + if (MEMFILE_ATTR(of_cft(of)->private) == RES_RESERVATION_LIMIT) {
> + reserved = true;
> + }
> +
> switch (MEMFILE_ATTR(of_cft(of)->private)) {
> + case RES_RESERVATION_LIMIT:
reserved = true;
/* fall thru */
> case RES_LIMIT:
> mutex_lock(&hugetlb_limit_mutex);
> - ret = page_counter_set_max(&h_cg->hugepage[idx], nr_pages);
> + ret = page_counter_set_max(get_counter(h_cg, idx, reserved),
> + nr_pages);
> mutex_unlock(&hugetlb_limit_mutex);
> break;
> default:
> @@ -320,18 +354,26 @@ static ssize_t hugetlb_cgroup_reset(struct kernfs_open_file *of,
> char *buf, size_t nbytes, loff_t off)
> {
> int ret = 0;
> - struct page_counter *counter;
> + struct page_counter *counter, *reserved_counter;
> struct hugetlb_cgroup *h_cg = hugetlb_cgroup_from_css(of_css(of));
>
> counter = &h_cg->hugepage[MEMFILE_IDX(of_cft(of)->private)];
> + reserved_counter = &h_cg->reserved_hugepage[
> + MEMFILE_IDX(of_cft(of)->private)];
>
> switch (MEMFILE_ATTR(of_cft(of)->private)) {
> case RES_MAX_USAGE:
> page_counter_reset_watermark(counter);
> break;
> + case RES_RESERVATION_MAX_USAGE:
> + page_counter_reset_watermark(reserved_counter);
> + break;
> case RES_FAILCNT:
> counter->failcnt = 0;
> break;
> + case RES_RESERVATION_FAILCNT:
> + reserved_counter->failcnt = 0;
> + break;
> default:
> ret = -EINVAL;
> break;
> @@ -357,7 +399,7 @@ static void __init __hugetlb_cgroup_file_init(int idx)
> struct hstate *h = &hstates[idx];
>
> /* format the size */
> - mem_fmt(buf, 32, huge_page_size(h));
> + mem_fmt(buf, sizeof(buf), huge_page_size(h));
>
> /* Add the limit file */
> cft = &h->cgroup_files[0];
> @@ -366,28 +408,58 @@ static void __init __hugetlb_cgroup_file_init(int idx)
> cft->read_u64 = hugetlb_cgroup_read_u64;
> cft->write = hugetlb_cgroup_write;
>
> - /* Add the usage file */
> + /* Add the reservation limit file */
> cft = &h->cgroup_files[1];
> + snprintf(cft->name, MAX_CFTYPE_NAME, "%s.reservation_limit_in_bytes",
> + buf);
> + cft->private = MEMFILE_PRIVATE(idx, RES_RESERVATION_LIMIT);
> + cft->read_u64 = hugetlb_cgroup_read_u64;
> + cft->write = hugetlb_cgroup_write;
> +
> + /* Add the usage file */
> + cft = &h->cgroup_files[2];
> snprintf(cft->name, MAX_CFTYPE_NAME, "%s.usage_in_bytes", buf);
> cft->private = MEMFILE_PRIVATE(idx, RES_USAGE);
> cft->read_u64 = hugetlb_cgroup_read_u64;
>
> + /* Add the reservation usage file */
> + cft = &h->cgroup_files[3];
> + snprintf(cft->name, MAX_CFTYPE_NAME, "%s.reservation_usage_in_bytes",
> + buf);
> + cft->private = MEMFILE_PRIVATE(idx, RES_RESERVATION_USAGE);
> + cft->read_u64 = hugetlb_cgroup_read_u64;
> +
> /* Add the MAX usage file */
> - cft = &h->cgroup_files[2];
> + cft = &h->cgroup_files[4];
> snprintf(cft->name, MAX_CFTYPE_NAME, "%s.max_usage_in_bytes", buf);
> cft->private = MEMFILE_PRIVATE(idx, RES_MAX_USAGE);
> cft->write = hugetlb_cgroup_reset;
> cft->read_u64 = hugetlb_cgroup_read_u64;
>
> + /* Add the MAX reservation usage file */
> + cft = &h->cgroup_files[5];
> + snprintf(cft->name, MAX_CFTYPE_NAME,
> + "%s.reservation_max_usage_in_bytes", buf);
> + cft->private = MEMFILE_PRIVATE(idx, RES_RESERVATION_MAX_USAGE);
> + cft->write = hugetlb_cgroup_reset;
> + cft->read_u64 = hugetlb_cgroup_read_u64;
> +
> /* Add the failcntfile */
> - cft = &h->cgroup_files[3];
> + cft = &h->cgroup_files[6];
> snprintf(cft->name, MAX_CFTYPE_NAME, "%s.failcnt", buf);
> cft->private = MEMFILE_PRIVATE(idx, RES_FAILCNT);
> cft->write = hugetlb_cgroup_reset;
> cft->read_u64 = hugetlb_cgroup_read_u64;
>
> + /* Add the reservation failcntfile */
> + cft = &h->cgroup_files[7];
> + snprintf(cft->name, MAX_CFTYPE_NAME, "%s.reservation_failcnt", buf);
> + cft->private = MEMFILE_PRIVATE(idx, RES_FAILCNT);
> + cft->write = hugetlb_cgroup_reset;
> + cft->read_u64 = hugetlb_cgroup_read_u64;
> +
> /* NULL terminate the last cft */
> - cft = &h->cgroup_files[4];
> + cft = &h->cgroup_files[8];
> memset(cft, 0, sizeof(*cft));
Replace the numeric indices with symbolic names.
>
> WARN_ON(cgroup_add_legacy_cftypes(&hugetlb_cgrp_subsys,
> --
> 2.23.0.rc1.153.gdeed80330f-goog
next prev parent reply other threads:[~2019-08-15 3:54 UTC|newest]
Thread overview: 20+ messages / expand[flat|nested] mbox.gz Atom feed top
2019-08-08 23:13 [RFC PATCH v2 0/5] hugetlb_cgroup: Add hugetlb_cgroup reservation limits Mina Almasry
2019-08-08 23:13 ` [RFC PATCH v2 1/5] hugetlb_cgroup: Add hugetlb_cgroup reservation counter Mina Almasry
2019-08-08 23:13 ` [RFC PATCH v2 2/5] hugetlb_cgroup: Add interface for charge/uncharge Mina Almasry
2019-08-08 23:13 ` [RFC PATCH v2 3/5] hugetlb_cgroup: Add reservation accounting for private mappings Mina Almasry
2019-08-08 23:13 ` [RFC PATCH v2 4/5] hugetlb_cgroup: Add accounting for shared mappings Mina Almasry
2019-08-13 23:54 ` Mike Kravetz
2019-08-14 16:46 ` Mike Kravetz
2019-08-15 23:04 ` Mina Almasry
2019-08-16 16:28 ` Mike Kravetz
2019-08-16 18:06 ` Mina Almasry
2019-08-15 23:08 ` Mina Almasry
2019-08-16 16:33 ` Mike Kravetz
2019-08-08 23:13 ` [RFC PATCH v2 5/5] hugetlb_cgroup: Add hugetlb_cgroup reservation tests Mina Almasry
2019-08-09 17:54 ` [RFC PATCH v2 0/5] hugetlb_cgroup: Add hugetlb_cgroup reservation limits Mike Kravetz
2019-08-09 19:42 ` Mina Almasry
2019-08-10 18:58 ` Mike Kravetz
2019-08-10 22:01 ` Mina Almasry
2019-08-13 23:40 ` Mike Kravetz
2019-08-15 3:53 ` Hillf Danton [this message]
2019-08-15 23:21 ` [RFC PATCH v2 1/5] hugetlb_cgroup: Add hugetlb_cgroup reservation counter Mina Almasry
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20190815035352.14952-1-hdanton@sina.com \
--to=hdanton@sina.com \
--cc=akpm@linux-foundation.org \
--cc=almasrymina@google.com \
--cc=gthelen@google.com \
--cc=khalid.aziz@oracle.com \
--cc=linux-kernel@vger.kernel.org \
--cc=linux-kselftest@vger.kernel.org \
--cc=linux-mm@kvack.org \
--cc=mike.kravetz@oracle.com \
--cc=rientjes@google.com \
--cc=shakeelb@google.com \
--cc=shuah@kernel.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).