mirror of
https://git.kernel.org/pub/scm/linux/kernel/git/stable/linux.git
synced 2025-01-19 12:00:00 +00:00
6a26f9c689
Currently the event counting provided by misc.events is hierarchical, which is not practical if the user is only concerned with the events of a specific cgroup. Therefore, introduce misc.events.local to collect events specific to the given cgroup. This is analogous to memory.events.local and pids.events.local. Signed-off-by: Xiu Jianfeng <xiujianfeng@huawei.com> Signed-off-by: Tejun Heo <tj@kernel.org>
491 lines
11 KiB
C
491 lines
11 KiB
C
// SPDX-License-Identifier: GPL-2.0
|
|
/*
|
|
* Miscellaneous cgroup controller
|
|
*
|
|
* Copyright 2020 Google LLC
|
|
* Author: Vipin Sharma <vipinsh@google.com>
|
|
*/
|
|
|
|
#include <linux/limits.h>
|
|
#include <linux/cgroup.h>
|
|
#include <linux/errno.h>
|
|
#include <linux/atomic.h>
|
|
#include <linux/slab.h>
|
|
#include <linux/misc_cgroup.h>
|
|
|
|
/* Keyword accepted by (and printed in) misc.max to mean "no limit". */
#define MAX_STR "max"
/* Numeric limit value that stands for "no limit". */
#define MAX_NUM U64_MAX
|
|
|
|
/*
 * Resource names as they appear in the interface files, indexed by
 * enum misc_res_type. The entries must stay in the same order as the enum.
 */
static const char *const misc_res_name[] = {
#ifdef CONFIG_KVM_AMD_SEV
	"sev",		/* AMD SEV ASIDs resource */
	"sev_es",	/* AMD SEV-ES ASIDs resource */
#endif
};
|
|
|
|
/* Root misc cgroup */
|
|
static struct misc_cg root_cg;
|
|
|
|
/*
|
|
* Miscellaneous resources capacity for the entire machine. 0 capacity means
|
|
* resource is not initialized or not present in the host.
|
|
*
|
|
* root_cg.max and capacity are independent of each other. root_cg.max can be
|
|
* more than the actual capacity. We are using Limits resource distribution
|
|
* model of cgroup for miscellaneous controller.
|
|
*/
|
|
static u64 misc_res_capacity[MISC_CG_RES_TYPES];
|
|
|
|
/**
|
|
* parent_misc() - Get the parent of the passed misc cgroup.
|
|
* @cgroup: cgroup whose parent needs to be fetched.
|
|
*
|
|
* Context: Any context.
|
|
* Return:
|
|
* * struct misc_cg* - Parent of the @cgroup.
|
|
* * %NULL - If @cgroup is null or the passed cgroup does not have a parent.
|
|
*/
|
|
static struct misc_cg *parent_misc(struct misc_cg *cgroup)
|
|
{
|
|
return cgroup ? css_misc(cgroup->css.parent) : NULL;
|
|
}
|
|
|
|
/**
|
|
* valid_type() - Check if @type is valid or not.
|
|
* @type: misc res type.
|
|
*
|
|
* Context: Any context.
|
|
* Return:
|
|
* * true - If valid type.
|
|
* * false - If not valid type.
|
|
*/
|
|
static inline bool valid_type(enum misc_res_type type)
|
|
{
|
|
return type >= 0 && type < MISC_CG_RES_TYPES;
|
|
}
|
|
|
|
/**
|
|
* misc_cg_res_total_usage() - Get the current total usage of the resource.
|
|
* @type: misc res type.
|
|
*
|
|
* Context: Any context.
|
|
* Return: Current total usage of the resource.
|
|
*/
|
|
u64 misc_cg_res_total_usage(enum misc_res_type type)
|
|
{
|
|
if (valid_type(type))
|
|
return atomic64_read(&root_cg.res[type].usage);
|
|
|
|
return 0;
|
|
}
|
|
EXPORT_SYMBOL_GPL(misc_cg_res_total_usage);
|
|
|
|
/**
|
|
* misc_cg_set_capacity() - Set the capacity of the misc cgroup res.
|
|
* @type: Type of the misc res.
|
|
* @capacity: Supported capacity of the misc res on the host.
|
|
*
|
|
* If capacity is 0 then the charging a misc cgroup fails for that type.
|
|
*
|
|
* Context: Any context.
|
|
* Return:
|
|
* * %0 - Successfully registered the capacity.
|
|
* * %-EINVAL - If @type is invalid.
|
|
*/
|
|
int misc_cg_set_capacity(enum misc_res_type type, u64 capacity)
|
|
{
|
|
if (!valid_type(type))
|
|
return -EINVAL;
|
|
|
|
WRITE_ONCE(misc_res_capacity[type], capacity);
|
|
return 0;
|
|
}
|
|
EXPORT_SYMBOL_GPL(misc_cg_set_capacity);
|
|
|
|
/**
|
|
* misc_cg_cancel_charge() - Cancel the charge from the misc cgroup.
|
|
* @type: Misc res type in misc cg to cancel the charge from.
|
|
* @cg: Misc cgroup to cancel charge from.
|
|
* @amount: Amount to cancel.
|
|
*
|
|
* Context: Any context.
|
|
*/
|
|
static void misc_cg_cancel_charge(enum misc_res_type type, struct misc_cg *cg,
|
|
u64 amount)
|
|
{
|
|
WARN_ONCE(atomic64_add_negative(-amount, &cg->res[type].usage),
|
|
"misc cgroup resource %s became less than 0",
|
|
misc_res_name[type]);
|
|
}
|
|
|
|
/*
 * Raise @res->watermark to @new_usage when @new_usage is larger than the
 * value currently stored. The update is done with a compare-and-exchange
 * that is retried whenever the watermark changed between the read and the
 * exchange, so the stored value is never lowered.
 */
static void misc_cg_update_watermark(struct misc_res *res, u64 new_usage)
{
	u64 seen;

	do {
		seen = atomic64_read(&res->watermark);
		/* Already at or above the new usage: nothing to record. */
		if (seen >= new_usage)
			return;
	} while (atomic64_cmpxchg(&res->watermark, seen, new_usage) != seen);
}
|
|
|
|
static void misc_cg_event(enum misc_res_type type, struct misc_cg *cg)
|
|
{
|
|
atomic64_inc(&cg->res[type].events_local);
|
|
cgroup_file_notify(&cg->events_local_file);
|
|
|
|
for (; parent_misc(cg); cg = parent_misc(cg)) {
|
|
atomic64_inc(&cg->res[type].events);
|
|
cgroup_file_notify(&cg->events_file);
|
|
}
|
|
}
|
|
|
|
/**
|
|
* misc_cg_try_charge() - Try charging the misc cgroup.
|
|
* @type: Misc res type to charge.
|
|
* @cg: Misc cgroup which will be charged.
|
|
* @amount: Amount to charge.
|
|
*
|
|
* Charge @amount to the misc cgroup. Caller must use the same cgroup during
|
|
* the uncharge call.
|
|
*
|
|
* Context: Any context.
|
|
* Return:
|
|
* * %0 - If successfully charged.
|
|
* * -EINVAL - If @type is invalid or misc res has 0 capacity.
|
|
* * -EBUSY - If max limit will be crossed or total usage will be more than the
|
|
* capacity.
|
|
*/
|
|
int misc_cg_try_charge(enum misc_res_type type, struct misc_cg *cg, u64 amount)
|
|
{
|
|
struct misc_cg *i, *j;
|
|
int ret;
|
|
struct misc_res *res;
|
|
u64 new_usage;
|
|
|
|
if (!(valid_type(type) && cg && READ_ONCE(misc_res_capacity[type])))
|
|
return -EINVAL;
|
|
|
|
if (!amount)
|
|
return 0;
|
|
|
|
for (i = cg; i; i = parent_misc(i)) {
|
|
res = &i->res[type];
|
|
|
|
new_usage = atomic64_add_return(amount, &res->usage);
|
|
if (new_usage > READ_ONCE(res->max) ||
|
|
new_usage > READ_ONCE(misc_res_capacity[type])) {
|
|
ret = -EBUSY;
|
|
goto err_charge;
|
|
}
|
|
misc_cg_update_watermark(res, new_usage);
|
|
}
|
|
return 0;
|
|
|
|
err_charge:
|
|
misc_cg_event(type, i);
|
|
|
|
for (j = cg; j != i; j = parent_misc(j))
|
|
misc_cg_cancel_charge(type, j, amount);
|
|
misc_cg_cancel_charge(type, i, amount);
|
|
return ret;
|
|
}
|
|
EXPORT_SYMBOL_GPL(misc_cg_try_charge);
|
|
|
|
/**
|
|
* misc_cg_uncharge() - Uncharge the misc cgroup.
|
|
* @type: Misc res type which was charged.
|
|
* @cg: Misc cgroup which will be uncharged.
|
|
* @amount: Charged amount.
|
|
*
|
|
* Context: Any context.
|
|
*/
|
|
void misc_cg_uncharge(enum misc_res_type type, struct misc_cg *cg, u64 amount)
|
|
{
|
|
struct misc_cg *i;
|
|
|
|
if (!(amount && valid_type(type) && cg))
|
|
return;
|
|
|
|
for (i = cg; i; i = parent_misc(i))
|
|
misc_cg_cancel_charge(type, i, amount);
|
|
}
|
|
EXPORT_SYMBOL_GPL(misc_cg_uncharge);
|
|
|
|
/**
|
|
* misc_cg_max_show() - Show the misc cgroup max limit.
|
|
* @sf: Interface file
|
|
* @v: Arguments passed
|
|
*
|
|
* Context: Any context.
|
|
* Return: 0 to denote successful print.
|
|
*/
|
|
static int misc_cg_max_show(struct seq_file *sf, void *v)
|
|
{
|
|
int i;
|
|
struct misc_cg *cg = css_misc(seq_css(sf));
|
|
u64 max;
|
|
|
|
for (i = 0; i < MISC_CG_RES_TYPES; i++) {
|
|
if (READ_ONCE(misc_res_capacity[i])) {
|
|
max = READ_ONCE(cg->res[i].max);
|
|
if (max == MAX_NUM)
|
|
seq_printf(sf, "%s max\n", misc_res_name[i]);
|
|
else
|
|
seq_printf(sf, "%s %llu\n", misc_res_name[i],
|
|
max);
|
|
}
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
/**
|
|
* misc_cg_max_write() - Update the maximum limit of the cgroup.
|
|
* @of: Handler for the file.
|
|
* @buf: Data from the user. It should be either "max", 0, or a positive
|
|
* integer.
|
|
* @nbytes: Number of bytes of the data.
|
|
* @off: Offset in the file.
|
|
*
|
|
* User can pass data like:
|
|
* echo sev 23 > misc.max, OR
|
|
* echo sev max > misc.max
|
|
*
|
|
* Context: Any context.
|
|
* Return:
|
|
* * >= 0 - Number of bytes processed in the input.
|
|
* * -EINVAL - If buf is not valid.
|
|
* * -ERANGE - If number is bigger than the u64 capacity.
|
|
*/
|
|
static ssize_t misc_cg_max_write(struct kernfs_open_file *of, char *buf,
|
|
size_t nbytes, loff_t off)
|
|
{
|
|
struct misc_cg *cg;
|
|
u64 max;
|
|
int ret = 0, i;
|
|
enum misc_res_type type = MISC_CG_RES_TYPES;
|
|
char *token;
|
|
|
|
buf = strstrip(buf);
|
|
token = strsep(&buf, " ");
|
|
|
|
if (!token || !buf)
|
|
return -EINVAL;
|
|
|
|
for (i = 0; i < MISC_CG_RES_TYPES; i++) {
|
|
if (!strcmp(misc_res_name[i], token)) {
|
|
type = i;
|
|
break;
|
|
}
|
|
}
|
|
|
|
if (type == MISC_CG_RES_TYPES)
|
|
return -EINVAL;
|
|
|
|
if (!strcmp(MAX_STR, buf)) {
|
|
max = MAX_NUM;
|
|
} else {
|
|
ret = kstrtou64(buf, 0, &max);
|
|
if (ret)
|
|
return ret;
|
|
}
|
|
|
|
cg = css_misc(of_css(of));
|
|
|
|
if (READ_ONCE(misc_res_capacity[type]))
|
|
WRITE_ONCE(cg->res[type].max, max);
|
|
else
|
|
ret = -EINVAL;
|
|
|
|
return ret ? ret : nbytes;
|
|
}
|
|
|
|
/**
|
|
* misc_cg_current_show() - Show the current usage of the misc cgroup.
|
|
* @sf: Interface file
|
|
* @v: Arguments passed
|
|
*
|
|
* Context: Any context.
|
|
* Return: 0 to denote successful print.
|
|
*/
|
|
static int misc_cg_current_show(struct seq_file *sf, void *v)
|
|
{
|
|
int i;
|
|
u64 usage;
|
|
struct misc_cg *cg = css_misc(seq_css(sf));
|
|
|
|
for (i = 0; i < MISC_CG_RES_TYPES; i++) {
|
|
usage = atomic64_read(&cg->res[i].usage);
|
|
if (READ_ONCE(misc_res_capacity[i]) || usage)
|
|
seq_printf(sf, "%s %llu\n", misc_res_name[i], usage);
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
/**
|
|
* misc_cg_peak_show() - Show the peak usage of the misc cgroup.
|
|
* @sf: Interface file
|
|
* @v: Arguments passed
|
|
*
|
|
* Context: Any context.
|
|
* Return: 0 to denote successful print.
|
|
*/
|
|
static int misc_cg_peak_show(struct seq_file *sf, void *v)
|
|
{
|
|
int i;
|
|
u64 watermark;
|
|
struct misc_cg *cg = css_misc(seq_css(sf));
|
|
|
|
for (i = 0; i < MISC_CG_RES_TYPES; i++) {
|
|
watermark = atomic64_read(&cg->res[i].watermark);
|
|
if (READ_ONCE(misc_res_capacity[i]) || watermark)
|
|
seq_printf(sf, "%s %llu\n", misc_res_name[i], watermark);
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
/**
|
|
* misc_cg_capacity_show() - Show the total capacity of misc res on the host.
|
|
* @sf: Interface file
|
|
* @v: Arguments passed
|
|
*
|
|
* Only present in the root cgroup directory.
|
|
*
|
|
* Context: Any context.
|
|
* Return: 0 to denote successful print.
|
|
*/
|
|
static int misc_cg_capacity_show(struct seq_file *sf, void *v)
|
|
{
|
|
int i;
|
|
u64 cap;
|
|
|
|
for (i = 0; i < MISC_CG_RES_TYPES; i++) {
|
|
cap = READ_ONCE(misc_res_capacity[i]);
|
|
if (cap)
|
|
seq_printf(sf, "%s %llu\n", misc_res_name[i], cap);
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
/*
 * Common body of the events files: print one "<name>.max <count>" line per
 * resource. @local selects the per-cgroup counter (events_local) instead of
 * the hierarchical one (events). A resource is listed when it has capacity
 * or its selected counter is non-zero. Always returns 0.
 */
static int __misc_events_show(struct seq_file *sf, bool local)
{
	struct misc_cg *cg = css_misc(seq_css(sf));
	u64 count;
	int idx;

	for (idx = 0; idx < MISC_CG_RES_TYPES; idx++) {
		count = local ? atomic64_read(&cg->res[idx].events_local)
			      : atomic64_read(&cg->res[idx].events);

		if (!READ_ONCE(misc_res_capacity[idx]) && !count)
			continue;

		seq_printf(sf, "%s.max %llu\n", misc_res_name[idx], count);
	}

	return 0;
}
|
|
|
|
static int misc_events_show(struct seq_file *sf, void *v)
|
|
{
|
|
return __misc_events_show(sf, false);
|
|
}
|
|
|
|
static int misc_events_local_show(struct seq_file *sf, void *v)
|
|
{
|
|
return __misc_events_show(sf, true);
|
|
}
|
|
|
|
/* Misc cgroup interface files */
|
|
static struct cftype misc_cg_files[] = {
|
|
{
|
|
.name = "max",
|
|
.write = misc_cg_max_write,
|
|
.seq_show = misc_cg_max_show,
|
|
.flags = CFTYPE_NOT_ON_ROOT,
|
|
},
|
|
{
|
|
.name = "current",
|
|
.seq_show = misc_cg_current_show,
|
|
},
|
|
{
|
|
.name = "peak",
|
|
.seq_show = misc_cg_peak_show,
|
|
},
|
|
{
|
|
.name = "capacity",
|
|
.seq_show = misc_cg_capacity_show,
|
|
.flags = CFTYPE_ONLY_ON_ROOT,
|
|
},
|
|
{
|
|
.name = "events",
|
|
.flags = CFTYPE_NOT_ON_ROOT,
|
|
.file_offset = offsetof(struct misc_cg, events_file),
|
|
.seq_show = misc_events_show,
|
|
},
|
|
{
|
|
.name = "events.local",
|
|
.flags = CFTYPE_NOT_ON_ROOT,
|
|
.file_offset = offsetof(struct misc_cg, events_local_file),
|
|
.seq_show = misc_events_local_show,
|
|
},
|
|
{}
|
|
};
|
|
|
|
/**
|
|
* misc_cg_alloc() - Allocate misc cgroup.
|
|
* @parent_css: Parent cgroup.
|
|
*
|
|
* Context: Process context.
|
|
* Return:
|
|
* * struct cgroup_subsys_state* - css of the allocated cgroup.
|
|
* * ERR_PTR(-ENOMEM) - No memory available to allocate.
|
|
*/
|
|
static struct cgroup_subsys_state *
|
|
misc_cg_alloc(struct cgroup_subsys_state *parent_css)
|
|
{
|
|
enum misc_res_type i;
|
|
struct misc_cg *cg;
|
|
|
|
if (!parent_css) {
|
|
cg = &root_cg;
|
|
} else {
|
|
cg = kzalloc(sizeof(*cg), GFP_KERNEL);
|
|
if (!cg)
|
|
return ERR_PTR(-ENOMEM);
|
|
}
|
|
|
|
for (i = 0; i < MISC_CG_RES_TYPES; i++) {
|
|
WRITE_ONCE(cg->res[i].max, MAX_NUM);
|
|
atomic64_set(&cg->res[i].usage, 0);
|
|
}
|
|
|
|
return &cg->css;
|
|
}
|
|
|
|
/**
 * misc_cg_free() - Release the memory of a misc cgroup.
 * @css: cgroup subsys object embedded in the misc cgroup to free.
 *
 * Context: Any context.
 */
static void misc_cg_free(struct cgroup_subsys_state *css)
{
	struct misc_cg *cg = css_misc(css);

	kfree(cg);
}
|
|
|
|
/* Cgroup controller callbacks */
|
|
struct cgroup_subsys misc_cgrp_subsys = {
|
|
.css_alloc = misc_cg_alloc,
|
|
.css_free = misc_cg_free,
|
|
.legacy_cftypes = misc_cg_files,
|
|
.dfl_cftypes = misc_cg_files,
|
|
};
|