// SPDX-License-Identifier: GPL-2.0 /* * Miscellaneous cgroup controller * * Copyright 2020 Google LLC * Author: Vipin Sharma <vipinsh@google.com> */ #include <linux/limits.h> #include <linux/cgroup.h> #include <linux/errno.h> #include <linux/atomic.h> #include <linux/slab.h> #include <linux/misc_cgroup.h> #define MAX_STR "max" #define MAX_NUM U64_MAX /* Miscellaneous res name, keep it in sync with enum misc_res_type */ static const char *const misc_res_name[] = { #ifdef CONFIG_KVM_AMD_SEV /* AMD SEV ASIDs resource */ "sev", /* AMD SEV-ES ASIDs resource */ "sev_es", #endif }; /* Root misc cgroup */ static struct misc_cg root_cg; /* * Miscellaneous resources capacity for the entire machine. 0 capacity means * resource is not initialized or not present in the host. * * root_cg.max and capacity are independent of each other. root_cg.max can be * more than the actual capacity. We are using Limits resource distribution * model of cgroup for miscellaneous controller. */ static u64 misc_res_capacity[MISC_CG_RES_TYPES]; /** * parent_misc() - Get the parent of the passed misc cgroup. * @cgroup: cgroup whose parent needs to be fetched. * * Context: Any context. * Return: * * struct misc_cg* - Parent of the @cgroup. * * %NULL - If @cgroup is null or the passed cgroup does not have a parent. */ static struct misc_cg *parent_misc(struct misc_cg *cgroup) { return cgroup ? css_misc(cgroup->css.parent) : NULL; } /** * valid_type() - Check if @type is valid or not. * @type: misc res type. * * Context: Any context. * Return: * * true - If valid type. * * false - If not valid type. */ static inline bool valid_type(enum misc_res_type type) { return type >= 0 && type < MISC_CG_RES_TYPES; } /** * misc_cg_res_total_usage() - Get the current total usage of the resource. * @type: misc res type. * * Context: Any context. * Return: Current total usage of the resource. */ u64 misc_cg_res_total_usage(enum misc_res_type type) { if (valid_type(type)) return atomic64_read(&root_cg.res[type].usage); return 0; } EXPORT_SYMBOL_GPL(misc_cg_res_total_usage); /** * misc_cg_set_capacity() - Set the capacity of the misc cgroup res. * @type: Type of the misc res. * @capacity: Supported capacity of the misc res on the host. * * If capacity is 0 then the charging a misc cgroup fails for that type. * * Context: Any context. * Return: * * %0 - Successfully registered the capacity. * * %-EINVAL - If @type is invalid. */ int misc_cg_set_capacity(enum misc_res_type type, u64 capacity) { if (!valid_type(type)) return -EINVAL; WRITE_ONCE(misc_res_capacity[type], capacity); return 0; } EXPORT_SYMBOL_GPL(misc_cg_set_capacity); /** * misc_cg_cancel_charge() - Cancel the charge from the misc cgroup. * @type: Misc res type in misc cg to cancel the charge from. * @cg: Misc cgroup to cancel charge from. * @amount: Amount to cancel. * * Context: Any context. */ static void misc_cg_cancel_charge(enum misc_res_type type, struct misc_cg *cg, u64 amount) { WARN_ONCE(atomic64_add_negative(-amount, &cg->res[type].usage), "misc cgroup resource %s became less than 0", misc_res_name[type]); } static void misc_cg_update_watermark(struct misc_res *res, u64 new_usage) { u64 old; while (true) { old = atomic64_read(&res->watermark); if (new_usage <= old) break; if (atomic64_cmpxchg(&res->watermark, old, new_usage) == old) break; } } static void misc_cg_event(enum misc_res_type type, struct misc_cg *cg) { atomic64_inc(&cg->res[type].events_local); cgroup_file_notify(&cg->events_local_file); for (; parent_misc(cg); cg = parent_misc(cg)) { atomic64_inc(&cg->res[type].events); cgroup_file_notify(&cg->events_file); } } /** * misc_cg_try_charge() - Try charging the misc cgroup. * @type: Misc res type to charge. * @cg: Misc cgroup which will be charged. * @amount: Amount to charge. * * Charge @amount to the misc cgroup. Caller must use the same cgroup during * the uncharge call. * * Context: Any context. * Return: * * %0 - If successfully charged. * * -EINVAL - If @type is invalid or misc res has 0 capacity. * * -EBUSY - If max limit will be crossed or total usage will be more than the * capacity. */ int misc_cg_try_charge(enum misc_res_type type, struct misc_cg *cg, u64 amount) { struct misc_cg *i, *j; int ret; struct misc_res *res; u64 new_usage; if (!(valid_type(type) && cg && READ_ONCE(misc_res_capacity[type]))) return -EINVAL; if (!amount) return 0; for (i = cg; i; i = parent_misc(i)) { res = &i->res[type]; new_usage = atomic64_add_return(amount, &res->usage); if (new_usage > READ_ONCE(res->max) || new_usage > READ_ONCE(misc_res_capacity[type])) { ret = -EBUSY; goto err_charge; } misc_cg_update_watermark(res, new_usage); } return 0; err_charge: misc_cg_event(type, i); for (j = cg; j != i; j = parent_misc(j)) misc_cg_cancel_charge(type, j, amount); misc_cg_cancel_charge(type, i, amount); return ret; } EXPORT_SYMBOL_GPL(misc_cg_try_charge); /** * misc_cg_uncharge() - Uncharge the misc cgroup. * @type: Misc res type which was charged. * @cg: Misc cgroup which will be uncharged. * @amount: Charged amount. * * Context: Any context. */ void misc_cg_uncharge(enum misc_res_type type, struct misc_cg *cg, u64 amount) { struct misc_cg *i; if (!(amount && valid_type(type) && cg)) return; for (i = cg; i; i = parent_misc(i)) misc_cg_cancel_charge(type, i, amount); } EXPORT_SYMBOL_GPL(misc_cg_uncharge); /** * misc_cg_max_show() - Show the misc cgroup max limit. * @sf: Interface file * @v: Arguments passed * * Context: Any context. * Return: 0 to denote successful print. */ static int misc_cg_max_show(struct seq_file *sf, void *v) { int i; struct misc_cg *cg = css_misc(seq_css(sf)); u64 max; for (i = 0; i < MISC_CG_RES_TYPES; i++) { if (READ_ONCE(misc_res_capacity[i])) { max = READ_ONCE(cg->res[i].max); if (max == MAX_NUM) seq_printf(sf, "%s max\n", misc_res_name[i]); else seq_printf(sf, "%s %llu\n", misc_res_name[i], max); } } return 0; } /** * misc_cg_max_write() - Update the maximum limit of the cgroup. * @of: Handler for the file. * @buf: Data from the user. It should be either "max", 0, or a positive * integer. * @nbytes: Number of bytes of the data. * @off: Offset in the file. * * User can pass data like: * echo sev 23 > misc.max, OR * echo sev max > misc.max * * Context: Any context. * Return: * * >= 0 - Number of bytes processed in the input. * * -EINVAL - If buf is not valid. * * -ERANGE - If number is bigger than the u64 capacity. */ static ssize_t misc_cg_max_write(struct kernfs_open_file *of, char *buf, size_t nbytes, loff_t off) { struct misc_cg *cg; u64 max; int ret = 0, i; enum misc_res_type type = MISC_CG_RES_TYPES; char *token; buf = strstrip(buf); token = strsep(&buf, " "); if (!token || !buf) return -EINVAL; for (i = 0; i < MISC_CG_RES_TYPES; i++) { if (!strcmp(misc_res_name[i], token)) { type = i; break; } } if (type == MISC_CG_RES_TYPES) return -EINVAL; if (!strcmp(MAX_STR, buf)) { max = MAX_NUM; } else { ret = kstrtou64(buf, 0, &max); if (ret) return ret; } cg = css_misc(of_css(of)); if (READ_ONCE(misc_res_capacity[type])) WRITE_ONCE(cg->res[type].max, max); else ret = -EINVAL; return ret ? ret : nbytes; } /** * misc_cg_current_show() - Show the current usage of the misc cgroup. * @sf: Interface file * @v: Arguments passed * * Context: Any context. * Return: 0 to denote successful print. */ static int misc_cg_current_show(struct seq_file *sf, void *v) { int i; u64 usage; struct misc_cg *cg = css_misc(seq_css(sf)); for (i = 0; i < MISC_CG_RES_TYPES; i++) { usage = atomic64_read(&cg->res[i].usage); if (READ_ONCE(misc_res_capacity[i]) || usage) seq_printf(sf, "%s %llu\n", misc_res_name[i], usage); } return 0; } /** * misc_cg_peak_show() - Show the peak usage of the misc cgroup. * @sf: Interface file * @v: Arguments passed * * Context: Any context. * Return: 0 to denote successful print. */ static int misc_cg_peak_show(struct seq_file *sf, void *v) { int i; u64 watermark; struct misc_cg *cg = css_misc(seq_css(sf)); for (i = 0; i < MISC_CG_RES_TYPES; i++) { watermark = atomic64_read(&cg->res[i].watermark); if (READ_ONCE(misc_res_capacity[i]) || watermark) seq_printf(sf, "%s %llu\n", misc_res_name[i], watermark); } return 0; } /** * misc_cg_capacity_show() - Show the total capacity of misc res on the host. * @sf: Interface file * @v: Arguments passed * * Only present in the root cgroup directory. * * Context: Any context. * Return: 0 to denote successful print. */ static int misc_cg_capacity_show(struct seq_file *sf, void *v) { int i; u64 cap; for (i = 0; i < MISC_CG_RES_TYPES; i++) { cap = READ_ONCE(misc_res_capacity[i]); if (cap) seq_printf(sf, "%s %llu\n", misc_res_name[i], cap); } return 0; } static int __misc_events_show(struct seq_file *sf, bool local) { struct misc_cg *cg = css_misc(seq_css(sf)); u64 events; int i; for (i = 0; i < MISC_CG_RES_TYPES; i++) { if (local) events = atomic64_read(&cg->res[i].events_local); else events = atomic64_read(&cg->res[i].events); if (READ_ONCE(misc_res_capacity[i]) || events) seq_printf(sf, "%s.max %llu\n", misc_res_name[i], events); } return 0; } static int misc_events_show(struct seq_file *sf, void *v) { return __misc_events_show(sf, false); } static int misc_events_local_show(struct seq_file *sf, void *v) { return __misc_events_show(sf, true); } /* Misc cgroup interface files */ static struct cftype misc_cg_files[] = { { .name = "max", .write = misc_cg_max_write, .seq_show = misc_cg_max_show, .flags = CFTYPE_NOT_ON_ROOT, }, { .name = "current", .seq_show = misc_cg_current_show, }, { .name = "peak", .seq_show = misc_cg_peak_show, }, { .name = "capacity", .seq_show = misc_cg_capacity_show, .flags = CFTYPE_ONLY_ON_ROOT, }, { .name = "events", .flags = CFTYPE_NOT_ON_ROOT, .file_offset = offsetof(struct misc_cg, events_file), .seq_show = misc_events_show, }, { .name = "events.local", .flags = CFTYPE_NOT_ON_ROOT, .file_offset = offsetof(struct misc_cg, events_local_file), .seq_show = misc_events_local_show, }, {} }; /** * misc_cg_alloc() - Allocate misc cgroup. * @parent_css: Parent cgroup. * * Context: Process context. * Return: * * struct cgroup_subsys_state* - css of the allocated cgroup. * * ERR_PTR(-ENOMEM) - No memory available to allocate. */ static struct cgroup_subsys_state * misc_cg_alloc(struct cgroup_subsys_state *parent_css) { enum misc_res_type i; struct misc_cg *cg; if (!parent_css) { cg = &root_cg; } else { cg = kzalloc(sizeof(*cg), GFP_KERNEL); if (!cg) return ERR_PTR(-ENOMEM); } for (i = 0; i < MISC_CG_RES_TYPES; i++) { WRITE_ONCE(cg->res[i].max, MAX_NUM); atomic64_set(&cg->res[i].usage, 0); } return &cg->css; } /** * misc_cg_free() - Free the misc cgroup. * @css: cgroup subsys object. * * Context: Any context. */ static void misc_cg_free(struct cgroup_subsys_state *css) { kfree(css_misc(css)); } /* Cgroup controller callbacks */ struct cgroup_subsys misc_cgrp_subsys = { .css_alloc = misc_cg_alloc, .css_free = misc_cg_free, .legacy_cftypes = misc_cg_files, .dfl_cftypes = misc_cg_files, };