1c942fddfSThomas Gleixner // SPDX-License-Identifier: GPL-2.0-or-later
2c757249aSShailabh Nagar /*
3c757249aSShailabh Nagar * taskstats.c - Export per-task statistics to userland
4c757249aSShailabh Nagar *
5c757249aSShailabh Nagar * Copyright (C) Shailabh Nagar, IBM Corp. 2006
6c757249aSShailabh Nagar * (C) Balbir Singh, IBM Corp. 2006
7c757249aSShailabh Nagar */
8c757249aSShailabh Nagar
9c757249aSShailabh Nagar #include <linux/kernel.h>
10c757249aSShailabh Nagar #include <linux/taskstats_kern.h>
11f3cef7a9SJay Lan #include <linux/tsacct_kern.h>
120e0af57eSDr. Thomas Orgis #include <linux/acct.h>
136f44993fSShailabh Nagar #include <linux/delayacct.h>
14f9fd8914SShailabh Nagar #include <linux/cpumask.h>
15f9fd8914SShailabh Nagar #include <linux/percpu.h>
165a0e3ad6STejun Heo #include <linux/slab.h>
17846c7bb0SBalbir Singh #include <linux/cgroupstats.h>
18846c7bb0SBalbir Singh #include <linux/cgroup.h>
19846c7bb0SBalbir Singh #include <linux/fs.h>
20846c7bb0SBalbir Singh #include <linux/file.h>
214bd6e32aSEric W. Biederman #include <linux/pid_namespace.h>
22c757249aSShailabh Nagar #include <net/genetlink.h>
2360063497SArun Sharma #include <linux/atomic.h>
248c733420SZhang Xiao #include <linux/sched/cputime.h>
25c757249aSShailabh Nagar
/*
 * Upper bound, in bytes, on the length of the cpulist string accepted in
 * the TASKSTATS_CMD_ATTR_REGISTER_CPUMASK and
 * TASKSTATS_CMD_ATTR_DEREGISTER_CPUMASK attributes.
 */
#define TASKSTATS_CPUMASK_MAXLEN	(100 + 6 * NR_CPUS)
31f9fd8914SShailabh Nagar
32b81f3ea9SVegard Nossum static DEFINE_PER_CPU(__u32, taskstats_seqnum);
33c757249aSShailabh Nagar static int family_registered;
34e18b890bSChristoph Lameter struct kmem_cache *taskstats_cache;
35c757249aSShailabh Nagar
36489111e5SJohannes Berg static struct genl_family family;
37c757249aSShailabh Nagar
387c1e0926SJakub Kicinski static const struct nla_policy taskstats_cmd_get_policy[] = {
39c757249aSShailabh Nagar [TASKSTATS_CMD_ATTR_PID] = { .type = NLA_U32 },
40c757249aSShailabh Nagar [TASKSTATS_CMD_ATTR_TGID] = { .type = NLA_U32 },
41f9fd8914SShailabh Nagar [TASKSTATS_CMD_ATTR_REGISTER_CPUMASK] = { .type = NLA_STRING },
42f9fd8914SShailabh Nagar [TASKSTATS_CMD_ATTR_DEREGISTER_CPUMASK] = { .type = NLA_STRING },};
43f9fd8914SShailabh Nagar
447c1e0926SJakub Kicinski static const struct nla_policy cgroupstats_cmd_get_policy[] = {
45846c7bb0SBalbir Singh [CGROUPSTATS_CMD_ATTR_FD] = { .type = NLA_U32 },
46846c7bb0SBalbir Singh };
47846c7bb0SBalbir Singh
48f9fd8914SShailabh Nagar struct listener {
49f9fd8914SShailabh Nagar struct list_head list;
50f9fd8914SShailabh Nagar pid_t pid;
51bb129994SShailabh Nagar char valid;
52c757249aSShailabh Nagar };
53c757249aSShailabh Nagar
54f9fd8914SShailabh Nagar struct listener_list {
55f9fd8914SShailabh Nagar struct rw_semaphore sem;
56f9fd8914SShailabh Nagar struct list_head list;
57f9fd8914SShailabh Nagar };
58f9fd8914SShailabh Nagar static DEFINE_PER_CPU(struct listener_list, listener_array);
59f9fd8914SShailabh Nagar
/* Operation selector passed to add_del_listener(). */
enum actions {
	REGISTER,	/* add the caller as a listener */
	DEREGISTER,	/* remove the caller's listener entries */
	CPU_DONT_CARE	/* not referenced by the code visible in this file */
};
65c757249aSShailabh Nagar
/*
 * Allocate a generic netlink message with room for @size bytes of payload
 * and put the family header for @cmd into it.
 *
 * With a non-NULL @info the header is built as a reply to that request.
 * With a NULL @info the sequence number is taken from the per-CPU
 * taskstats_seqnum counter (its value before the increment).
 *
 * On success stores the new skb in *@skbp and returns 0. Returns -ENOMEM
 * if the skb cannot be allocated and -EINVAL if the header cannot be added,
 * in which case the skb is freed.
 */
static int prepare_reply(struct genl_info *info, u8 cmd, struct sk_buff **skbp,
			 size_t size)
{
	struct sk_buff *msg;
	void *hdr;

	/* If new attributes are added, please revisit this allocation */
	msg = genlmsg_new(size, GFP_KERNEL);
	if (!msg)
		return -ENOMEM;

	if (info) {
		hdr = genlmsg_put_reply(msg, info, &family, 0, cmd);
	} else {
		int seq = this_cpu_inc_return(taskstats_seqnum) - 1;

		hdr = genlmsg_put(msg, 0, seq, &family, 0, cmd);
	}

	if (!hdr) {
		nlmsg_free(msg);
		return -EINVAL;
	}

	*skbp = msg;
	return 0;
}
93c757249aSShailabh Nagar
/*
 * Finalise the message in @skb and send it back to the requester described
 * by @info. Returns whatever genlmsg_reply() returns.
 */
static int send_reply(struct sk_buff *skb, struct genl_info *info)
{
	struct genlmsghdr *hdr = nlmsg_data(nlmsg_hdr(skb));

	genlmsg_end(skb, genlmsg_data(hdr));

	return genlmsg_reply(skb, info);
}
106c757249aSShailabh Nagar
107f9fd8914SShailabh Nagar /*
108f9fd8914SShailabh Nagar * Send taskstats data in @skb to listeners registered for @cpu's exit data
109f9fd8914SShailabh Nagar */
send_cpu_listeners(struct sk_buff * skb,struct listener_list * listeners)110115085eaSOleg Nesterov static void send_cpu_listeners(struct sk_buff *skb,
111115085eaSOleg Nesterov struct listener_list *listeners)
112f9fd8914SShailabh Nagar {
113b529ccf2SArnaldo Carvalho de Melo struct genlmsghdr *genlhdr = nlmsg_data(nlmsg_hdr(skb));
114f9fd8914SShailabh Nagar struct listener *s, *tmp;
115f9fd8914SShailabh Nagar struct sk_buff *skb_next, *skb_cur = skb;
116f9fd8914SShailabh Nagar void *reply = genlmsg_data(genlhdr);
11792333baaSLukas Bulwahn int delcount = 0;
118f9fd8914SShailabh Nagar
119053c095aSJohannes Berg genlmsg_end(skb, reply);
120f9fd8914SShailabh Nagar
121bb129994SShailabh Nagar down_read(&listeners->sem);
122d94a0415SShailabh Nagar list_for_each_entry(s, &listeners->list, list) {
12392333baaSLukas Bulwahn int rc;
12492333baaSLukas Bulwahn
125f9fd8914SShailabh Nagar skb_next = NULL;
126f9fd8914SShailabh Nagar if (!list_is_last(&s->list, &listeners->list)) {
127f9fd8914SShailabh Nagar skb_next = skb_clone(skb_cur, GFP_KERNEL);
128d94a0415SShailabh Nagar if (!skb_next)
129f9fd8914SShailabh Nagar break;
130f9fd8914SShailabh Nagar }
131134e6375SJohannes Berg rc = genlmsg_unicast(&init_net, skb_cur, s->pid);
132d94a0415SShailabh Nagar if (rc == -ECONNREFUSED) {
133bb129994SShailabh Nagar s->valid = 0;
134bb129994SShailabh Nagar delcount++;
135f9fd8914SShailabh Nagar }
136f9fd8914SShailabh Nagar skb_cur = skb_next;
137f9fd8914SShailabh Nagar }
138bb129994SShailabh Nagar up_read(&listeners->sem);
139f9fd8914SShailabh Nagar
140d94a0415SShailabh Nagar if (skb_cur)
141d94a0415SShailabh Nagar nlmsg_free(skb_cur);
142d94a0415SShailabh Nagar
143bb129994SShailabh Nagar if (!delcount)
144d94a0415SShailabh Nagar return;
145bb129994SShailabh Nagar
146bb129994SShailabh Nagar /* Delete invalidated entries */
147bb129994SShailabh Nagar down_write(&listeners->sem);
148bb129994SShailabh Nagar list_for_each_entry_safe(s, tmp, &listeners->list, list) {
149bb129994SShailabh Nagar if (!s->valid) {
150bb129994SShailabh Nagar list_del(&s->list);
151bb129994SShailabh Nagar kfree(s);
152bb129994SShailabh Nagar }
153bb129994SShailabh Nagar }
154bb129994SShailabh Nagar up_write(&listeners->sem);
155f9fd8914SShailabh Nagar }
156f9fd8914SShailabh Nagar
exe_add_tsk(struct taskstats * stats,struct task_struct * tsk)1570e0af57eSDr. Thomas Orgis static void exe_add_tsk(struct taskstats *stats, struct task_struct *tsk)
1580e0af57eSDr. Thomas Orgis {
1590e0af57eSDr. Thomas Orgis /* No idea if I'm allowed to access that here, now. */
1600e0af57eSDr. Thomas Orgis struct file *exe_file = get_task_exe_file(tsk);
1610e0af57eSDr. Thomas Orgis
1620e0af57eSDr. Thomas Orgis if (exe_file) {
1630e0af57eSDr. Thomas Orgis /* Following cp_new_stat64() in stat.c . */
1640e0af57eSDr. Thomas Orgis stats->ac_exe_dev =
1650e0af57eSDr. Thomas Orgis huge_encode_dev(exe_file->f_inode->i_sb->s_dev);
1660e0af57eSDr. Thomas Orgis stats->ac_exe_inode = exe_file->f_inode->i_ino;
1670e0af57eSDr. Thomas Orgis fput(exe_file);
1680e0af57eSDr. Thomas Orgis } else {
1690e0af57eSDr. Thomas Orgis stats->ac_exe_dev = 0;
1700e0af57eSDr. Thomas Orgis stats->ac_exe_inode = 0;
1710e0af57eSDr. Thomas Orgis }
1720e0af57eSDr. Thomas Orgis }
1730e0af57eSDr. Thomas Orgis
fill_stats(struct user_namespace * user_ns,struct pid_namespace * pid_ns,struct task_struct * tsk,struct taskstats * stats)1744bd6e32aSEric W. Biederman static void fill_stats(struct user_namespace *user_ns,
1754bd6e32aSEric W. Biederman struct pid_namespace *pid_ns,
1764bd6e32aSEric W. Biederman struct task_struct *tsk, struct taskstats *stats)
177c757249aSShailabh Nagar {
17851de4d90SOleg Nesterov memset(stats, 0, sizeof(*stats));
179c757249aSShailabh Nagar /*
180c757249aSShailabh Nagar * Each accounting subsystem adds calls to its functions to
181c757249aSShailabh Nagar * fill in relevant parts of struct taskstsats as follows
182c757249aSShailabh Nagar *
1837d94ddddSShailabh Nagar * per-task-foo(stats, tsk);
184c757249aSShailabh Nagar */
185c757249aSShailabh Nagar
1867d94ddddSShailabh Nagar delayacct_add_tsk(stats, tsk);
187f3cef7a9SJay Lan
188f3cef7a9SJay Lan /* fill in basic acct fields */
1896f44993fSShailabh Nagar stats->version = TASKSTATS_VERSION;
190b663a79cSMaxim Uvarov stats->nvcsw = tsk->nvcsw;
191b663a79cSMaxim Uvarov stats->nivcsw = tsk->nivcsw;
1924bd6e32aSEric W. Biederman bacct_add_tsk(user_ns, pid_ns, stats, tsk);
1936f44993fSShailabh Nagar
1949acc1853SJay Lan /* fill in extended acct fields */
1959acc1853SJay Lan xacct_add_tsk(stats, tsk);
1960e0af57eSDr. Thomas Orgis
1970e0af57eSDr. Thomas Orgis /* add executable info */
1980e0af57eSDr. Thomas Orgis exe_add_tsk(stats, tsk);
199c757249aSShailabh Nagar }
200c757249aSShailabh Nagar
/*
 * Look up the task with virtual pid @pid and fill @stats for it, using the
 * caller's user namespace and active pid namespace.
 *
 * Returns 0 on success or -ESRCH when no such task is found.
 */
static int fill_stats_for_pid(pid_t pid, struct taskstats *stats)
{
	struct task_struct *task = find_get_task_by_vpid(pid);

	if (!task)
		return -ESRCH;

	fill_stats(current_user_ns(), task_active_pid_ns(current), task, stats);
	put_task_struct(task);	/* drop the reference taken by the lookup */

	return 0;
}
2123d9e0cf1SMichael Holzheu
/*
 * Build thread-group statistics for @tgid in @stats.
 *
 * Starts from the accumulated signal->stats of the group (or zeroes when
 * there is none) and adds the figures of every thread that has no
 * exit_state set. Runs under rcu_read_lock() with the sighand lock of the
 * looked-up task held.
 *
 * Returns 0 on success, or -ESRCH when the task is not found or its sighand
 * cannot be locked. stats->version is written in both cases.
 */
static int fill_stats_for_tgid(pid_t tgid, struct taskstats *stats)
{
	struct task_struct *leader, *thread;
	unsigned long flags;
	u64 now, utime, stime;
	int rc = -ESRCH;

	/*
	 * Add additional stats from live tasks except zombie thread group
	 * leaders who are already counted with the dead tasks
	 */
	rcu_read_lock();
	leader = find_task_by_vpid(tgid);

	if (!leader || !lock_task_sighand(leader, &flags))
		goto out;

	if (leader->signal->stats)
		memcpy(stats, leader->signal->stats, sizeof(*stats));
	else
		memset(stats, 0, sizeof(*stats));

	now = ktime_get_ns();
	for_each_thread(leader, thread) {
		if (thread->exit_state)
			continue;
		/*
		 * Accounting subsystem can call its functions here to
		 * fill in relevant parts of struct taskstats as follows
		 *
		 *	per-task-foo(stats, tsk);
		 */
		delayacct_add_tsk(stats, thread);

		/* Elapsed time of the thread, converted from nsec to usec. */
		stats->ac_etime += div_u64(now - thread->start_time,
					   NSEC_PER_USEC);

		task_cputime(thread, &utime, &stime);
		stats->ac_utime += div_u64(utime, NSEC_PER_USEC);
		stats->ac_stime += div_u64(stime, NSEC_PER_USEC);

		stats->nvcsw += thread->nvcsw;
		stats->nivcsw += thread->nivcsw;
	}

	unlock_task_sighand(leader, &flags);
	rc = 0;
out:
	rcu_read_unlock();

	stats->version = TASKSTATS_VERSION;
	/*
	 * Accounting subsystems can also add calls here to modify
	 * fields of taskstats.
	 */
	return rc;
}
274c757249aSShailabh Nagar
fill_tgid_exit(struct task_struct * tsk)275ad4ecbcbSShailabh Nagar static void fill_tgid_exit(struct task_struct *tsk)
276ad4ecbcbSShailabh Nagar {
277ad4ecbcbSShailabh Nagar unsigned long flags;
278ad4ecbcbSShailabh Nagar
279b8534d7bSOleg Nesterov spin_lock_irqsave(&tsk->sighand->siglock, flags);
280ad4ecbcbSShailabh Nagar if (!tsk->signal->stats)
281ad4ecbcbSShailabh Nagar goto ret;
282ad4ecbcbSShailabh Nagar
283ad4ecbcbSShailabh Nagar /*
284ad4ecbcbSShailabh Nagar * Each accounting subsystem calls its functions here to
285ad4ecbcbSShailabh Nagar * accumalate its per-task stats for tsk, into the per-tgid structure
286ad4ecbcbSShailabh Nagar *
287ad4ecbcbSShailabh Nagar * per-task-foo(tsk->signal->stats, tsk);
288ad4ecbcbSShailabh Nagar */
289ad4ecbcbSShailabh Nagar delayacct_add_tsk(tsk->signal->stats, tsk);
290ad4ecbcbSShailabh Nagar ret:
291b8534d7bSOleg Nesterov spin_unlock_irqrestore(&tsk->sighand->siglock, flags);
292ad4ecbcbSShailabh Nagar return;
293ad4ecbcbSShailabh Nagar }
294ad4ecbcbSShailabh Nagar
/*
 * Register or deregister @pid as a listener on every CPU in @mask.
 *
 * @isadd is REGISTER to add; any other value removes. Callers must be in
 * the initial user and pid namespaces and @mask must be a subset of the
 * possible CPUs, otherwise -EINVAL is returned.
 *
 * Registration allocates one entry per CPU and skips CPUs where a valid
 * entry for @pid already exists. If an allocation fails, the removal pass
 * runs over the whole of @mask and -ENOMEM is returned.
 *
 * The removal pass deletes at most one entry with a matching pid per CPU.
 *
 * Returns 0 on success.
 */
static int add_del_listener(pid_t pid, const struct cpumask *mask, int isadd)
{
	struct listener_list *listeners;
	struct listener *entry, *next, *other;
	unsigned int cpu;
	int ret = 0;

	if (!cpumask_subset(mask, cpu_possible_mask))
		return -EINVAL;

	if (current_user_ns() != &init_user_ns)
		return -EINVAL;

	if (task_active_pid_ns(current) != &init_pid_ns)
		return -EINVAL;

	if (isadd == REGISTER) {
		for_each_cpu(cpu, mask) {
			int present = 0;

			entry = kmalloc_node(sizeof(*entry), GFP_KERNEL,
					     cpu_to_node(cpu));
			if (!entry) {
				ret = -ENOMEM;
				goto cleanup;
			}
			entry->pid = pid;
			entry->valid = 1;

			listeners = &per_cpu(listener_array, cpu);
			down_write(&listeners->sem);
			list_for_each_entry(other, &listeners->list, list) {
				if (other->pid == pid && other->valid) {
					present = 1;
					break;
				}
			}
			if (!present) {
				/* The list now owns the entry. */
				list_add(&entry->list, &listeners->list);
				entry = NULL;
			}
			up_write(&listeners->sem);
			kfree(entry);	/* nop if NULL */
		}
		return 0;
	}

	/* Deregister or cleanup */
cleanup:
	for_each_cpu(cpu, mask) {
		listeners = &per_cpu(listener_array, cpu);
		down_write(&listeners->sem);
		list_for_each_entry_safe(entry, next, &listeners->list, list) {
			if (entry->pid != pid)
				continue;
			list_del(&entry->list);
			kfree(entry);
			break;
		}
		up_write(&listeners->sem);
	}
	return ret;
}
353f9fd8914SShailabh Nagar
parse(struct nlattr * na,struct cpumask * mask)35441c7bb95SRusty Russell static int parse(struct nlattr *na, struct cpumask *mask)
355f9fd8914SShailabh Nagar {
356f9fd8914SShailabh Nagar char *data;
357f9fd8914SShailabh Nagar int len;
358f9fd8914SShailabh Nagar int ret;
359f9fd8914SShailabh Nagar
360f9fd8914SShailabh Nagar if (na == NULL)
361f9fd8914SShailabh Nagar return 1;
362f9fd8914SShailabh Nagar len = nla_len(na);
363f9fd8914SShailabh Nagar if (len > TASKSTATS_CPUMASK_MAXLEN)
364f9fd8914SShailabh Nagar return -E2BIG;
365f9fd8914SShailabh Nagar if (len < 1)
366f9fd8914SShailabh Nagar return -EINVAL;
367f9fd8914SShailabh Nagar data = kmalloc(len, GFP_KERNEL);
368f9fd8914SShailabh Nagar if (!data)
369f9fd8914SShailabh Nagar return -ENOMEM;
370872f6903SFrancis Laniel nla_strscpy(data, na, len);
37129c0177eSRusty Russell ret = cpulist_parse(data, mask);
372f9fd8914SShailabh Nagar kfree(data);
373f9fd8914SShailabh Nagar return ret;
374f9fd8914SShailabh Nagar }
375f9fd8914SShailabh Nagar
/*
 * Append a nested aggregate attribute to @skb holding the id @pid (as an
 * attribute of type @type) followed by reserved space for one struct
 * taskstats.
 *
 * The nest type is TASKSTATS_TYPE_AGGR_PID when @type is
 * TASKSTATS_TYPE_PID and TASKSTATS_TYPE_AGGR_TGID otherwise.
 *
 * Returns a pointer to the reserved taskstats area, or NULL when the skb
 * has no room; a nest that was already started is cancelled in that case.
 */
static struct taskstats *mk_reply(struct sk_buff *skb, int type, u32 pid)
{
	struct nlattr *nest, *slot;
	int aggr;

	if (type == TASKSTATS_TYPE_PID)
		aggr = TASKSTATS_TYPE_AGGR_PID;
	else
		aggr = TASKSTATS_TYPE_AGGR_TGID;

	nest = nla_nest_start_noflag(skb, aggr);
	if (!nest)
		return NULL;

	if (nla_put(skb, type, sizeof(pid), &pid) < 0)
		goto cancel;

	slot = nla_reserve_64bit(skb, TASKSTATS_TYPE_STATS,
				 sizeof(struct taskstats), TASKSTATS_TYPE_NULL);
	if (!slot)
		goto cancel;

	nla_nest_end(skb, nest);

	return nla_data(slot);

cancel:
	nla_nest_cancel(skb, nest);
	return NULL;
}
40568062b86SOleg Nesterov
cgroupstats_user_cmd(struct sk_buff * skb,struct genl_info * info)406846c7bb0SBalbir Singh static int cgroupstats_user_cmd(struct sk_buff *skb, struct genl_info *info)
407846c7bb0SBalbir Singh {
408846c7bb0SBalbir Singh int rc = 0;
409846c7bb0SBalbir Singh struct sk_buff *rep_skb;
410846c7bb0SBalbir Singh struct cgroupstats *stats;
411846c7bb0SBalbir Singh struct nlattr *na;
412846c7bb0SBalbir Singh size_t size;
413846c7bb0SBalbir Singh u32 fd;
414846c7bb0SBalbir Singh
415846c7bb0SBalbir Singh na = info->attrs[CGROUPSTATS_CMD_ATTR_FD];
416846c7bb0SBalbir Singh if (!na)
417846c7bb0SBalbir Singh return -EINVAL;
418846c7bb0SBalbir Singh
419846c7bb0SBalbir Singh fd = nla_get_u32(info->attrs[CGROUPSTATS_CMD_ATTR_FD]);
420*8152f820SAl Viro CLASS(fd, f)(fd);
421*8152f820SAl Viro if (fd_empty(f))
422f9615984SAdrian Bunk return 0;
423f9615984SAdrian Bunk
424846c7bb0SBalbir Singh size = nla_total_size(sizeof(struct cgroupstats));
425846c7bb0SBalbir Singh
426846c7bb0SBalbir Singh rc = prepare_reply(info, CGROUPSTATS_CMD_NEW, &rep_skb,
427846c7bb0SBalbir Singh size);
428846c7bb0SBalbir Singh if (rc < 0)
429*8152f820SAl Viro return rc;
430846c7bb0SBalbir Singh
431846c7bb0SBalbir Singh na = nla_reserve(rep_skb, CGROUPSTATS_TYPE_CGROUP_STATS,
432846c7bb0SBalbir Singh sizeof(struct cgroupstats));
43325353b33SAlan Cox if (na == NULL) {
4340324b5a4SJesper Juhl nlmsg_free(rep_skb);
435*8152f820SAl Viro return -EMSGSIZE;
43625353b33SAlan Cox }
43725353b33SAlan Cox
438846c7bb0SBalbir Singh stats = nla_data(na);
439846c7bb0SBalbir Singh memset(stats, 0, sizeof(*stats));
440846c7bb0SBalbir Singh
4411da91ea8SAl Viro rc = cgroupstats_build(stats, fd_file(f)->f_path.dentry);
442f9615984SAdrian Bunk if (rc < 0) {
443f9615984SAdrian Bunk nlmsg_free(rep_skb);
444*8152f820SAl Viro return rc;
445846c7bb0SBalbir Singh }
446846c7bb0SBalbir Singh
447*8152f820SAl Viro return send_reply(rep_skb, info);
448846c7bb0SBalbir Singh }
449846c7bb0SBalbir Singh
cmd_attr_register_cpumask(struct genl_info * info)45093233125SMichael Holzheu static int cmd_attr_register_cpumask(struct genl_info *info)
451c757249aSShailabh Nagar {
45241c7bb95SRusty Russell cpumask_var_t mask;
45393233125SMichael Holzheu int rc;
454f9fd8914SShailabh Nagar
45541c7bb95SRusty Russell if (!alloc_cpumask_var(&mask, GFP_KERNEL))
45641c7bb95SRusty Russell return -ENOMEM;
45741c7bb95SRusty Russell rc = parse(info->attrs[TASKSTATS_CMD_ATTR_REGISTER_CPUMASK], mask);
458f9fd8914SShailabh Nagar if (rc < 0)
45993233125SMichael Holzheu goto out;
46015e47304SEric W. Biederman rc = add_del_listener(info->snd_portid, mask, REGISTER);
46193233125SMichael Holzheu out:
46241c7bb95SRusty Russell free_cpumask_var(mask);
463f9fd8914SShailabh Nagar return rc;
46441c7bb95SRusty Russell }
465c757249aSShailabh Nagar
cmd_attr_deregister_cpumask(struct genl_info * info)46693233125SMichael Holzheu static int cmd_attr_deregister_cpumask(struct genl_info *info)
46793233125SMichael Holzheu {
46893233125SMichael Holzheu cpumask_var_t mask;
46993233125SMichael Holzheu int rc;
47093233125SMichael Holzheu
47193233125SMichael Holzheu if (!alloc_cpumask_var(&mask, GFP_KERNEL))
47293233125SMichael Holzheu return -ENOMEM;
47393233125SMichael Holzheu rc = parse(info->attrs[TASKSTATS_CMD_ATTR_DEREGISTER_CPUMASK], mask);
47493233125SMichael Holzheu if (rc < 0)
47593233125SMichael Holzheu goto out;
47615e47304SEric W. Biederman rc = add_del_listener(info->snd_portid, mask, DEREGISTER);
47793233125SMichael Holzheu out:
47893233125SMichael Holzheu free_cpumask_var(mask);
47993233125SMichael Holzheu return rc;
48093233125SMichael Holzheu }
48193233125SMichael Holzheu
taskstats_packet_size(void)4824be2c95dSJeff Mahoney static size_t taskstats_packet_size(void)
4834be2c95dSJeff Mahoney {
4844be2c95dSJeff Mahoney size_t size;
4854be2c95dSJeff Mahoney
4864be2c95dSJeff Mahoney size = nla_total_size(sizeof(u32)) +
48780df5542SNicolas Dichtel nla_total_size_64bit(sizeof(struct taskstats)) +
48880df5542SNicolas Dichtel nla_total_size(0);
48980df5542SNicolas Dichtel
4904be2c95dSJeff Mahoney return size;
4914be2c95dSJeff Mahoney }
4924be2c95dSJeff Mahoney
cmd_attr_pid(struct genl_info * info)49393233125SMichael Holzheu static int cmd_attr_pid(struct genl_info *info)
49493233125SMichael Holzheu {
49593233125SMichael Holzheu struct taskstats *stats;
49693233125SMichael Holzheu struct sk_buff *rep_skb;
49793233125SMichael Holzheu size_t size;
49893233125SMichael Holzheu u32 pid;
49993233125SMichael Holzheu int rc;
50093233125SMichael Holzheu
5014be2c95dSJeff Mahoney size = taskstats_packet_size();
502c757249aSShailabh Nagar
50337167485SOleg Nesterov rc = prepare_reply(info, TASKSTATS_CMD_NEW, &rep_skb, size);
504c757249aSShailabh Nagar if (rc < 0)
505c757249aSShailabh Nagar return rc;
506c757249aSShailabh Nagar
50751de4d90SOleg Nesterov rc = -EINVAL;
50893233125SMichael Holzheu pid = nla_get_u32(info->attrs[TASKSTATS_CMD_ATTR_PID]);
50951de4d90SOleg Nesterov stats = mk_reply(rep_skb, TASKSTATS_TYPE_PID, pid);
51051de4d90SOleg Nesterov if (!stats)
51137167485SOleg Nesterov goto err;
512c757249aSShailabh Nagar
5133d9e0cf1SMichael Holzheu rc = fill_stats_for_pid(pid, stats);
51451de4d90SOleg Nesterov if (rc < 0)
51537167485SOleg Nesterov goto err;
51693233125SMichael Holzheu return send_reply(rep_skb, info);
51793233125SMichael Holzheu err:
51893233125SMichael Holzheu nlmsg_free(rep_skb);
51993233125SMichael Holzheu return rc;
52093233125SMichael Holzheu }
52193233125SMichael Holzheu
cmd_attr_tgid(struct genl_info * info)52293233125SMichael Holzheu static int cmd_attr_tgid(struct genl_info *info)
52393233125SMichael Holzheu {
52493233125SMichael Holzheu struct taskstats *stats;
52593233125SMichael Holzheu struct sk_buff *rep_skb;
52693233125SMichael Holzheu size_t size;
52793233125SMichael Holzheu u32 tgid;
52893233125SMichael Holzheu int rc;
52993233125SMichael Holzheu
5304be2c95dSJeff Mahoney size = taskstats_packet_size();
53193233125SMichael Holzheu
53293233125SMichael Holzheu rc = prepare_reply(info, TASKSTATS_CMD_NEW, &rep_skb, size);
53393233125SMichael Holzheu if (rc < 0)
53493233125SMichael Holzheu return rc;
53593233125SMichael Holzheu
53693233125SMichael Holzheu rc = -EINVAL;
53793233125SMichael Holzheu tgid = nla_get_u32(info->attrs[TASKSTATS_CMD_ATTR_TGID]);
53851de4d90SOleg Nesterov stats = mk_reply(rep_skb, TASKSTATS_TYPE_TGID, tgid);
53951de4d90SOleg Nesterov if (!stats)
54037167485SOleg Nesterov goto err;
541c757249aSShailabh Nagar
5423d9e0cf1SMichael Holzheu rc = fill_stats_for_tgid(tgid, stats);
54351de4d90SOleg Nesterov if (rc < 0)
54437167485SOleg Nesterov goto err;
545134e6375SJohannes Berg return send_reply(rep_skb, info);
546c757249aSShailabh Nagar err:
547c757249aSShailabh Nagar nlmsg_free(rep_skb);
548c757249aSShailabh Nagar return rc;
549c757249aSShailabh Nagar }
550c757249aSShailabh Nagar
taskstats_user_cmd(struct sk_buff * skb,struct genl_info * info)55193233125SMichael Holzheu static int taskstats_user_cmd(struct sk_buff *skb, struct genl_info *info)
55293233125SMichael Holzheu {
55393233125SMichael Holzheu if (info->attrs[TASKSTATS_CMD_ATTR_REGISTER_CPUMASK])
55493233125SMichael Holzheu return cmd_attr_register_cpumask(info);
55593233125SMichael Holzheu else if (info->attrs[TASKSTATS_CMD_ATTR_DEREGISTER_CPUMASK])
55693233125SMichael Holzheu return cmd_attr_deregister_cpumask(info);
55793233125SMichael Holzheu else if (info->attrs[TASKSTATS_CMD_ATTR_PID])
55893233125SMichael Holzheu return cmd_attr_pid(info);
55993233125SMichael Holzheu else if (info->attrs[TASKSTATS_CMD_ATTR_TGID])
56093233125SMichael Holzheu return cmd_attr_tgid(info);
56193233125SMichael Holzheu else
56293233125SMichael Holzheu return -EINVAL;
56393233125SMichael Holzheu }
56493233125SMichael Holzheu
taskstats_tgid_alloc(struct task_struct * tsk)56534ec1234SOleg Nesterov static struct taskstats *taskstats_tgid_alloc(struct task_struct *tsk)
56634ec1234SOleg Nesterov {
56734ec1234SOleg Nesterov struct signal_struct *sig = tsk->signal;
5680b8d616fSChristian Brauner struct taskstats *stats_new, *stats;
56934ec1234SOleg Nesterov
5700b8d616fSChristian Brauner /* Pairs with smp_store_release() below. */
5710b8d616fSChristian Brauner stats = smp_load_acquire(&sig->stats);
5720b8d616fSChristian Brauner if (stats || thread_group_empty(tsk))
5730b8d616fSChristian Brauner return stats;
57434ec1234SOleg Nesterov
57534ec1234SOleg Nesterov /* No problem if kmem_cache_zalloc() fails */
5760b8d616fSChristian Brauner stats_new = kmem_cache_zalloc(taskstats_cache, GFP_KERNEL);
57734ec1234SOleg Nesterov
57834ec1234SOleg Nesterov spin_lock_irq(&tsk->sighand->siglock);
5790b8d616fSChristian Brauner stats = sig->stats;
5800b8d616fSChristian Brauner if (!stats) {
5810b8d616fSChristian Brauner /*
5820b8d616fSChristian Brauner * Pairs with smp_store_release() above and order the
5830b8d616fSChristian Brauner * kmem_cache_zalloc().
5840b8d616fSChristian Brauner */
5850b8d616fSChristian Brauner smp_store_release(&sig->stats, stats_new);
5860b8d616fSChristian Brauner stats = stats_new;
5870b8d616fSChristian Brauner stats_new = NULL;
58834ec1234SOleg Nesterov }
58934ec1234SOleg Nesterov spin_unlock_irq(&tsk->sighand->siglock);
59034ec1234SOleg Nesterov
5910b8d616fSChristian Brauner if (stats_new)
5920b8d616fSChristian Brauner kmem_cache_free(taskstats_cache, stats_new);
5930b8d616fSChristian Brauner
5940b8d616fSChristian Brauner return stats;
59534ec1234SOleg Nesterov }
59634ec1234SOleg Nesterov
597c757249aSShailabh Nagar /* Send pid data out on exit */
taskstats_exit(struct task_struct * tsk,int group_dead)598115085eaSOleg Nesterov void taskstats_exit(struct task_struct *tsk, int group_dead)
599c757249aSShailabh Nagar {
600c757249aSShailabh Nagar int rc;
601115085eaSOleg Nesterov struct listener_list *listeners;
60251de4d90SOleg Nesterov struct taskstats *stats;
603c757249aSShailabh Nagar struct sk_buff *rep_skb;
604c757249aSShailabh Nagar size_t size;
605c757249aSShailabh Nagar int is_thread_group;
606c757249aSShailabh Nagar
6074a279ff1SOleg Nesterov if (!family_registered)
608c757249aSShailabh Nagar return;
609c757249aSShailabh Nagar
610c757249aSShailabh Nagar /*
611c757249aSShailabh Nagar * Size includes space for nested attributes
612c757249aSShailabh Nagar */
6134be2c95dSJeff Mahoney size = taskstats_packet_size();
614c757249aSShailabh Nagar
61534ec1234SOleg Nesterov is_thread_group = !!taskstats_tgid_alloc(tsk);
6164a279ff1SOleg Nesterov if (is_thread_group) {
6174a279ff1SOleg Nesterov /* PID + STATS + TGID + STATS */
6184a279ff1SOleg Nesterov size = 2 * size;
6194a279ff1SOleg Nesterov /* fill the tsk->signal->stats structure */
6204a279ff1SOleg Nesterov fill_tgid_exit(tsk);
6214a279ff1SOleg Nesterov }
6224a279ff1SOleg Nesterov
6234a32fea9SChristoph Lameter listeners = raw_cpu_ptr(&listener_array);
624115085eaSOleg Nesterov if (list_empty(&listeners->list))
625115085eaSOleg Nesterov return;
626115085eaSOleg Nesterov
62737167485SOleg Nesterov rc = prepare_reply(NULL, TASKSTATS_CMD_NEW, &rep_skb, size);
628c757249aSShailabh Nagar if (rc < 0)
62951de4d90SOleg Nesterov return;
630c757249aSShailabh Nagar
6314bd6e32aSEric W. Biederman stats = mk_reply(rep_skb, TASKSTATS_TYPE_PID,
6324bd6e32aSEric W. Biederman task_pid_nr_ns(tsk, &init_pid_ns));
63351de4d90SOleg Nesterov if (!stats)
63437167485SOleg Nesterov goto err;
63551de4d90SOleg Nesterov
6364bd6e32aSEric W. Biederman fill_stats(&init_user_ns, &init_pid_ns, tsk, stats);
6370e0af57eSDr. Thomas Orgis if (group_dead)
6380e0af57eSDr. Thomas Orgis stats->ac_flag |= AGROUP;
639c757249aSShailabh Nagar
640c757249aSShailabh Nagar /*
641ad4ecbcbSShailabh Nagar * Doesn't matter if tsk is the leader or the last group member leaving
642c757249aSShailabh Nagar */
64368062b86SOleg Nesterov if (!is_thread_group || !group_dead)
644ad4ecbcbSShailabh Nagar goto send;
645c757249aSShailabh Nagar
6464bd6e32aSEric W. Biederman stats = mk_reply(rep_skb, TASKSTATS_TYPE_TGID,
6474bd6e32aSEric W. Biederman task_tgid_nr_ns(tsk, &init_pid_ns));
64851de4d90SOleg Nesterov if (!stats)
64937167485SOleg Nesterov goto err;
65051de4d90SOleg Nesterov
65151de4d90SOleg Nesterov memcpy(stats, tsk->signal->stats, sizeof(*stats));
652c757249aSShailabh Nagar
653ad4ecbcbSShailabh Nagar send:
654115085eaSOleg Nesterov send_cpu_listeners(rep_skb, listeners);
655ad4ecbcbSShailabh Nagar return;
65637167485SOleg Nesterov err:
657c757249aSShailabh Nagar nlmsg_free(rep_skb);
658c757249aSShailabh Nagar }
659c757249aSShailabh Nagar
6607c1e0926SJakub Kicinski static const struct genl_ops taskstats_ops[] = {
66188d36a99SJohannes Berg {
662c757249aSShailabh Nagar .cmd = TASKSTATS_CMD_GET,
663ef6243acSJohannes Berg .validate = GENL_DONT_VALIDATE_STRICT | GENL_DONT_VALIDATE_DUMP,
664f9fd8914SShailabh Nagar .doit = taskstats_user_cmd,
6657c1e0926SJakub Kicinski .policy = taskstats_cmd_get_policy,
6667c1e0926SJakub Kicinski .maxattr = ARRAY_SIZE(taskstats_cmd_get_policy) - 1,
6677c1e0926SJakub Kicinski .flags = GENL_ADMIN_PERM,
66888d36a99SJohannes Berg },
66988d36a99SJohannes Berg {
670846c7bb0SBalbir Singh .cmd = CGROUPSTATS_CMD_GET,
671ef6243acSJohannes Berg .validate = GENL_DONT_VALIDATE_STRICT | GENL_DONT_VALIDATE_DUMP,
672846c7bb0SBalbir Singh .doit = cgroupstats_user_cmd,
6737c1e0926SJakub Kicinski .policy = cgroupstats_cmd_get_policy,
6747c1e0926SJakub Kicinski .maxattr = ARRAY_SIZE(cgroupstats_cmd_get_policy) - 1,
67588d36a99SJohannes Berg },
676846c7bb0SBalbir Singh };
677846c7bb0SBalbir Singh
67856989f6dSJohannes Berg static struct genl_family family __ro_after_init = {
679489111e5SJohannes Berg .name = TASKSTATS_GENL_NAME,
680489111e5SJohannes Berg .version = TASKSTATS_GENL_VERSION,
681489111e5SJohannes Berg .module = THIS_MODULE,
6827c1e0926SJakub Kicinski .ops = taskstats_ops,
6837c1e0926SJakub Kicinski .n_ops = ARRAY_SIZE(taskstats_ops),
6849c5d03d3SJakub Kicinski .resv_start_op = CGROUPSTATS_CMD_GET + 1,
685edc73c72Sxu xin .netnsok = true,
686489111e5SJohannes Berg };
687489111e5SJohannes Berg
688c757249aSShailabh Nagar /* Needed early in initialization */
taskstats_init_early(void)689c757249aSShailabh Nagar void __init taskstats_init_early(void)
690c757249aSShailabh Nagar {
691f9fd8914SShailabh Nagar unsigned int i;
692f9fd8914SShailabh Nagar
6930a31bd5fSChristoph Lameter taskstats_cache = KMEM_CACHE(taskstats, SLAB_PANIC);
694f9fd8914SShailabh Nagar for_each_possible_cpu(i) {
695f9fd8914SShailabh Nagar INIT_LIST_HEAD(&(per_cpu(listener_array, i).list));
696f9fd8914SShailabh Nagar init_rwsem(&(per_cpu(listener_array, i).sem));
697f9fd8914SShailabh Nagar }
698c757249aSShailabh Nagar }
699c757249aSShailabh Nagar
taskstats_init(void)700c757249aSShailabh Nagar static int __init taskstats_init(void)
701c757249aSShailabh Nagar {
702c757249aSShailabh Nagar int rc;
703c757249aSShailabh Nagar
704489111e5SJohannes Berg rc = genl_register_family(&family);
705c757249aSShailabh Nagar if (rc)
706c757249aSShailabh Nagar return rc;
707c757249aSShailabh Nagar
708c757249aSShailabh Nagar family_registered = 1;
709f9b182e2SMandeep Singh Baines pr_info("registered taskstats version %d\n", TASKSTATS_GENL_VERSION);
710c757249aSShailabh Nagar return 0;
711c757249aSShailabh Nagar }
712c757249aSShailabh Nagar
/*
 * Registered as a late initcall so that the statistics collection
 * mechanisms are initialised before the taskstats interface.
 */
late_initcall(taskstats_init);
718