/*
 * Utility to get per-pid and per-tgid delay accounting statistics.
 * Also illustrates usage of the taskstats interface.
 *
 * Copyright (C) Shailabh Nagar, IBM Corp. 2005
 * Copyright (C) Balbir Singh, IBM Corp. 2006
 * Copyright (c) Jay Lan, SGI. 2006
 *
 * Compile with:
 *	gcc -I/usr/src/linux/include getdelays.c -o getdelays
 */
21 #include <sys/types.h>
23 #include <sys/socket.h>
26 #include <linux/genetlink.h>
27 #include <linux/taskstats.h>
/*
 * Generic macros for dealing with netlink sockets. Might be duplicated
 * elsewhere. It is recommended that commercial grade applications use
 * libnl or libnetlink and use the interfaces provided by the library.
 */
/*
 * Start of the generic-netlink payload of message glh: GENL_HDRLEN bytes
 * past NLMSG_DATA(glh). The cast to char * keeps the byte offset valid
 * ISO C (arithmetic on void * is a GNU extension).
 */
#define GENLMSG_DATA(glh)	((void *)((char *)NLMSG_DATA(glh) + GENL_HDRLEN))
/* Payload bytes of message glh that follow the generic-netlink header. */
#define GENLMSG_PAYLOAD(glh)	(NLMSG_PAYLOAD(glh, 0) - GENL_HDRLEN)
/* Address of the payload of attribute na, NLA_HDRLEN bytes past its start. */
#define NLA_DATA(na)		((void *)((char *)(na) + NLA_HDRLEN))
/*
 * Payload size for an attribute whose total length is len. The argument
 * is parenthesized so expressions such as (a << b) are evaluated before
 * the header length is subtracted.
 */
#define NLA_PAYLOAD(len)	((len) - NLA_HDRLEN)
39 #define err(code, fmt, arg...) \
41 fprintf(stderr, fmt, ##arg); \
/*
 * Set to 1 by main()'s option handling (after it prints
 * "printing IO accounting"); when nonzero, print_ioacct() is called for
 * each TASKSTATS_TYPE_STATS attribute received.
 */
int print_io_accounting;
/*
 * Set to 1 by main()'s option handling (after it prints
 * "printing task/process context switch rates"); when nonzero,
 * task_context_switch_counts() is called for each TASKSTATS_TYPE_STATS
 * attribute received.
 */
int print_task_context_switch_counts;
54 #define PRINTF(fmt, arg...) { \
/* Maximum size of response requested or message sent */
#define MAX_MSG_SIZE	1024
62 /* Maximum number of cpus expected to be specified in a cpumask */
68 char buf
[MAX_MSG_SIZE
];
71 char cpumask
[100+6*MAX_CPUS
];
/*
 * Print a summary of the command-line options to stderr.
 *
 * The option list includes -q, which the getopt() string in main()
 * accepts and which enables the context-switch-count output.
 */
static void usage(void)
{
	fprintf(stderr, "getdelays [-dilqv] [-w logfile] [-r bufsize] "
			"[-m cpumask] [-t tgid] [-p pid]\n");
	fprintf(stderr, " -d: print delayacct stats\n");
	fprintf(stderr, " -i: print IO accounting (works only with -p)\n");
	fprintf(stderr, " -l: listen forever\n");
	fprintf(stderr, " -q: print task/process context switch rates\n");
	fprintf(stderr, " -v: debug on\n");
}
84 * Create a raw netlink socket and bind
86 static int create_nl_socket(int protocol
)
89 struct sockaddr_nl local
;
91 fd
= socket(AF_NETLINK
, SOCK_RAW
, protocol
);
96 if (setsockopt(fd
, SOL_SOCKET
, SO_RCVBUF
,
97 &rcvbufsz
, sizeof(rcvbufsz
)) < 0) {
98 fprintf(stderr
, "Unable to set socket rcv buf size "
104 memset(&local
, 0, sizeof(local
));
105 local
.nl_family
= AF_NETLINK
;
107 if (bind(fd
, (struct sockaddr
*) &local
, sizeof(local
)) < 0)
117 int send_cmd(int sd
, __u16 nlmsg_type
, __u32 nlmsg_pid
,
118 __u8 genl_cmd
, __u16 nla_type
,
119 void *nla_data
, int nla_len
)
122 struct sockaddr_nl nladdr
;
126 struct msgtemplate msg
;
128 msg
.n
.nlmsg_len
= NLMSG_LENGTH(GENL_HDRLEN
);
129 msg
.n
.nlmsg_type
= nlmsg_type
;
130 msg
.n
.nlmsg_flags
= NLM_F_REQUEST
;
132 msg
.n
.nlmsg_pid
= nlmsg_pid
;
133 msg
.g
.cmd
= genl_cmd
;
135 na
= (struct nlattr
*) GENLMSG_DATA(&msg
);
136 na
->nla_type
= nla_type
;
137 na
->nla_len
= nla_len
+ 1 + NLA_HDRLEN
;
138 memcpy(NLA_DATA(na
), nla_data
, nla_len
);
139 msg
.n
.nlmsg_len
+= NLMSG_ALIGN(na
->nla_len
);
142 buflen
= msg
.n
.nlmsg_len
;
143 memset(&nladdr
, 0, sizeof(nladdr
));
144 nladdr
.nl_family
= AF_NETLINK
;
145 while ((r
= sendto(sd
, buf
, buflen
, 0, (struct sockaddr
*) &nladdr
,
146 sizeof(nladdr
))) < buflen
) {
150 } else if (errno
!= EAGAIN
)
158 * Probe the controller in genetlink to find the family id
159 * for the TASKSTATS family
161 int get_family_id(int sd
)
173 strcpy(name
, TASKSTATS_GENL_NAME
);
174 rc
= send_cmd(sd
, GENL_ID_CTRL
, getpid(), CTRL_CMD_GETFAMILY
,
175 CTRL_ATTR_FAMILY_NAME
, (void *)name
,
176 strlen(TASKSTATS_GENL_NAME
)+1);
178 rep_len
= recv(sd
, &ans
, sizeof(ans
), 0);
179 if (ans
.n
.nlmsg_type
== NLMSG_ERROR
||
180 (rep_len
< 0) || !NLMSG_OK((&ans
.n
), rep_len
))
183 na
= (struct nlattr
*) GENLMSG_DATA(&ans
);
184 na
= (struct nlattr
*) ((char *) na
+ NLA_ALIGN(na
->nla_len
));
185 if (na
->nla_type
== CTRL_ATTR_FAMILY_ID
) {
186 id
= *(__u16
*) NLA_DATA(na
);
191 void print_delayacct(struct taskstats
*t
)
193 printf("\n\nCPU %15s%15s%15s%15s\n"
194 " %15llu%15llu%15llu%15llu\n"
199 "count", "real total", "virtual total", "delay total",
200 t
->cpu_count
, t
->cpu_run_real_total
, t
->cpu_run_virtual_total
,
202 "count", "delay total",
203 t
->blkio_count
, t
->blkio_delay_total
,
204 "count", "delay total", t
->swapin_count
, t
->swapin_delay_total
);
207 void task_context_switch_counts(struct taskstats
*t
)
209 printf("\n\nTask %15s%15s\n"
211 "voluntary", "nonvoluntary",
212 t
->nvcsw
, t
->nivcsw
);
215 void print_ioacct(struct taskstats
*t
)
217 printf("%s: read=%llu, write=%llu, cancelled_write=%llu\n",
219 (unsigned long long)t
->read_bytes
,
220 (unsigned long long)t
->write_bytes
,
221 (unsigned long long)t
->cancelled_write_bytes
);
224 int main(int argc
, char *argv
[])
226 int c
, rc
, rep_len
, aggr_len
, len2
, cmd_type
;
240 char *logfile
= NULL
;
243 struct msgtemplate msg
;
246 c
= getopt(argc
, argv
, "qdiw:r:m:t:p:vl");
252 printf("print delayacct stats ON\n");
256 printf("printing IO accounting\n");
257 print_io_accounting
= 1;
260 printf("printing task/process context switch rates\n");
261 print_task_context_switch_counts
= 1;
264 logfile
= strdup(optarg
);
265 printf("write to file %s\n", logfile
);
269 rcvbufsz
= atoi(optarg
);
270 printf("receive buf size %d\n", rcvbufsz
);
272 err(1, "Invalid rcv buf size\n");
275 strncpy(cpumask
, optarg
, sizeof(cpumask
));
277 printf("cpumask %s maskset %d\n", cpumask
, maskset
);
282 err(1, "Invalid tgid\n");
283 cmd_type
= TASKSTATS_CMD_ATTR_TGID
;
288 err(1, "Invalid pid\n");
289 cmd_type
= TASKSTATS_CMD_ATTR_PID
;
292 printf("debug on\n");
296 printf("listen forever\n");
306 fd
= open(logfile
, O_WRONLY
| O_CREAT
| O_TRUNC
,
307 S_IRUSR
| S_IWUSR
| S_IRGRP
| S_IROTH
);
309 perror("Cannot open output file\n");
314 if ((nl_sd
= create_nl_socket(NETLINK_GENERIC
)) < 0)
315 err(1, "error creating Netlink socket\n");
319 id
= get_family_id(nl_sd
);
321 fprintf(stderr
, "Error getting family id, errno %d\n", errno
);
324 PRINTF("family id %d\n", id
);
327 rc
= send_cmd(nl_sd
, id
, mypid
, TASKSTATS_CMD_GET
,
328 TASKSTATS_CMD_ATTR_REGISTER_CPUMASK
,
329 &cpumask
, strlen(cpumask
) + 1);
330 PRINTF("Sent register cpumask, retval %d\n", rc
);
332 fprintf(stderr
, "error sending register cpumask\n");
338 rc
= send_cmd(nl_sd
, id
, mypid
, TASKSTATS_CMD_GET
,
339 cmd_type
, &tid
, sizeof(__u32
));
340 PRINTF("Sent pid/tgid, retval %d\n", rc
);
342 fprintf(stderr
, "error sending tid/tgid cmd\n");
350 rep_len
= recv(nl_sd
, &msg
, sizeof(msg
), 0);
351 PRINTF("received %d bytes\n", rep_len
);
354 fprintf(stderr
, "nonfatal reply error: errno %d\n",
358 if (msg
.n
.nlmsg_type
== NLMSG_ERROR
||
359 !NLMSG_OK((&msg
.n
), rep_len
)) {
360 struct nlmsgerr
*err
= NLMSG_DATA(&msg
);
361 fprintf(stderr
, "fatal reply error, errno %d\n",
366 PRINTF("nlmsghdr size=%d, nlmsg_len=%d, rep_len=%d\n",
367 sizeof(struct nlmsghdr
), msg
.n
.nlmsg_len
, rep_len
);
370 rep_len
= GENLMSG_PAYLOAD(&msg
.n
);
372 na
= (struct nlattr
*) GENLMSG_DATA(&msg
);
375 while (len
< rep_len
) {
376 len
+= NLA_ALIGN(na
->nla_len
);
377 switch (na
->nla_type
) {
378 case TASKSTATS_TYPE_AGGR_TGID
:
380 case TASKSTATS_TYPE_AGGR_PID
:
381 aggr_len
= NLA_PAYLOAD(na
->nla_len
);
383 /* For nested attributes, na follows */
384 na
= (struct nlattr
*) NLA_DATA(na
);
386 while (len2
< aggr_len
) {
387 switch (na
->nla_type
) {
388 case TASKSTATS_TYPE_PID
:
389 rtid
= *(int *) NLA_DATA(na
);
391 printf("PID\t%d\n", rtid
);
393 case TASKSTATS_TYPE_TGID
:
394 rtid
= *(int *) NLA_DATA(na
);
396 printf("TGID\t%d\n", rtid
);
398 case TASKSTATS_TYPE_STATS
:
401 print_delayacct((struct taskstats
*) NLA_DATA(na
));
402 if (print_io_accounting
)
403 print_ioacct((struct taskstats
*) NLA_DATA(na
));
404 if (print_task_context_switch_counts
)
405 task_context_switch_counts((struct taskstats
*) NLA_DATA(na
));
407 if (write(fd
, NLA_DATA(na
), na
->nla_len
) < 0) {
408 err(1,"write error\n");
415 fprintf(stderr
, "Unknown nested"
420 len2
+= NLA_ALIGN(na
->nla_len
);
421 na
= (struct nlattr
*) ((char *) na
+ len2
);
426 fprintf(stderr
, "Unknown nla_type %d\n",
430 na
= (struct nlattr
*) (GENLMSG_DATA(&msg
) + len
);
435 rc
= send_cmd(nl_sd
, id
, mypid
, TASKSTATS_CMD_GET
,
436 TASKSTATS_CMD_ATTR_DEREGISTER_CPUMASK
,
437 &cpumask
, strlen(cpumask
) + 1);
438 printf("Sent deregister mask, retval %d\n", rc
);
440 err(rc
, "error sending deregister cpumask\n");