2 * arch/s390/oprofile/init.c
5 * Copyright (C) 2002-2011 IBM Deutschland Entwicklung GmbH, IBM Corporation
6 * Author(s): Thomas Spatzier (tspat@de.ibm.com)
7 * Author(s): Mahesh Salgaonkar (mahesh@linux.vnet.ibm.com)
8 * Author(s): Heinz Graalfs (graalfs@linux.vnet.ibm.com)
9 * Author(s): Andreas Krebbel (krebbel@linux.vnet.ibm.com)
11 * @remark Copyright 2002-2011 OProfile authors
14 #include <linux/oprofile.h>
15 #include <linux/init.h>
16 #include <linux/errno.h>
18 #include <linux/module.h>
19 #include <asm/processor.h>
21 #include "../../../drivers/oprofile/oprof.h"
/*
 * Backtrace routine defined outside this file. oprofile_arch_init()
 * installs it as the ->backtrace operation.
 */
void s390_backtrace(struct pt_regs * const regs, unsigned int depth);
27 #include "hwsampler.h"
28 #include "op_counter.h"
/* Initial value of oprofile_hw_interval. */
#define DEFAULT_INTERVAL	4127518

/* Initial values of oprofile_sdbt_blocks and oprofile_sdb_blocks. */
#define DEFAULT_SDBT_BLOCKS	1
#define DEFAULT_SDB_BLOCKS	511

/*
 * Sampling interval handed to hwsampler_start_all(). It is clamped to
 * [oprofile_min_interval, oprofile_max_interval] at init time and
 * whenever user space writes a new value.
 */
static unsigned long oprofile_hw_interval = DEFAULT_INTERVAL;
/* Interval limits, filled in from hwsampler_query_{min,max}_interval(). */
static unsigned long oprofile_min_interval;
static unsigned long oprofile_max_interval;

/* Block counts handed to hwsampler_allocate(). */
static unsigned long oprofile_sdbt_blocks = DEFAULT_SDBT_BLOCKS;
static unsigned long oprofile_sdb_blocks = DEFAULT_SDB_BLOCKS;

/* Whether user space asked for hardware sampling (0 or 1). */
static int hwsampler_enabled;
/* Snapshot of hwsampler_enabled taken in start(). */
static int hwsampler_running;	/* start_mutex must be held to change */
/* Non-zero when oprofile_hwsampler_init() succeeded. */
static int hwsampler_available;
46 static struct oprofile_operations timer_ops
;
48 struct op_counter_config counter_config
;
50 enum __force_cpu_type
{
51 reserved
= 0, /* do not force */
/*
 * Requested cpu type override. Zero (reserved) means "do not force";
 * set_cpu_type() stores timer here when the parameter string is "timer".
 */
static int force_cpu_type;
56 static int set_cpu_type(const char *str
, struct kernel_param
*kp
)
58 if (!strcmp(str
, "timer")) {
59 force_cpu_type
= timer
;
60 printk(KERN_INFO
"oprofile: forcing timer to be returned "
68 module_param_call(cpu_type
, set_cpu_type
, NULL
, NULL
, 0);
69 MODULE_PARM_DESC(cpu_type
, "Force legacy basic mode sampling"
70 "(report cpu_type \"timer\"");
72 static int oprofile_hwsampler_start(void)
76 hwsampler_running
= hwsampler_enabled
;
78 if (!hwsampler_running
)
79 return timer_ops
.start();
81 retval
= hwsampler_allocate(oprofile_sdbt_blocks
, oprofile_sdb_blocks
);
85 retval
= hwsampler_start_all(oprofile_hw_interval
);
87 hwsampler_deallocate();
92 static void oprofile_hwsampler_stop(void)
94 if (!hwsampler_running
) {
100 hwsampler_deallocate();
106 * /dev/oprofile/0/enabled
107 * /dev/oprofile/hwsampling/hwsampler (cpu_type = timer)
110 static ssize_t
hwsampler_read(struct file
*file
, char __user
*buf
,
111 size_t count
, loff_t
*offset
)
113 return oprofilefs_ulong_to_user(hwsampler_enabled
, buf
, count
, offset
);
116 static ssize_t
hwsampler_write(struct file
*file
, char const __user
*buf
,
117 size_t count
, loff_t
*offset
)
125 retval
= oprofilefs_ulong_from_user(&val
, buf
, count
);
129 if (val
!= 0 && val
!= 1)
132 if (oprofile_started
)
	/*
	 * Safe to do without locking as we set
	 * hwsampler_running in start() when start_mutex is
	 * held.
	 */
140 hwsampler_enabled
= val
;
145 static const struct file_operations hwsampler_fops
= {
146 .read
= hwsampler_read
,
147 .write
= hwsampler_write
,
152 * /dev/oprofile/0/count
153 * /dev/oprofile/hwsampling/hw_interval (cpu_type = timer)
155 * Make sure that the value is within the hardware range.
158 static ssize_t
hw_interval_read(struct file
*file
, char __user
*buf
,
159 size_t count
, loff_t
*offset
)
161 return oprofilefs_ulong_to_user(oprofile_hw_interval
, buf
,
165 static ssize_t
hw_interval_write(struct file
*file
, char const __user
*buf
,
166 size_t count
, loff_t
*offset
)
173 retval
= oprofilefs_ulong_from_user(&val
, buf
, count
);
176 if (val
< oprofile_min_interval
)
177 oprofile_hw_interval
= oprofile_min_interval
;
178 else if (val
> oprofile_max_interval
)
179 oprofile_hw_interval
= oprofile_max_interval
;
181 oprofile_hw_interval
= val
;
186 static const struct file_operations hw_interval_fops
= {
187 .read
= hw_interval_read
,
188 .write
= hw_interval_write
,
193 * /dev/oprofile/0/event
194 * Only a single event with number 0 is supported with this counter.
196 * /dev/oprofile/0/unit_mask
197 * This is a dummy file needed by the user space tools.
198 * No value other than 0 is accepted or returned.
201 static ssize_t
hwsampler_zero_read(struct file
*file
, char __user
*buf
,
202 size_t count
, loff_t
*offset
)
204 return oprofilefs_ulong_to_user(0, buf
, count
, offset
);
207 static ssize_t
hwsampler_zero_write(struct file
*file
, char const __user
*buf
,
208 size_t count
, loff_t
*offset
)
216 retval
= oprofilefs_ulong_from_user(&val
, buf
, count
);
224 static const struct file_operations zero_fops
= {
225 .read
= hwsampler_zero_read
,
226 .write
= hwsampler_zero_write
,
229 /* /dev/oprofile/0/kernel file ops. */
231 static ssize_t
hwsampler_kernel_read(struct file
*file
, char __user
*buf
,
232 size_t count
, loff_t
*offset
)
234 return oprofilefs_ulong_to_user(counter_config
.kernel
,
238 static ssize_t
hwsampler_kernel_write(struct file
*file
, char const __user
*buf
,
239 size_t count
, loff_t
*offset
)
247 retval
= oprofilefs_ulong_from_user(&val
, buf
, count
);
251 if (val
!= 0 && val
!= 1)
254 counter_config
.kernel
= val
;
259 static const struct file_operations kernel_fops
= {
260 .read
= hwsampler_kernel_read
,
261 .write
= hwsampler_kernel_write
,
264 /* /dev/oprofile/0/user file ops. */
266 static ssize_t
hwsampler_user_read(struct file
*file
, char __user
*buf
,
267 size_t count
, loff_t
*offset
)
269 return oprofilefs_ulong_to_user(counter_config
.user
,
273 static ssize_t
hwsampler_user_write(struct file
*file
, char const __user
*buf
,
274 size_t count
, loff_t
*offset
)
282 retval
= oprofilefs_ulong_from_user(&val
, buf
, count
);
286 if (val
!= 0 && val
!= 1)
289 counter_config
.user
= val
;
294 static const struct file_operations user_fops
= {
295 .read
= hwsampler_user_read
,
296 .write
= hwsampler_user_write
,
301 * File ops used for: /dev/oprofile/timer/enabled
302 * The value always has to be the inverted value of hwsampler_enabled. So
303 * no separate variable is created. That way we do not need locking.
306 static ssize_t
timer_enabled_read(struct file
*file
, char __user
*buf
,
307 size_t count
, loff_t
*offset
)
309 return oprofilefs_ulong_to_user(!hwsampler_enabled
, buf
, count
, offset
);
312 static ssize_t
timer_enabled_write(struct file
*file
, char const __user
*buf
,
313 size_t count
, loff_t
*offset
)
321 retval
= oprofilefs_ulong_from_user(&val
, buf
, count
);
325 if (val
!= 0 && val
!= 1)
328 /* Timer cannot be disabled without having hardware sampling. */
329 if (val
== 0 && !hwsampler_available
)
332 if (oprofile_started
)
	/*
	 * Safe to do without locking as we set
	 * hwsampler_running in start() when start_mutex is
	 * held.
	 */
340 hwsampler_enabled
= !val
;
345 static const struct file_operations timer_enabled_fops
= {
346 .read
= timer_enabled_read
,
347 .write
= timer_enabled_write
,
351 static int oprofile_create_hwsampling_files(struct super_block
*sb
,
356 dir
= oprofilefs_mkdir(sb
, root
, "timer");
360 oprofilefs_create_file(sb
, dir
, "enabled", &timer_enabled_fops
);
362 if (!hwsampler_available
)
365 /* reinitialize default values */
366 hwsampler_enabled
= 1;
367 counter_config
.kernel
= 1;
368 counter_config
.user
= 1;
370 if (!force_cpu_type
) {
372 * Create the counter file system. A single virtual
373 * counter is created which can be used to
374 * enable/disable hardware sampling dynamically from
375 * user space. The user space will configure a single
376 * counter with a single event. The value of 'event'
377 * and 'unit_mask' are not evaluated by the kernel code
378 * and can only be set to 0.
381 dir
= oprofilefs_mkdir(sb
, root
, "0");
385 oprofilefs_create_file(sb
, dir
, "enabled", &hwsampler_fops
);
386 oprofilefs_create_file(sb
, dir
, "event", &zero_fops
);
387 oprofilefs_create_file(sb
, dir
, "count", &hw_interval_fops
);
388 oprofilefs_create_file(sb
, dir
, "unit_mask", &zero_fops
);
389 oprofilefs_create_file(sb
, dir
, "kernel", &kernel_fops
);
390 oprofilefs_create_file(sb
, dir
, "user", &user_fops
);
391 oprofilefs_create_ulong(sb
, dir
, "hw_sdbt_blocks",
392 &oprofile_sdbt_blocks
);
396 * Hardware sampling can be used but the cpu_type is
397 * forced to timer in order to deal with legacy user
398 * space tools. The /dev/oprofile/hwsampling fs is
399 * provided in that case.
401 dir
= oprofilefs_mkdir(sb
, root
, "hwsampling");
405 oprofilefs_create_file(sb
, dir
, "hwsampler",
407 oprofilefs_create_file(sb
, dir
, "hw_interval",
409 oprofilefs_create_ro_ulong(sb
, dir
, "hw_min_interval",
410 &oprofile_min_interval
);
411 oprofilefs_create_ro_ulong(sb
, dir
, "hw_max_interval",
412 &oprofile_max_interval
);
413 oprofilefs_create_ulong(sb
, dir
, "hw_sdbt_blocks",
414 &oprofile_sdbt_blocks
);
419 static int oprofile_hwsampler_init(struct oprofile_operations
*ops
)
422 * Initialize the timer mode infrastructure as well in order
423 * to be able to switch back dynamically. oprofile_timer_init
424 * is not supposed to fail.
426 if (oprofile_timer_init(ops
))
429 memcpy(&timer_ops
, ops
, sizeof(timer_ops
));
430 ops
->create_files
= oprofile_create_hwsampling_files
;
	/*
	 * If the user space tools do not support newer cpu types,
	 * the cpu_type module parameter (stored in force_cpu_type)
	 * can be used to always return "timer" as cpu type.
	 */
437 if (force_cpu_type
!= timer
) {
442 switch (id
.machine
) {
443 case 0x2097: case 0x2098: ops
->cpu_type
= "s390/z10"; break;
444 case 0x2817: case 0x2818: ops
->cpu_type
= "s390/z196"; break;
445 default: return -ENODEV
;
449 if (hwsampler_setup())
453 * Query the range for the sampling interval from the
456 oprofile_min_interval
= hwsampler_query_min_interval();
457 if (oprofile_min_interval
== 0)
459 oprofile_max_interval
= hwsampler_query_max_interval();
460 if (oprofile_max_interval
== 0)
463 /* The initial value should be sane */
464 if (oprofile_hw_interval
< oprofile_min_interval
)
465 oprofile_hw_interval
= oprofile_min_interval
;
466 if (oprofile_hw_interval
> oprofile_max_interval
)
467 oprofile_hw_interval
= oprofile_max_interval
;
469 printk(KERN_INFO
"oprofile: System z hardware sampling "
470 "facility found.\n");
472 ops
->start
= oprofile_hwsampler_start
;
473 ops
->stop
= oprofile_hwsampler_stop
;
478 static void oprofile_hwsampler_exit(void)
480 hwsampler_shutdown();
483 #endif /* CONFIG_64BIT */
485 int __init
oprofile_arch_init(struct oprofile_operations
*ops
)
487 ops
->backtrace
= s390_backtrace
;
492 * -ENODEV is not reported to the caller. The module itself
493 * will use the timer mode sampling as fallback and this is
496 hwsampler_available
= oprofile_hwsampler_init(ops
) == 0;
504 void oprofile_arch_exit(void)
507 oprofile_hwsampler_exit();