3 * Copyright IBM Corp. 2002, 2011
4 * Author(s): Thomas Spatzier (tspat@de.ibm.com)
5 * Author(s): Mahesh Salgaonkar (mahesh@linux.vnet.ibm.com)
6 * Author(s): Heinz Graalfs (graalfs@linux.vnet.ibm.com)
7 * Author(s): Andreas Krebbel (krebbel@linux.vnet.ibm.com)
9 * @remark Copyright 2002-2011 OProfile authors
12 #include <linux/oprofile.h>
13 #include <linux/init.h>
14 #include <linux/errno.h>
16 #include <linux/module.h>
17 #include <asm/processor.h>
19 #include "../../../drivers/oprofile/oprof.h"
21 extern void s390_backtrace(struct pt_regs * const regs, unsigned int depth);
25 #include "hwsampler.h"
26 #include "op_counter.h"
/*
 * Defaults for the tunables below: the initial sampling interval and the
 * two buffer-size values that are later handed to hwsampler_allocate().
 */
28 #define DEFAULT_INTERVAL 4127518
30 #define DEFAULT_SDBT_BLOCKS 1
31 #define DEFAULT_SDB_BLOCKS 511
/*
 * Interval passed to hwsampler_start_all(). It is kept inside
 * [oprofile_min_interval, oprofile_max_interval]; both bounds are filled
 * in from the hwsampler_query_*_interval() calls during init.
 */
33 static unsigned long oprofile_hw_interval = DEFAULT_INTERVAL;
34 static unsigned long oprofile_min_interval;
35 static unsigned long oprofile_max_interval;
/* Arguments given to hwsampler_allocate() when sampling is started. */
37 static unsigned long oprofile_sdbt_blocks = DEFAULT_SDBT_BLOCKS;
38 static unsigned long oprofile_sdb_blocks = DEFAULT_SDB_BLOCKS;
/*
 * hwsampler_enabled is the mode requested through oprofilefs and
 * hwsampler_running is the copy latched when profiling starts.
 * hwsampler_available records whether oprofile_hwsampler_init() returned 0.
 */
40 static int hwsampler_enabled;
41 static int hwsampler_running; /* start_mutex must be held to change */
42 static int hwsampler_available;
/* Copy of the timer-mode operations taken during init, used as fallback. */
44 static struct oprofile_operations timer_ops;
/* Holds the kernel and user flags exposed through the 0/kernel and 0/user files. */
46 struct op_counter_config counter_config;
/*
 * Selector for overriding the reported cpu type. Zero means no override.
 * NOTE(review): the "timer" value assigned and compared elsewhere in this
 * file is presumably a further enumerator of this enum - confirm.
 */
48 enum __force_cpu_type {
49 reserved = 0, /* do not force */
/* Current override; written by set_cpu_type(), zero leaves the type unforced. */
52 static int force_cpu_type;
/*
 * Setter for the cpu_type module parameter. The string "timer" switches
 * force_cpu_type to the timer value and logs that choice.
 * NOTE(review): confirm what is returned and how other strings are handled.
 */
54 static int set_cpu_type(const char *str, struct kernel_param *kp)
56 if (!strcmp(str, "timer")) {
57 force_cpu_type = timer;
58 printk(KERN_INFO "oprofile: forcing timer to be returned "
/*
 * Register the cpu_type module parameter with set_cpu_type() as its setter.
 * The two description fragments are concatenated by the compiler, so the
 * first one must end in a space and the parenthesis must be closed.
 */
66 module_param_call(cpu_type, set_cpu_type, NULL, NULL, 0);
67 MODULE_PARM_DESC(cpu_type, "Force legacy basic mode sampling "
68 "(report cpu_type \"timer\")");
/*
 * Start profiling. hwsampler_running latches the current value of
 * hwsampler_enabled. When hardware sampling is not selected, the call is
 * forwarded to the saved timer_ops.start(). Otherwise the sampling buffers
 * are allocated from oprofile_sdbt_blocks/oprofile_sdb_blocks and sampling
 * is started through hwsampler_start_all() with oprofile_hw_interval.
 * NOTE(review): hwsampler_deallocate() looks like the cleanup for a failed
 * hwsampler_start_all() - confirm against the surrounding error checks.
 */
70 static int oprofile_hwsampler_start(void)
74 hwsampler_running = hwsampler_enabled;
76 if (!hwsampler_running)
77 return timer_ops.start();
79 retval = hwsampler_allocate(oprofile_sdbt_blocks, oprofile_sdb_blocks);
83 retval = hwsampler_start_all(oprofile_hw_interval);
85 hwsampler_deallocate();
/*
 * Stop profiling. The !hwsampler_running case is handled on its own path
 * (presumably by the timer-mode stop handler - TODO confirm); the hardware
 * sampling path releases the sampling buffers with hwsampler_deallocate().
 */
90 static void oprofile_hwsampler_stop(void)
92 if (!hwsampler_running) {
98 hwsampler_deallocate();
104 * /dev/oprofile/0/enabled
105 * /dev/oprofile/hwsampling/hwsampler (cpu_type = timer)
/* Read handler: reports the current hwsampler_enabled value to user space. */
108 static ssize_t hwsampler_read(struct file *file, char __user *buf,
109 size_t count, loff_t *offset)
111 return oprofilefs_ulong_to_user(hwsampler_enabled, buf, count, offset);
114 static ssize_t hwsampler_write(struct file *file, char const __user *buf,
115 size_t count, loff_t *offset)
123 retval = oprofilefs_ulong_from_user(&val, buf, count);
127 if (val != 0 && val != 1)
130 if (oprofile_started)
132 * safe to do without locking as we set
133 * hwsampler_running in start() when start_mutex is
138 hwsampler_enabled = val;
/* File operations for the hardware sampling on/off switch (e.g. 0/enabled). */
143 static const struct file_operations hwsampler_fops = {
144 .read = hwsampler_read,
145 .write = hwsampler_write,
150 * /dev/oprofile/0/count
151 * /dev/oprofile/hwsampling/hw_interval (cpu_type = timer)
153 * Make sure that the value is within the hardware range.
/* Read handler: reports the current oprofile_hw_interval to user space. */
156 static ssize_t hw_interval_read(struct file *file, char __user *buf,
157 size_t count, loff_t *offset)
159 return oprofilefs_ulong_to_user(oprofile_hw_interval, buf,
/*
 * Write handler: parses an unsigned long from user space and stores it in
 * oprofile_hw_interval. Values below oprofile_min_interval or above
 * oprofile_max_interval are replaced by the respective bound rather than
 * being stored as written.
 */
163 static ssize_t hw_interval_write(struct file *file, char const __user *buf,
164 size_t count, loff_t *offset)
171 retval = oprofilefs_ulong_from_user(&val, buf, count);
174 if (val < oprofile_min_interval)
175 oprofile_hw_interval = oprofile_min_interval;
176 else if (val > oprofile_max_interval)
177 oprofile_hw_interval = oprofile_max_interval;
179 oprofile_hw_interval = val;
/* File operations for the sampling interval file (e.g. 0/count). */
184 static const struct file_operations hw_interval_fops = {
185 .read = hw_interval_read,
186 .write = hw_interval_write,
191 * /dev/oprofile/0/event
192 * Only a single event with number 0 is supported with this counter.
194 * /dev/oprofile/0/unit_mask
195 * This is a dummy file needed by the user space tools.
196 * No value other than 0 is accepted or returned.
/* Read handler for the dummy files: always reports the constant 0. */
199 static ssize_t hwsampler_zero_read(struct file *file, char __user *buf,
200 size_t count, loff_t *offset)
202 return oprofilefs_ulong_to_user(0, buf, count, offset);
/*
 * Write handler for the dummy files: parses an unsigned long from user
 * space. NOTE(review): the file comment says only 0 is accepted - confirm
 * the check that enforces this.
 */
205 static ssize_t hwsampler_zero_write(struct file *file, char const __user *buf,
206 size_t count, loff_t *offset)
214 retval = oprofilefs_ulong_from_user(&val, buf, count);
/* File operations shared by the dummy 0/event and 0/unit_mask files. */
222 static const struct file_operations zero_fops = {
223 .read = hwsampler_zero_read,
224 .write = hwsampler_zero_write,
227 /* /dev/oprofile/0/kernel file ops. */
/* Read handler: reports counter_config.kernel to user space. */
229 static ssize_t hwsampler_kernel_read(struct file *file, char __user *buf,
230 size_t count, loff_t *offset)
232 return oprofilefs_ulong_to_user(counter_config.kernel,
/*
 * Write handler: parses an unsigned long from user space and stores it in
 * counter_config.kernel. Values other than 0 and 1 are singled out by the
 * range check (presumably rejected - TODO confirm the error returned).
 */
236 static ssize_t hwsampler_kernel_write(struct file *file, char const __user *buf,
237 size_t count, loff_t *offset)
245 retval = oprofilefs_ulong_from_user(&val, buf, count);
249 if (val != 0 && val != 1)
252 counter_config.kernel = val;
/* File operations for the 0/kernel file. */
257 static const struct file_operations kernel_fops = {
258 .read = hwsampler_kernel_read,
259 .write = hwsampler_kernel_write,
262 /* /dev/oprofile/0/user file ops. */
/* Read handler: reports counter_config.user to user space. */
264 static ssize_t hwsampler_user_read(struct file *file, char __user *buf,
265 size_t count, loff_t *offset)
267 return oprofilefs_ulong_to_user(counter_config.user,
/*
 * Write handler: parses an unsigned long from user space and stores it in
 * counter_config.user. Values other than 0 and 1 are singled out by the
 * range check (presumably rejected - TODO confirm the error returned).
 */
271 static ssize_t hwsampler_user_write(struct file *file, char const __user *buf,
272 size_t count, loff_t *offset)
280 retval = oprofilefs_ulong_from_user(&val, buf, count);
284 if (val != 0 && val != 1)
287 counter_config.user = val;
/* File operations for the 0/user file. */
292 static const struct file_operations user_fops = {
293 .read = hwsampler_user_read,
294 .write = hwsampler_user_write,
299 * File ops used for: /dev/oprofile/timer/enabled
300 * The value always has to be the inverted value of hwsampler_enabled. So
301 * no separate variable is created. That way we do not need locking.
/*
 * Read handler: reports the logical inverse of hwsampler_enabled, i.e. 1
 * when timer mode is selected and 0 when hardware sampling is selected.
 */
304 static ssize_t timer_enabled_read(struct file *file, char __user *buf,
305 size_t count, loff_t *offset)
307 return oprofilefs_ulong_to_user(!hwsampler_enabled, buf, count, offset);
310 static ssize_t timer_enabled_write(struct file *file, char const __user *buf,
311 size_t count, loff_t *offset)
319 retval = oprofilefs_ulong_from_user(&val, buf, count);
323 if (val != 0 && val != 1)
326 /* Timer cannot be disabled without having hardware sampling. */
327 if (val == 0 && !hwsampler_available)
330 if (oprofile_started)
332 * safe to do without locking as we set
333 * hwsampler_running in start() when start_mutex is
338 hwsampler_enabled = !val;
/* File operations for the timer/enabled file. */
343 static const struct file_operations timer_enabled_fops = {
344 .read = timer_enabled_read,
345 .write = timer_enabled_write,
/*
 * Populate the oprofilefs tree for this architecture.
 *
 * The timer/enabled file is always created. The rest depends on
 * hwsampler_available (NOTE(review): the !hwsampler_available case
 * presumably returns early - confirm). With hardware sampling available,
 * hwsampler_enabled and the counter_config kernel/user flags are reset to
 * 1, and one of two layouts is created:
 *  - cpu type not forced: a virtual counter directory "0" with the files
 *    enabled, event, count, unit_mask, kernel, user and hw_sdbt_blocks;
 *  - otherwise: a "hwsampling" directory with hwsampler, hw_interval, the
 *    read-only hw_min_interval/hw_max_interval and hw_sdbt_blocks.
 */
349 static int oprofile_create_hwsampling_files(struct super_block *sb,
354 dir = oprofilefs_mkdir(sb, root, "timer");
358 oprofilefs_create_file(sb, dir, "enabled", &timer_enabled_fops);
360 if (!hwsampler_available)
363 /* reinitialize default values */
364 hwsampler_enabled = 1;
365 counter_config.kernel = 1;
366 counter_config.user = 1;
368 if (!force_cpu_type) {
370 * Create the counter file system. A single virtual
371 * counter is created which can be used to
372 * enable/disable hardware sampling dynamically from
373 * user space. The user space will configure a single
374 * counter with a single event. The value of 'event'
375 * and 'unit_mask' are not evaluated by the kernel code
376 * and can only be set to 0.
379 dir = oprofilefs_mkdir(sb, root, "0");
383 oprofilefs_create_file(sb, dir, "enabled", &hwsampler_fops);
384 oprofilefs_create_file(sb, dir, "event", &zero_fops);
385 oprofilefs_create_file(sb, dir, "count", &hw_interval_fops);
386 oprofilefs_create_file(sb, dir, "unit_mask", &zero_fops);
387 oprofilefs_create_file(sb, dir, "kernel", &kernel_fops);
388 oprofilefs_create_file(sb, dir, "user", &user_fops);
389 oprofilefs_create_ulong(sb, dir, "hw_sdbt_blocks",
390 &oprofile_sdbt_blocks);
394 * Hardware sampling can be used but the cpu_type is
395 * forced to timer in order to deal with legacy user
396 * space tools. The /dev/oprofile/hwsampling fs is
397 * provided in that case.
399 dir = oprofilefs_mkdir(sb, root, "hwsampling");
403 oprofilefs_create_file(sb, dir, "hwsampler",
405 oprofilefs_create_file(sb, dir, "hw_interval",
407 oprofilefs_create_ro_ulong(sb, dir, "hw_min_interval",
408 &oprofile_min_interval);
409 oprofilefs_create_ro_ulong(sb, dir, "hw_max_interval",
410 &oprofile_max_interval);
411 oprofilefs_create_ulong(sb, dir, "hw_sdbt_blocks",
412 &oprofile_sdbt_blocks);
/*
 * Set up hardware sampling on top of the timer mode.
 *
 * Steps, in order:
 *  1. Initialize timer mode through oprofile_timer_init() and keep a copy
 *     of the resulting operations in timer_ops for later fallback.
 *  2. Install oprofile_create_hwsampling_files() as the create_files hook.
 *  3. Unless the cpu type is forced to timer, choose ops->cpu_type from
 *     id.machine (z10, z196 or zEC12); unknown machines yield -ENODEV.
 *  4. Call hwsampler_setup() and query the minimum and maximum sampling
 *     interval. A result of 0 from either query is checked for
 *     (NOTE(review): presumably treated as failure - confirm).
 *  5. Clamp oprofile_hw_interval into the queried range.
 *  6. Install the hardware-sampling start and stop handlers.
 *
 * NOTE(review): the value returned on the failing checks other than the
 * -ENODEV in the machine switch should be confirmed.
 */
417 static int oprofile_hwsampler_init(struct oprofile_operations *ops)
420 * Initialize the timer mode infrastructure as well in order
421 * to be able to switch back dynamically. oprofile_timer_init
422 * is not supposed to fail.
424 if (oprofile_timer_init(ops))
427 memcpy(&timer_ops, ops, sizeof(timer_ops));
428 ops->create_files = oprofile_create_hwsampling_files;
431 * If the user space tools do not support newer cpu types,
432 * the force_cpu_type module parameter
433 * can be used to always return \"timer\" as cpu type.
435 if (force_cpu_type != timer) {
440 switch (id.machine) {
441 case 0x2097: case 0x2098: ops->cpu_type = "s390/z10"; break;
442 case 0x2817: case 0x2818: ops->cpu_type = "s390/z196"; break;
443 case 0x2827: ops->cpu_type = "s390/zEC12"; break;
444 default: return -ENODEV;
448 if (hwsampler_setup())
452 * Query the range for the sampling interval from the
455 oprofile_min_interval = hwsampler_query_min_interval();
456 if (oprofile_min_interval == 0)
458 oprofile_max_interval = hwsampler_query_max_interval();
459 if (oprofile_max_interval == 0)
462 /* The initial value should be sane */
463 if (oprofile_hw_interval < oprofile_min_interval)
464 oprofile_hw_interval = oprofile_min_interval;
465 if (oprofile_hw_interval > oprofile_max_interval)
466 oprofile_hw_interval = oprofile_max_interval;
468 printk(KERN_INFO "oprofile: System z hardware sampling "
469 "facility found.\n");
471 ops->start = oprofile_hwsampler_start;
472 ops->stop = oprofile_hwsampler_stop;
/* Tear down hardware sampling by calling hwsampler_shutdown(). */
477 static void oprofile_hwsampler_exit(void)
479 hwsampler_shutdown();
482 #endif /* CONFIG_64BIT */
/*
 * Architecture init hook for oprofile. Installs s390_backtrace as the
 * backtrace handler and records in hwsampler_available whether
 * oprofile_hwsampler_init() returned 0; a failure there is not passed on
 * as-is, since timer mode serves as the fallback.
 */
484 int __init oprofile_arch_init(struct oprofile_operations *ops)
486 ops->backtrace = s390_backtrace;
491 * -ENODEV is not reported to the caller. The module itself
492 * will use the timer mode sampling as fallback and this is
495 hwsampler_available = oprofile_hwsampler_init(ops) == 0;
/* Architecture exit hook for oprofile: shuts hardware sampling down. */
503 void oprofile_arch_exit(void)
506 oprofile_hwsampler_exit();