123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514 |
- /*
- * S390 Version
- * Copyright IBM Corp. 2002, 2011
- * Author(s): Thomas Spatzier (tspat@de.ibm.com)
- * Author(s): Mahesh Salgaonkar (mahesh@linux.vnet.ibm.com)
- * Author(s): Heinz Graalfs (graalfs@linux.vnet.ibm.com)
- * Author(s): Andreas Krebbel (krebbel@linux.vnet.ibm.com)
- *
- * @remark Copyright 2002-2011 OProfile authors
- */
- #include <linux/oprofile.h>
- #include <linux/perf_event.h>
- #include <linux/init.h>
- #include <linux/errno.h>
- #include <linux/fs.h>
- #include <linux/module.h>
- #include <asm/processor.h>
- #include <asm/perf_event.h>
- #include "../../../drivers/oprofile/oprof.h"
- extern void s390_backtrace(struct pt_regs * const regs, unsigned int depth);
- #include "hwsampler.h"
- #include "op_counter.h"
- #define DEFAULT_INTERVAL 4127518
- #define DEFAULT_SDBT_BLOCKS 1
- #define DEFAULT_SDB_BLOCKS 511
- static unsigned long oprofile_hw_interval = DEFAULT_INTERVAL;
- static unsigned long oprofile_min_interval;
- static unsigned long oprofile_max_interval;
- static unsigned long oprofile_sdbt_blocks = DEFAULT_SDBT_BLOCKS;
- static unsigned long oprofile_sdb_blocks = DEFAULT_SDB_BLOCKS;
- static int hwsampler_enabled;
- static int hwsampler_running; /* start_mutex must be held to change */
- static int hwsampler_available;
- static struct oprofile_operations timer_ops;
- struct op_counter_config counter_config;
- enum __force_cpu_type {
- reserved = 0, /* do not force */
- timer,
- };
- static int force_cpu_type;
- static int set_cpu_type(const char *str, struct kernel_param *kp)
- {
- if (!strcmp(str, "timer")) {
- force_cpu_type = timer;
- printk(KERN_INFO "oprofile: forcing timer to be returned "
- "as cpu type\n");
- } else {
- force_cpu_type = 0;
- }
- return 0;
- }
- module_param_call(cpu_type, set_cpu_type, NULL, NULL, 0);
- MODULE_PARM_DESC(cpu_type, "Force legacy basic mode sampling"
- "(report cpu_type \"timer\"");
- static int __oprofile_hwsampler_start(void)
- {
- int retval;
- retval = hwsampler_allocate(oprofile_sdbt_blocks, oprofile_sdb_blocks);
- if (retval)
- return retval;
- retval = hwsampler_start_all(oprofile_hw_interval);
- if (retval)
- hwsampler_deallocate();
- return retval;
- }
- static int oprofile_hwsampler_start(void)
- {
- int retval;
- hwsampler_running = hwsampler_enabled;
- if (!hwsampler_running)
- return timer_ops.start();
- retval = perf_reserve_sampling();
- if (retval)
- return retval;
- retval = __oprofile_hwsampler_start();
- if (retval)
- perf_release_sampling();
- return retval;
- }
- static void oprofile_hwsampler_stop(void)
- {
- if (!hwsampler_running) {
- timer_ops.stop();
- return;
- }
- hwsampler_stop_all();
- hwsampler_deallocate();
- perf_release_sampling();
- return;
- }
- /*
- * File ops used for:
- * /dev/oprofile/0/enabled
- * /dev/oprofile/hwsampling/hwsampler (cpu_type = timer)
- */
- static ssize_t hwsampler_read(struct file *file, char __user *buf,
- size_t count, loff_t *offset)
- {
- return oprofilefs_ulong_to_user(hwsampler_enabled, buf, count, offset);
- }
- static ssize_t hwsampler_write(struct file *file, char const __user *buf,
- size_t count, loff_t *offset)
- {
- unsigned long val;
- int retval;
- if (*offset)
- return -EINVAL;
- retval = oprofilefs_ulong_from_user(&val, buf, count);
- if (retval <= 0)
- return retval;
- if (val != 0 && val != 1)
- return -EINVAL;
- if (oprofile_started)
- /*
- * save to do without locking as we set
- * hwsampler_running in start() when start_mutex is
- * held
- */
- return -EBUSY;
- hwsampler_enabled = val;
- return count;
- }
- static const struct file_operations hwsampler_fops = {
- .read = hwsampler_read,
- .write = hwsampler_write,
- };
- /*
- * File ops used for:
- * /dev/oprofile/0/count
- * /dev/oprofile/hwsampling/hw_interval (cpu_type = timer)
- *
- * Make sure that the value is within the hardware range.
- */
- static ssize_t hw_interval_read(struct file *file, char __user *buf,
- size_t count, loff_t *offset)
- {
- return oprofilefs_ulong_to_user(oprofile_hw_interval, buf,
- count, offset);
- }
- static ssize_t hw_interval_write(struct file *file, char const __user *buf,
- size_t count, loff_t *offset)
- {
- unsigned long val;
- int retval;
- if (*offset)
- return -EINVAL;
- retval = oprofilefs_ulong_from_user(&val, buf, count);
- if (retval <= 0)
- return retval;
- if (val < oprofile_min_interval)
- oprofile_hw_interval = oprofile_min_interval;
- else if (val > oprofile_max_interval)
- oprofile_hw_interval = oprofile_max_interval;
- else
- oprofile_hw_interval = val;
- return count;
- }
- static const struct file_operations hw_interval_fops = {
- .read = hw_interval_read,
- .write = hw_interval_write,
- };
- /*
- * File ops used for:
- * /dev/oprofile/0/event
- * Only a single event with number 0 is supported with this counter.
- *
- * /dev/oprofile/0/unit_mask
- * This is a dummy file needed by the user space tools.
- * No value other than 0 is accepted or returned.
- */
- static ssize_t hwsampler_zero_read(struct file *file, char __user *buf,
- size_t count, loff_t *offset)
- {
- return oprofilefs_ulong_to_user(0, buf, count, offset);
- }
- static ssize_t hwsampler_zero_write(struct file *file, char const __user *buf,
- size_t count, loff_t *offset)
- {
- unsigned long val;
- int retval;
- if (*offset)
- return -EINVAL;
- retval = oprofilefs_ulong_from_user(&val, buf, count);
- if (retval <= 0)
- return retval;
- if (val != 0)
- return -EINVAL;
- return count;
- }
- static const struct file_operations zero_fops = {
- .read = hwsampler_zero_read,
- .write = hwsampler_zero_write,
- };
- /* /dev/oprofile/0/kernel file ops. */
- static ssize_t hwsampler_kernel_read(struct file *file, char __user *buf,
- size_t count, loff_t *offset)
- {
- return oprofilefs_ulong_to_user(counter_config.kernel,
- buf, count, offset);
- }
- static ssize_t hwsampler_kernel_write(struct file *file, char const __user *buf,
- size_t count, loff_t *offset)
- {
- unsigned long val;
- int retval;
- if (*offset)
- return -EINVAL;
- retval = oprofilefs_ulong_from_user(&val, buf, count);
- if (retval <= 0)
- return retval;
- if (val != 0 && val != 1)
- return -EINVAL;
- counter_config.kernel = val;
- return count;
- }
- static const struct file_operations kernel_fops = {
- .read = hwsampler_kernel_read,
- .write = hwsampler_kernel_write,
- };
- /* /dev/oprofile/0/user file ops. */
- static ssize_t hwsampler_user_read(struct file *file, char __user *buf,
- size_t count, loff_t *offset)
- {
- return oprofilefs_ulong_to_user(counter_config.user,
- buf, count, offset);
- }
- static ssize_t hwsampler_user_write(struct file *file, char const __user *buf,
- size_t count, loff_t *offset)
- {
- unsigned long val;
- int retval;
- if (*offset)
- return -EINVAL;
- retval = oprofilefs_ulong_from_user(&val, buf, count);
- if (retval <= 0)
- return retval;
- if (val != 0 && val != 1)
- return -EINVAL;
- counter_config.user = val;
- return count;
- }
- static const struct file_operations user_fops = {
- .read = hwsampler_user_read,
- .write = hwsampler_user_write,
- };
- /*
- * File ops used for: /dev/oprofile/timer/enabled
- * The value always has to be the inverted value of hwsampler_enabled. So
- * no separate variable is created. That way we do not need locking.
- */
- static ssize_t timer_enabled_read(struct file *file, char __user *buf,
- size_t count, loff_t *offset)
- {
- return oprofilefs_ulong_to_user(!hwsampler_enabled, buf, count, offset);
- }
- static ssize_t timer_enabled_write(struct file *file, char const __user *buf,
- size_t count, loff_t *offset)
- {
- unsigned long val;
- int retval;
- if (*offset)
- return -EINVAL;
- retval = oprofilefs_ulong_from_user(&val, buf, count);
- if (retval <= 0)
- return retval;
- if (val != 0 && val != 1)
- return -EINVAL;
- /* Timer cannot be disabled without having hardware sampling. */
- if (val == 0 && !hwsampler_available)
- return -EINVAL;
- if (oprofile_started)
- /*
- * save to do without locking as we set
- * hwsampler_running in start() when start_mutex is
- * held
- */
- return -EBUSY;
- hwsampler_enabled = !val;
- return count;
- }
- static const struct file_operations timer_enabled_fops = {
- .read = timer_enabled_read,
- .write = timer_enabled_write,
- };
- static int oprofile_create_hwsampling_files(struct dentry *root)
- {
- struct dentry *dir;
- dir = oprofilefs_mkdir(root, "timer");
- if (!dir)
- return -EINVAL;
- oprofilefs_create_file(dir, "enabled", &timer_enabled_fops);
- if (!hwsampler_available)
- return 0;
- /* reinitialize default values */
- hwsampler_enabled = 1;
- counter_config.kernel = 1;
- counter_config.user = 1;
- if (!force_cpu_type) {
- /*
- * Create the counter file system. A single virtual
- * counter is created which can be used to
- * enable/disable hardware sampling dynamically from
- * user space. The user space will configure a single
- * counter with a single event. The value of 'event'
- * and 'unit_mask' are not evaluated by the kernel code
- * and can only be set to 0.
- */
- dir = oprofilefs_mkdir(root, "0");
- if (!dir)
- return -EINVAL;
- oprofilefs_create_file(dir, "enabled", &hwsampler_fops);
- oprofilefs_create_file(dir, "event", &zero_fops);
- oprofilefs_create_file(dir, "count", &hw_interval_fops);
- oprofilefs_create_file(dir, "unit_mask", &zero_fops);
- oprofilefs_create_file(dir, "kernel", &kernel_fops);
- oprofilefs_create_file(dir, "user", &user_fops);
- oprofilefs_create_ulong(dir, "hw_sdbt_blocks",
- &oprofile_sdbt_blocks);
- } else {
- /*
- * Hardware sampling can be used but the cpu_type is
- * forced to timer in order to deal with legacy user
- * space tools. The /dev/oprofile/hwsampling fs is
- * provided in that case.
- */
- dir = oprofilefs_mkdir(root, "hwsampling");
- if (!dir)
- return -EINVAL;
- oprofilefs_create_file(dir, "hwsampler",
- &hwsampler_fops);
- oprofilefs_create_file(dir, "hw_interval",
- &hw_interval_fops);
- oprofilefs_create_ro_ulong(dir, "hw_min_interval",
- &oprofile_min_interval);
- oprofilefs_create_ro_ulong(dir, "hw_max_interval",
- &oprofile_max_interval);
- oprofilefs_create_ulong(dir, "hw_sdbt_blocks",
- &oprofile_sdbt_blocks);
- }
- return 0;
- }
- static int oprofile_hwsampler_init(struct oprofile_operations *ops)
- {
- /*
- * Initialize the timer mode infrastructure as well in order
- * to be able to switch back dynamically. oprofile_timer_init
- * is not supposed to fail.
- */
- if (oprofile_timer_init(ops))
- BUG();
- memcpy(&timer_ops, ops, sizeof(timer_ops));
- ops->create_files = oprofile_create_hwsampling_files;
- /*
- * If the user space tools do not support newer cpu types,
- * the force_cpu_type module parameter
- * can be used to always return \"timer\" as cpu type.
- */
- if (force_cpu_type != timer) {
- struct cpuid id;
- get_cpu_id (&id);
- switch (id.machine) {
- case 0x2097: case 0x2098: ops->cpu_type = "s390/z10"; break;
- case 0x2817: case 0x2818: ops->cpu_type = "s390/z196"; break;
- case 0x2827: case 0x2828: ops->cpu_type = "s390/zEC12"; break;
- default: return -ENODEV;
- }
- }
- if (hwsampler_setup())
- return -ENODEV;
- /*
- * Query the range for the sampling interval from the
- * hardware.
- */
- oprofile_min_interval = hwsampler_query_min_interval();
- if (oprofile_min_interval == 0)
- return -ENODEV;
- oprofile_max_interval = hwsampler_query_max_interval();
- if (oprofile_max_interval == 0)
- return -ENODEV;
- /* The initial value should be sane */
- if (oprofile_hw_interval < oprofile_min_interval)
- oprofile_hw_interval = oprofile_min_interval;
- if (oprofile_hw_interval > oprofile_max_interval)
- oprofile_hw_interval = oprofile_max_interval;
- printk(KERN_INFO "oprofile: System z hardware sampling "
- "facility found.\n");
- ops->start = oprofile_hwsampler_start;
- ops->stop = oprofile_hwsampler_stop;
- return 0;
- }
- static void oprofile_hwsampler_exit(void)
- {
- hwsampler_shutdown();
- }
- int __init oprofile_arch_init(struct oprofile_operations *ops)
- {
- ops->backtrace = s390_backtrace;
- /*
- * -ENODEV is not reported to the caller. The module itself
- * will use the timer mode sampling as fallback and this is
- * always available.
- */
- hwsampler_available = oprofile_hwsampler_init(ops) == 0;
- return 0;
- }
- void oprofile_arch_exit(void)
- {
- oprofile_hwsampler_exit();
- }
|