2 * drivers/misc/tegra-profiler/main.c
4 * Copyright (c) 2014, NVIDIA CORPORATION. All rights reserved.
6 * This program is free software; you can redistribute it and/or modify it
7 * under the terms and conditions of the GNU General Public License,
8 * version 2, as published by the Free Software Foundation.
10 * This program is distributed in the hope it will be useful, but WITHOUT
11 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
12 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
17 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
19 #include <linux/init.h>
20 #include <linux/module.h>
21 #include <linux/err.h>
22 #include <linux/sched.h>
24 #include <linux/tegra_profiler.h>
33 #include "power_clk.h"
36 #include "quadd_proc.h"
37 #include "eh_unwind.h"
40 #include "armv8_pmu.h"
42 #include "armv7_pmu.h"
45 #ifdef CONFIG_CACHE_L2X0
49 static struct quadd_ctx ctx;
51 static int get_default_properties(void)
54 ctx.param.ma_freq = 50;
55 ctx.param.backtrace = 1;
56 ctx.param.use_freq = 1;
57 ctx.param.system_wide = 1;
58 ctx.param.power_rate_freq = 0;
59 ctx.param.debug_samples = 0;
61 ctx.param.pids[0] = 0;
62 ctx.param.nr_pids = 1;
67 int tegra_profiler_try_lock(void)
69 return atomic_cmpxchg(&ctx.tegra_profiler_lock, 0, 1);
71 EXPORT_SYMBOL_GPL(tegra_profiler_try_lock);
73 void tegra_profiler_unlock(void)
75 atomic_set(&ctx.tegra_profiler_lock, 0);
77 EXPORT_SYMBOL_GPL(tegra_profiler_unlock);
79 static int start(void)
83 if (tegra_profiler_try_lock()) {
84 pr_err("Error: tegra_profiler lock\n");
88 if (!atomic_cmpxchg(&ctx.started, 0, 1)) {
90 err = ctx.pmu->enable();
92 pr_err("error: pmu enable\n");
98 err = ctx.pl310->enable();
100 pr_err("error: pl310 enable\n");
107 err = quadd_power_clk_start();
109 pr_err("error: power_clk start\n");
113 err = quadd_hrt_start();
115 pr_err("error: hrt start\n");
123 atomic_set(&ctx.started, 0);
124 tegra_profiler_unlock();
128 static void stop(void)
130 if (atomic_cmpxchg(&ctx.started, 1, 0)) {
135 quadd_power_clk_stop();
142 ctx.pl310->disable();
144 tegra_profiler_unlock();
148 static inline int is_event_supported(struct source_info *si, int event)
151 int nr = si->nr_supported_events;
152 int *events = si->supported_events;
154 for (i = 0; i < nr; i++) {
155 if (event == events[i])
162 validate_freq(unsigned int freq)
164 if (capable(CAP_SYS_ADMIN))
165 return freq >= 100 && freq <= 100000;
167 return freq == 100 || freq == 1000 || freq == 10000;
171 set_parameters(struct quadd_parameters *p, uid_t *debug_app_uid)
174 int pmu_events_id[QUADD_MAX_COUNTERS];
176 int nr_pmu = 0, nr_pl310 = 0;
178 struct task_struct *task;
181 if (!validate_freq(p->freq)) {
182 pr_err("%s: incorrect frequency: %u", __func__, p->freq);
186 ctx.param.freq = p->freq;
187 ctx.param.ma_freq = p->ma_freq;
188 ctx.param.backtrace = p->backtrace;
189 ctx.param.use_freq = p->use_freq;
190 ctx.param.system_wide = p->system_wide;
191 ctx.param.power_rate_freq = p->power_rate_freq;
192 ctx.param.debug_samples = p->debug_samples;
194 for (i = 0; i < ARRAY_SIZE(p->reserved); i++)
195 ctx.param.reserved[i] = p->reserved[i];
197 /* Currently only one process */
202 task = pid_task(find_vpid(p->pids[0]), PIDTYPE_PID);
205 pr_err("Process not found: %u\n", p->pids[0]);
209 pr_info("owner/task uids: %u/%u\n", current_fsuid(), task_uid(task));
210 if (!capable(CAP_SYS_ADMIN)) {
211 if (current_fsuid() != task_uid(task)) {
212 uid = quadd_auth_is_debuggable((char *)p->package_name);
214 pr_err("Error: QuadD security service\n");
216 } else if (uid == 0) {
217 pr_err("Error: app is not debuggable\n");
221 *debug_app_uid = uid;
222 pr_info("debug_app_uid: %u\n", uid);
224 ctx.collect_kernel_ips = 0;
226 ctx.collect_kernel_ips = 1;
229 for (i = 0; i < p->nr_pids; i++)
230 ctx.param.pids[i] = p->pids[i];
232 ctx.param.nr_pids = p->nr_pids;
234 for (i = 0; i < p->nr_events; i++) {
235 int event = p->events[i];
237 if (ctx.pmu && ctx.pmu_info.nr_supported_events > 0
238 && is_event_supported(&ctx.pmu_info, event)) {
239 pmu_events_id[nr_pmu++] = p->events[i];
241 pr_info("PMU active event: %s\n",
242 quadd_get_event_str(event));
243 } else if (ctx.pl310 &&
244 ctx.pl310_info.nr_supported_events > 0 &&
245 is_event_supported(&ctx.pl310_info, event)) {
246 pl310_events_id = p->events[i];
248 pr_info("PL310 active event: %s\n",
249 quadd_get_event_str(event));
251 if (nr_pl310++ > 1) {
252 pr_err("error: multiply pl310 events\n");
256 pr_err("Bad event: %s\n",
257 quadd_get_event_str(event));
264 err = ctx.pmu->set_events(pmu_events_id, nr_pmu);
266 pr_err("PMU set parameters: error\n");
269 ctx.pmu_info.active = 1;
271 ctx.pmu_info.active = 0;
272 ctx.pmu->set_events(NULL, 0);
278 err = ctx.pl310->set_events(&pl310_events_id, 1);
280 pr_info("pl310 set_parameters: error\n");
283 ctx.pl310_info.active = 1;
285 ctx.pl310_info.active = 0;
286 ctx.pl310->set_events(NULL, 0);
290 extra = p->reserved[QUADD_PARAM_IDX_EXTRA];
292 if (extra & QUADD_PARAM_EXTRA_BT_UNWIND_TABLES)
293 pr_info("unwinding: exception-handling tables\n");
295 if (extra & QUADD_PARAM_EXTRA_BT_FP)
296 pr_info("unwinding: frame pointers\n");
298 if (extra & QUADD_PARAM_EXTRA_BT_MIXED)
299 pr_info("unwinding: mixed mode\n");
301 quadd_unwind_start(task);
303 pr_info("New parameters have been applied\n");
308 static void get_capabilities(struct quadd_comm_cap *cap)
311 unsigned int extra = 0;
312 struct quadd_events_cap *events_cap = &cap->events_cap;
314 cap->pmu = ctx.pmu ? 1 : 0;
319 cap->l2_multiple_events = 0;
320 } else if (ctx.pmu) {
321 struct source_info *s = &ctx.pmu_info;
322 for (i = 0; i < s->nr_supported_events; i++) {
323 event = s->supported_events[i];
324 if (event == QUADD_EVENT_TYPE_L2_DCACHE_READ_MISSES ||
325 event == QUADD_EVENT_TYPE_L2_DCACHE_WRITE_MISSES ||
326 event == QUADD_EVENT_TYPE_L2_ICACHE_MISSES) {
328 cap->l2_multiple_events = 1;
334 events_cap->cpu_cycles = 0;
335 events_cap->l1_dcache_read_misses = 0;
336 events_cap->l1_dcache_write_misses = 0;
337 events_cap->l1_icache_misses = 0;
339 events_cap->instructions = 0;
340 events_cap->branch_instructions = 0;
341 events_cap->branch_misses = 0;
342 events_cap->bus_cycles = 0;
344 events_cap->l2_dcache_read_misses = 0;
345 events_cap->l2_dcache_write_misses = 0;
346 events_cap->l2_icache_misses = 0;
349 struct source_info *s = &ctx.pl310_info;
350 for (i = 0; i < s->nr_supported_events; i++) {
351 int event = s->supported_events[i];
354 case QUADD_EVENT_TYPE_L2_DCACHE_READ_MISSES:
355 events_cap->l2_dcache_read_misses = 1;
357 case QUADD_EVENT_TYPE_L2_DCACHE_WRITE_MISSES:
358 events_cap->l2_dcache_write_misses = 1;
360 case QUADD_EVENT_TYPE_L2_ICACHE_MISSES:
361 events_cap->l2_icache_misses = 1;
365 pr_err_once("%s: error: invalid event\n",
373 struct source_info *s = &ctx.pmu_info;
374 for (i = 0; i < s->nr_supported_events; i++) {
375 int event = s->supported_events[i];
378 case QUADD_EVENT_TYPE_CPU_CYCLES:
379 events_cap->cpu_cycles = 1;
381 case QUADD_EVENT_TYPE_INSTRUCTIONS:
382 events_cap->instructions = 1;
384 case QUADD_EVENT_TYPE_BRANCH_INSTRUCTIONS:
385 events_cap->branch_instructions = 1;
387 case QUADD_EVENT_TYPE_BRANCH_MISSES:
388 events_cap->branch_misses = 1;
390 case QUADD_EVENT_TYPE_BUS_CYCLES:
391 events_cap->bus_cycles = 1;
394 case QUADD_EVENT_TYPE_L1_DCACHE_READ_MISSES:
395 events_cap->l1_dcache_read_misses = 1;
397 case QUADD_EVENT_TYPE_L1_DCACHE_WRITE_MISSES:
398 events_cap->l1_dcache_write_misses = 1;
400 case QUADD_EVENT_TYPE_L1_ICACHE_MISSES:
401 events_cap->l1_icache_misses = 1;
404 case QUADD_EVENT_TYPE_L2_DCACHE_READ_MISSES:
405 events_cap->l2_dcache_read_misses = 1;
407 case QUADD_EVENT_TYPE_L2_DCACHE_WRITE_MISSES:
408 events_cap->l2_dcache_write_misses = 1;
410 case QUADD_EVENT_TYPE_L2_ICACHE_MISSES:
411 events_cap->l2_icache_misses = 1;
415 pr_err_once("%s: error: invalid event\n",
422 cap->tegra_lp_cluster = quadd_is_cpu_with_lp_cluster();
424 cap->blocked_read = 1;
426 extra |= QUADD_COMM_CAP_EXTRA_BT_KERNEL_CTX;
427 extra |= QUADD_COMM_CAP_EXTRA_GET_MMAP;
428 extra |= QUADD_COMM_CAP_EXTRA_GROUP_SAMPLES;
429 extra |= QUADD_COMM_CAP_EXTRA_BT_UNWIND_TABLES;
430 extra |= QUADD_COMM_CAP_EXTRA_SUPPORT_AARCH64;
431 extra |= QUADD_COMM_CAP_EXTRA_SPECIAL_ARCH_MMAP;
432 extra |= QUADD_COMM_CAP_EXTRA_UNWIND_MIXED;
434 cap->reserved[QUADD_COMM_CAP_IDX_EXTRA] = extra;
437 void quadd_get_state(struct quadd_module_state *state)
439 unsigned int status = 0;
441 quadd_hrt_get_state(state);
443 if (ctx.comm->is_active())
444 status |= QUADD_MOD_STATE_STATUS_IS_ACTIVE;
446 if (quadd_auth_is_auth_open())
447 status |= QUADD_MOD_STATE_STATUS_IS_AUTH_OPEN;
449 state->reserved[QUADD_MOD_STATE_IDX_STATUS] = status;
453 set_extab(struct quadd_extables *extabs,
454 struct quadd_extabs_mmap *mmap)
456 return quadd_unwind_set_extab(extabs, mmap);
460 delete_mmap(struct quadd_extabs_mmap *mmap)
462 quadd_unwind_delete_mmap(mmap);
465 static struct quadd_comm_control_interface control = {
468 .set_parameters = set_parameters,
469 .get_capabilities = get_capabilities,
470 .get_state = quadd_get_state,
471 .set_extab = set_extab,
472 .delete_mmap = delete_mmap,
475 static int __init quadd_module_init(void)
477 int i, nr_events, err;
480 pr_info("Branch: %s\n", QUADD_MODULE_BRANCH);
481 pr_info("Version: %s\n", QUADD_MODULE_VERSION);
482 pr_info("Samples version: %d\n", QUADD_SAMPLES_VERSION);
483 pr_info("IO version: %d\n", QUADD_IO_VERSION);
485 #ifdef QM_DEBUG_SAMPLES_ENABLE
486 pr_info("############## DEBUG VERSION! ##############\n");
489 atomic_set(&ctx.started, 0);
490 atomic_set(&ctx.tegra_profiler_lock, 0);
492 get_default_properties();
494 ctx.pmu_info.active = 0;
495 ctx.pl310_info.active = 0;
498 ctx.pmu = quadd_armv8_pmu_init();
500 ctx.pmu = quadd_armv7_pmu_init();
503 pr_err("PMU init failed\n");
506 events = ctx.pmu_info.supported_events;
507 nr_events = ctx.pmu->get_supported_events(events,
509 ctx.pmu_info.nr_supported_events = nr_events;
511 pr_info("PMU: amount of events: %d\n", nr_events);
513 for (i = 0; i < nr_events; i++)
514 pr_info("PMU event: %s\n",
515 quadd_get_event_str(events[i]));
518 #ifdef CONFIG_CACHE_L2X0
519 ctx.pl310 = quadd_l2x0_events_init();
524 events = ctx.pl310_info.supported_events;
525 nr_events = ctx.pl310->get_supported_events(events,
527 ctx.pl310_info.nr_supported_events = nr_events;
529 pr_info("pl310 success, amount of events: %d\n",
532 for (i = 0; i < nr_events; i++)
533 pr_info("pl310 event: %s\n",
534 quadd_get_event_str(events[i]));
536 pr_info("PL310 not found\n");
539 ctx.hrt = quadd_hrt_init(&ctx);
540 if (IS_ERR(ctx.hrt)) {
541 pr_err("error: HRT init failed\n");
542 return PTR_ERR(ctx.hrt);
545 err = quadd_power_clk_init(&ctx);
547 pr_err("error: POWER CLK init failed\n");
551 ctx.comm = quadd_comm_events_init(&control);
552 if (IS_ERR(ctx.comm)) {
553 pr_err("error: COMM init failed\n");
554 return PTR_ERR(ctx.comm);
557 err = quadd_auth_init(&ctx);
559 pr_err("error: auth failed\n");
563 err = quadd_unwind_init();
565 pr_err("error: EH unwinding init failed\n");
569 get_capabilities(&ctx.cap);
570 quadd_proc_init(&ctx);
575 static void __exit quadd_module_exit(void)
577 pr_info("QuadD module exit\n");
580 quadd_power_clk_deinit();
581 quadd_comm_events_exit();
584 quadd_unwind_deinit();
587 quadd_armv8_pmu_deinit();
589 quadd_armv7_pmu_deinit();
593 module_init(quadd_module_init);
594 module_exit(quadd_module_exit);
596 MODULE_LICENSE("GPL");
598 MODULE_AUTHOR("Nvidia Ltd");
599 MODULE_DESCRIPTION("Tegra profiler");