2 * drivers/misc/tegra-profiler/main.c
4 * Copyright (c) 2015, NVIDIA CORPORATION. All rights reserved.
6 * This program is free software; you can redistribute it and/or modify it
7 * under the terms and conditions of the GNU General Public License,
8 * version 2, as published by the Free Software Foundation.
10 * This program is distributed in the hope it will be useful, but WITHOUT
11 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
12 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
17 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
19 #include <linux/init.h>
20 #include <linux/module.h>
21 #include <linux/err.h>
22 #include <linux/sched.h>
24 #include <linux/tegra_profiler.h>
33 #include "power_clk.h"
36 #include "quadd_proc.h"
37 #include "eh_unwind.h"
40 #include "armv8_pmu.h"
42 #include "armv7_pmu.h"
45 #ifdef CONFIG_CACHE_L2X0
49 static struct quadd_ctx ctx;
51 static int get_default_properties(void)
54 ctx.param.ma_freq = 50;
55 ctx.param.backtrace = 1;
56 ctx.param.use_freq = 1;
57 ctx.param.system_wide = 1;
58 ctx.param.power_rate_freq = 0;
59 ctx.param.debug_samples = 0;
61 ctx.param.pids[0] = 0;
62 ctx.param.nr_pids = 1;
67 int tegra_profiler_try_lock(void)
69 return atomic_cmpxchg(&ctx.tegra_profiler_lock, 0, 1);
71 EXPORT_SYMBOL_GPL(tegra_profiler_try_lock);
73 void tegra_profiler_unlock(void)
75 atomic_set(&ctx.tegra_profiler_lock, 0);
77 EXPORT_SYMBOL_GPL(tegra_profiler_unlock);
79 static int start(void)
83 if (tegra_profiler_try_lock()) {
84 pr_err("Error: tegra_profiler lock\n");
88 if (!atomic_cmpxchg(&ctx.started, 0, 1)) {
92 err = ctx.pmu->enable();
94 pr_err("error: pmu enable\n");
100 err = ctx.pl310->enable();
102 pr_err("error: pl310 enable\n");
109 err = quadd_hrt_start();
111 pr_err("error: hrt start\n");
117 err = quadd_power_clk_start();
119 pr_err("error: power_clk start\n");
130 atomic_set(&ctx.started, 0);
131 tegra_profiler_unlock();
136 static void stop(void)
138 if (atomic_cmpxchg(&ctx.started, 1, 0)) {
151 ctx.pl310->disable();
153 tegra_profiler_unlock();
157 quadd_power_clk_stop();
161 static inline int is_event_supported(struct source_info *si, int event)
164 int nr = si->nr_supported_events;
165 int *events = si->supported_events;
167 for (i = 0; i < nr; i++) {
168 if (event == events[i])
175 validate_freq(unsigned int freq)
177 return freq >= 100 && freq <= 100000;
181 set_parameters(struct quadd_parameters *p, uid_t *debug_app_uid)
184 int pmu_events_id[QUADD_MAX_COUNTERS];
186 int nr_pmu = 0, nr_pl310 = 0;
187 struct task_struct *task;
190 if (!validate_freq(p->freq)) {
191 pr_err("%s: incorrect frequency: %u\n", __func__, p->freq);
197 for (i = 0; i < ARRAY_SIZE(p->reserved); i++)
198 ctx.param.reserved[i] = p->reserved[i];
200 /* Currently only one process */
204 p->package_name[sizeof(p->package_name) - 1] = '\0';
207 task = pid_task(find_vpid(p->pids[0]), PIDTYPE_PID);
210 pr_err("Process not found: %u\n", p->pids[0]);
214 pr_info("owner/task uids: %u/%u\n", current_fsuid(), task_uid(task));
215 if (!capable(CAP_SYS_ADMIN)) {
216 if (current_fsuid() != task_uid(task)) {
217 uid = quadd_auth_is_debuggable((char *)p->package_name);
219 pr_err("Error: QuadD security service\n");
221 } else if (uid == 0) {
222 pr_err("Error: app is not debuggable\n");
226 *debug_app_uid = uid;
227 pr_info("debug_app_uid: %u\n", uid);
229 ctx.collect_kernel_ips = 0;
231 ctx.collect_kernel_ips = 1;
234 for (i = 0; i < p->nr_pids; i++)
235 ctx.param.pids[i] = p->pids[i];
237 ctx.param.nr_pids = p->nr_pids;
239 for (i = 0; i < p->nr_events; i++) {
240 int event = p->events[i];
242 if (ctx.pmu && ctx.pmu_info.nr_supported_events > 0
243 && is_event_supported(&ctx.pmu_info, event)) {
244 pmu_events_id[nr_pmu++] = p->events[i];
246 pr_info("PMU active event: %s\n",
247 quadd_get_event_str(event));
248 } else if (ctx.pl310 &&
249 ctx.pl310_info.nr_supported_events > 0 &&
250 is_event_supported(&ctx.pl310_info, event)) {
251 pl310_events_id = p->events[i];
253 pr_info("PL310 active event: %s\n",
254 quadd_get_event_str(event));
256 if (nr_pl310++ > 1) {
257 pr_err("error: multiply pl310 events\n");
261 pr_err("Bad event: %s\n",
262 quadd_get_event_str(event));
269 err = ctx.pmu->set_events(pmu_events_id, nr_pmu);
271 pr_err("PMU set parameters: error\n");
274 ctx.pmu_info.active = 1;
276 ctx.pmu_info.active = 0;
277 ctx.pmu->set_events(NULL, 0);
283 err = ctx.pl310->set_events(&pl310_events_id, 1);
285 pr_info("pl310 set_parameters: error\n");
288 ctx.pl310_info.active = 1;
290 ctx.pl310_info.active = 0;
291 ctx.pl310->set_events(NULL, 0);
295 low_addr_p = (u64 *)&p->reserved[QUADD_PARAM_IDX_BT_LOWER_BOUND];
296 ctx.hrt->low_addr = (unsigned long)*low_addr_p;
297 pr_info("bt lower bound: %#lx\n", ctx.hrt->low_addr);
299 err = quadd_unwind_start(task);
303 pr_info("New parameters have been applied\n");
308 static void get_capabilities(struct quadd_comm_cap *cap)
311 unsigned int extra = 0;
312 struct quadd_events_cap *events_cap = &cap->events_cap;
314 cap->pmu = ctx.pmu ? 1 : 0;
319 cap->l2_multiple_events = 0;
320 } else if (ctx.pmu) {
321 struct source_info *s = &ctx.pmu_info;
322 for (i = 0; i < s->nr_supported_events; i++) {
323 event = s->supported_events[i];
324 if (event == QUADD_EVENT_TYPE_L2_DCACHE_READ_MISSES ||
325 event == QUADD_EVENT_TYPE_L2_DCACHE_WRITE_MISSES ||
326 event == QUADD_EVENT_TYPE_L2_ICACHE_MISSES) {
328 cap->l2_multiple_events = 1;
334 events_cap->cpu_cycles = 0;
335 events_cap->l1_dcache_read_misses = 0;
336 events_cap->l1_dcache_write_misses = 0;
337 events_cap->l1_icache_misses = 0;
339 events_cap->instructions = 0;
340 events_cap->branch_instructions = 0;
341 events_cap->branch_misses = 0;
342 events_cap->bus_cycles = 0;
344 events_cap->l2_dcache_read_misses = 0;
345 events_cap->l2_dcache_write_misses = 0;
346 events_cap->l2_icache_misses = 0;
349 struct source_info *s = &ctx.pl310_info;
350 for (i = 0; i < s->nr_supported_events; i++) {
351 int event = s->supported_events[i];
354 case QUADD_EVENT_TYPE_L2_DCACHE_READ_MISSES:
355 events_cap->l2_dcache_read_misses = 1;
357 case QUADD_EVENT_TYPE_L2_DCACHE_WRITE_MISSES:
358 events_cap->l2_dcache_write_misses = 1;
360 case QUADD_EVENT_TYPE_L2_ICACHE_MISSES:
361 events_cap->l2_icache_misses = 1;
365 pr_err_once("%s: error: invalid event\n",
373 struct source_info *s = &ctx.pmu_info;
374 for (i = 0; i < s->nr_supported_events; i++) {
375 int event = s->supported_events[i];
378 case QUADD_EVENT_TYPE_CPU_CYCLES:
379 events_cap->cpu_cycles = 1;
381 case QUADD_EVENT_TYPE_INSTRUCTIONS:
382 events_cap->instructions = 1;
384 case QUADD_EVENT_TYPE_BRANCH_INSTRUCTIONS:
385 events_cap->branch_instructions = 1;
387 case QUADD_EVENT_TYPE_BRANCH_MISSES:
388 events_cap->branch_misses = 1;
390 case QUADD_EVENT_TYPE_BUS_CYCLES:
391 events_cap->bus_cycles = 1;
394 case QUADD_EVENT_TYPE_L1_DCACHE_READ_MISSES:
395 events_cap->l1_dcache_read_misses = 1;
397 case QUADD_EVENT_TYPE_L1_DCACHE_WRITE_MISSES:
398 events_cap->l1_dcache_write_misses = 1;
400 case QUADD_EVENT_TYPE_L1_ICACHE_MISSES:
401 events_cap->l1_icache_misses = 1;
404 case QUADD_EVENT_TYPE_L2_DCACHE_READ_MISSES:
405 events_cap->l2_dcache_read_misses = 1;
407 case QUADD_EVENT_TYPE_L2_DCACHE_WRITE_MISSES:
408 events_cap->l2_dcache_write_misses = 1;
410 case QUADD_EVENT_TYPE_L2_ICACHE_MISSES:
411 events_cap->l2_icache_misses = 1;
415 pr_err_once("%s: error: invalid event\n",
422 cap->tegra_lp_cluster = quadd_is_cpu_with_lp_cluster();
424 cap->blocked_read = 1;
426 extra |= QUADD_COMM_CAP_EXTRA_BT_KERNEL_CTX;
427 extra |= QUADD_COMM_CAP_EXTRA_GET_MMAP;
428 extra |= QUADD_COMM_CAP_EXTRA_GROUP_SAMPLES;
429 extra |= QUADD_COMM_CAP_EXTRA_BT_UNWIND_TABLES;
430 extra |= QUADD_COMM_CAP_EXTRA_SUPPORT_AARCH64;
431 extra |= QUADD_COMM_CAP_EXTRA_SPECIAL_ARCH_MMAP;
432 extra |= QUADD_COMM_CAP_EXTRA_UNWIND_MIXED;
433 extra |= QUADD_COMM_CAP_EXTRA_UNW_ENTRY_TYPE;
434 extra |= QUADD_COMM_CAP_EXTRA_RB_MMAP_OP;
437 extra |= QUADD_COMM_CAP_EXTRA_ARCH_TIMER;
439 cap->reserved[QUADD_COMM_CAP_IDX_EXTRA] = extra;
442 void quadd_get_state(struct quadd_module_state *state)
444 unsigned int status = 0;
446 quadd_hrt_get_state(state);
448 if (ctx.comm->is_active())
449 status |= QUADD_MOD_STATE_STATUS_IS_ACTIVE;
451 if (quadd_auth_is_auth_open())
452 status |= QUADD_MOD_STATE_STATUS_IS_AUTH_OPEN;
454 state->reserved[QUADD_MOD_STATE_IDX_STATUS] = status;
458 set_extab(struct quadd_sections *extabs,
459 struct quadd_mmap_area *mmap)
461 return quadd_unwind_set_extab(extabs, mmap);
465 delete_mmap(struct quadd_mmap_area *mmap)
467 quadd_unwind_delete_mmap(mmap);
470 static struct quadd_comm_control_interface control = {
473 .set_parameters = set_parameters,
474 .get_capabilities = get_capabilities,
475 .get_state = quadd_get_state,
476 .set_extab = set_extab,
477 .delete_mmap = delete_mmap,
480 static int __init quadd_module_init(void)
482 int i, nr_events, err;
485 pr_info("Branch: %s\n", QUADD_MODULE_BRANCH);
486 pr_info("Version: %s\n", QUADD_MODULE_VERSION);
487 pr_info("Samples version: %d\n", QUADD_SAMPLES_VERSION);
488 pr_info("IO version: %d\n", QUADD_IO_VERSION);
490 #ifdef QM_DEBUG_SAMPLES_ENABLE
491 pr_info("############## DEBUG VERSION! ##############\n");
494 atomic_set(&ctx.started, 0);
495 atomic_set(&ctx.tegra_profiler_lock, 0);
497 get_default_properties();
499 ctx.pmu_info.active = 0;
500 ctx.pl310_info.active = 0;
503 ctx.pmu = quadd_armv8_pmu_init();
505 ctx.pmu = quadd_armv7_pmu_init();
508 pr_err("PMU init failed\n");
511 events = ctx.pmu_info.supported_events;
512 nr_events = ctx.pmu->get_supported_events(events,
514 ctx.pmu_info.nr_supported_events = nr_events;
516 pr_debug("PMU: amount of events: %d\n", nr_events);
518 for (i = 0; i < nr_events; i++)
519 pr_debug("PMU event: %s\n",
520 quadd_get_event_str(events[i]));
523 #ifdef CONFIG_CACHE_L2X0
524 ctx.pl310 = quadd_l2x0_events_init();
529 events = ctx.pl310_info.supported_events;
530 nr_events = ctx.pl310->get_supported_events(events,
532 ctx.pl310_info.nr_supported_events = nr_events;
534 pr_info("pl310 success, amount of events: %d\n",
537 for (i = 0; i < nr_events; i++)
538 pr_info("pl310 event: %s\n",
539 quadd_get_event_str(events[i]));
541 pr_debug("PL310 not found\n");
544 ctx.hrt = quadd_hrt_init(&ctx);
545 if (IS_ERR(ctx.hrt)) {
546 pr_err("error: HRT init failed\n");
547 return PTR_ERR(ctx.hrt);
550 err = quadd_power_clk_init(&ctx);
552 pr_err("error: POWER CLK init failed\n");
556 ctx.comm = quadd_comm_events_init(&control);
557 if (IS_ERR(ctx.comm)) {
558 pr_err("error: COMM init failed\n");
559 return PTR_ERR(ctx.comm);
562 err = quadd_auth_init(&ctx);
564 pr_err("error: auth failed\n");
568 err = quadd_unwind_init();
570 pr_err("error: EH unwinding init failed\n");
574 get_capabilities(&ctx.cap);
575 quadd_proc_init(&ctx);
580 static void __exit quadd_module_exit(void)
582 pr_info("QuadD module exit\n");
585 quadd_power_clk_deinit();
586 quadd_comm_events_exit();
589 quadd_unwind_deinit();
592 quadd_armv8_pmu_deinit();
594 quadd_armv7_pmu_deinit();
598 module_init(quadd_module_init);
599 module_exit(quadd_module_exit);
601 MODULE_LICENSE("GPL");
603 MODULE_AUTHOR("Nvidia Ltd");
604 MODULE_DESCRIPTION("Tegra profiler");