2 * drivers/misc/tegra-profiler/main.c
4 * Copyright (c) 2014, NVIDIA CORPORATION. All rights reserved.
6 * This program is free software; you can redistribute it and/or modify it
7 * under the terms and conditions of the GNU General Public License,
8 * version 2, as published by the Free Software Foundation.
10 * This program is distributed in the hope it will be useful, but WITHOUT
11 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
12 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
17 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
19 #include <linux/init.h>
20 #include <linux/module.h>
21 #include <linux/err.h>
22 #include <linux/sched.h>
24 #include <linux/tegra_profiler.h>
33 #include "power_clk.h"
36 #include "quadd_proc.h"
37 #include "eh_unwind.h"
40 #include "armv8_pmu.h"
42 #include "armv7_pmu.h"
45 #ifdef CONFIG_CACHE_L2X0
49 static struct quadd_ctx ctx;
51 static int get_default_properties(void)
54 ctx.param.ma_freq = 50;
55 ctx.param.backtrace = 1;
56 ctx.param.use_freq = 1;
57 ctx.param.system_wide = 1;
58 ctx.param.power_rate_freq = 0;
59 ctx.param.debug_samples = 0;
61 ctx.param.pids[0] = 0;
62 ctx.param.nr_pids = 1;
67 int tegra_profiler_try_lock(void)
69 return atomic_cmpxchg(&ctx.tegra_profiler_lock, 0, 1);
71 EXPORT_SYMBOL_GPL(tegra_profiler_try_lock);
73 void tegra_profiler_unlock(void)
75 atomic_set(&ctx.tegra_profiler_lock, 0);
77 EXPORT_SYMBOL_GPL(tegra_profiler_unlock);
79 static int start(void)
83 if (tegra_profiler_try_lock()) {
84 pr_err("Error: tegra_profiler lock\n");
88 if (!atomic_cmpxchg(&ctx.started, 0, 1)) {
90 err = ctx.pmu->enable();
92 pr_err("error: pmu enable\n");
98 err = ctx.pl310->enable();
100 pr_err("error: pl310 enable\n");
107 err = quadd_power_clk_start();
109 pr_err("error: power_clk start\n");
113 err = quadd_hrt_start();
115 pr_err("error: hrt start\n");
123 atomic_set(&ctx.started, 0);
124 tegra_profiler_unlock();
128 static void stop(void)
130 if (atomic_cmpxchg(&ctx.started, 1, 0)) {
135 quadd_power_clk_stop();
142 ctx.pl310->disable();
144 tegra_profiler_unlock();
148 static inline int is_event_supported(struct source_info *si, int event)
151 int nr = si->nr_supported_events;
152 int *events = si->supported_events;
154 for (i = 0; i < nr; i++) {
155 if (event == events[i])
161 static int set_parameters(struct quadd_parameters *p, uid_t *debug_app_uid)
164 int pmu_events_id[QUADD_MAX_COUNTERS];
166 int nr_pmu = 0, nr_pl310 = 0;
168 struct task_struct *task;
171 if (ctx.param.freq != 100 && ctx.param.freq != 1000 &&
172 ctx.param.freq != 10000)
175 ctx.param.freq = p->freq;
176 ctx.param.ma_freq = p->ma_freq;
177 ctx.param.backtrace = p->backtrace;
178 ctx.param.use_freq = p->use_freq;
179 ctx.param.system_wide = p->system_wide;
180 ctx.param.power_rate_freq = p->power_rate_freq;
181 ctx.param.debug_samples = p->debug_samples;
183 for (i = 0; i < ARRAY_SIZE(p->reserved); i++)
184 ctx.param.reserved[i] = p->reserved[i];
186 /* Currently only one process */
191 task = pid_task(find_vpid(p->pids[0]), PIDTYPE_PID);
194 pr_err("Process not found: %u\n", p->pids[0]);
198 pr_info("owner/task uids: %u/%u\n", current_fsuid(), task_uid(task));
199 if (!capable(CAP_SYS_ADMIN)) {
200 if (current_fsuid() != task_uid(task)) {
201 uid = quadd_auth_is_debuggable((char *)p->package_name);
203 pr_err("Error: QuadD security service\n");
205 } else if (uid == 0) {
206 pr_err("Error: app is not debuggable\n");
210 *debug_app_uid = uid;
211 pr_info("debug_app_uid: %u\n", uid);
213 ctx.collect_kernel_ips = 0;
215 ctx.collect_kernel_ips = 1;
218 for (i = 0; i < p->nr_pids; i++)
219 ctx.param.pids[i] = p->pids[i];
221 ctx.param.nr_pids = p->nr_pids;
223 for (i = 0; i < p->nr_events; i++) {
224 int event = p->events[i];
226 if (ctx.pmu && ctx.pmu_info.nr_supported_events > 0
227 && is_event_supported(&ctx.pmu_info, event)) {
228 pmu_events_id[nr_pmu++] = p->events[i];
230 pr_info("PMU active event: %s\n",
231 quadd_get_event_str(event));
232 } else if (ctx.pl310 &&
233 ctx.pl310_info.nr_supported_events > 0 &&
234 is_event_supported(&ctx.pl310_info, event)) {
235 pl310_events_id = p->events[i];
237 pr_info("PL310 active event: %s\n",
238 quadd_get_event_str(event));
240 if (nr_pl310++ > 1) {
241 pr_err("error: multiply pl310 events\n");
245 pr_err("Bad event: %s\n",
246 quadd_get_event_str(event));
253 err = ctx.pmu->set_events(pmu_events_id, nr_pmu);
255 pr_err("PMU set parameters: error\n");
258 ctx.pmu_info.active = 1;
260 ctx.pmu_info.active = 0;
261 ctx.pmu->set_events(NULL, 0);
267 err = ctx.pl310->set_events(&pl310_events_id, 1);
269 pr_info("pl310 set_parameters: error\n");
272 ctx.pl310_info.active = 1;
274 ctx.pl310_info.active = 0;
275 ctx.pl310->set_events(NULL, 0);
279 extra = p->reserved[QUADD_PARAM_IDX_EXTRA];
281 if (extra & QUADD_PARAM_EXTRA_BT_UNWIND_TABLES)
282 pr_info("unwinding: exception-handling tables\n");
284 if (extra & QUADD_PARAM_EXTRA_BT_FP)
285 pr_info("unwinding: frame pointers\n");
287 quadd_unwind_start(task);
289 pr_info("New parameters have been applied\n");
294 static void get_capabilities(struct quadd_comm_cap *cap)
297 unsigned int extra = 0;
298 struct quadd_events_cap *events_cap = &cap->events_cap;
300 cap->pmu = ctx.pmu ? 1 : 0;
305 cap->l2_multiple_events = 0;
306 } else if (ctx.pmu) {
307 struct source_info *s = &ctx.pmu_info;
308 for (i = 0; i < s->nr_supported_events; i++) {
309 event = s->supported_events[i];
310 if (event == QUADD_EVENT_TYPE_L2_DCACHE_READ_MISSES ||
311 event == QUADD_EVENT_TYPE_L2_DCACHE_WRITE_MISSES ||
312 event == QUADD_EVENT_TYPE_L2_ICACHE_MISSES) {
314 cap->l2_multiple_events = 1;
320 events_cap->cpu_cycles = 0;
321 events_cap->l1_dcache_read_misses = 0;
322 events_cap->l1_dcache_write_misses = 0;
323 events_cap->l1_icache_misses = 0;
325 events_cap->instructions = 0;
326 events_cap->branch_instructions = 0;
327 events_cap->branch_misses = 0;
328 events_cap->bus_cycles = 0;
330 events_cap->l2_dcache_read_misses = 0;
331 events_cap->l2_dcache_write_misses = 0;
332 events_cap->l2_icache_misses = 0;
335 struct source_info *s = &ctx.pl310_info;
336 for (i = 0; i < s->nr_supported_events; i++) {
337 int event = s->supported_events[i];
340 case QUADD_EVENT_TYPE_L2_DCACHE_READ_MISSES:
341 events_cap->l2_dcache_read_misses = 1;
343 case QUADD_EVENT_TYPE_L2_DCACHE_WRITE_MISSES:
344 events_cap->l2_dcache_write_misses = 1;
346 case QUADD_EVENT_TYPE_L2_ICACHE_MISSES:
347 events_cap->l2_icache_misses = 1;
351 pr_err_once("%s: error: invalid event\n",
359 struct source_info *s = &ctx.pmu_info;
360 for (i = 0; i < s->nr_supported_events; i++) {
361 int event = s->supported_events[i];
364 case QUADD_EVENT_TYPE_CPU_CYCLES:
365 events_cap->cpu_cycles = 1;
367 case QUADD_EVENT_TYPE_INSTRUCTIONS:
368 events_cap->instructions = 1;
370 case QUADD_EVENT_TYPE_BRANCH_INSTRUCTIONS:
371 events_cap->branch_instructions = 1;
373 case QUADD_EVENT_TYPE_BRANCH_MISSES:
374 events_cap->branch_misses = 1;
376 case QUADD_EVENT_TYPE_BUS_CYCLES:
377 events_cap->bus_cycles = 1;
380 case QUADD_EVENT_TYPE_L1_DCACHE_READ_MISSES:
381 events_cap->l1_dcache_read_misses = 1;
383 case QUADD_EVENT_TYPE_L1_DCACHE_WRITE_MISSES:
384 events_cap->l1_dcache_write_misses = 1;
386 case QUADD_EVENT_TYPE_L1_ICACHE_MISSES:
387 events_cap->l1_icache_misses = 1;
390 case QUADD_EVENT_TYPE_L2_DCACHE_READ_MISSES:
391 events_cap->l2_dcache_read_misses = 1;
393 case QUADD_EVENT_TYPE_L2_DCACHE_WRITE_MISSES:
394 events_cap->l2_dcache_write_misses = 1;
396 case QUADD_EVENT_TYPE_L2_ICACHE_MISSES:
397 events_cap->l2_icache_misses = 1;
401 pr_err_once("%s: error: invalid event\n",
408 cap->tegra_lp_cluster = quadd_is_cpu_with_lp_cluster();
410 cap->blocked_read = 1;
412 extra |= QUADD_COMM_CAP_EXTRA_BT_KERNEL_CTX;
413 extra |= QUADD_COMM_CAP_EXTRA_GET_MMAP;
414 extra |= QUADD_COMM_CAP_EXTRA_GROUP_SAMPLES;
415 extra |= QUADD_COMM_CAP_EXTRA_BT_UNWIND_TABLES;
416 extra |= QUADD_COMM_CAP_EXTRA_SUPPORT_AARCH64;
417 extra |= QUADD_COMM_CAP_EXTRA_SPECIAL_ARCH_MMAP;
418 extra |= QUADD_COMM_CAP_EXTRA_UNWIND_MIXED;
420 cap->reserved[QUADD_COMM_CAP_IDX_EXTRA] = extra;
423 void quadd_get_state(struct quadd_module_state *state)
425 unsigned int status = 0;
427 quadd_hrt_get_state(state);
429 if (ctx.comm->is_active())
430 status |= QUADD_MOD_STATE_STATUS_IS_ACTIVE;
432 if (quadd_auth_is_auth_open())
433 status |= QUADD_MOD_STATE_STATUS_IS_AUTH_OPEN;
435 state->reserved[QUADD_MOD_STATE_IDX_STATUS] = status;
439 set_extab(struct quadd_extables *extabs,
440 struct quadd_extabs_mmap *mmap)
442 return quadd_unwind_set_extab(extabs, mmap);
446 delete_mmap(struct quadd_extabs_mmap *mmap)
448 quadd_unwind_delete_mmap(mmap);
451 static struct quadd_comm_control_interface control = {
454 .set_parameters = set_parameters,
455 .get_capabilities = get_capabilities,
456 .get_state = quadd_get_state,
457 .set_extab = set_extab,
458 .delete_mmap = delete_mmap,
461 static int __init quadd_module_init(void)
463 int i, nr_events, err;
466 pr_info("Branch: %s\n", QUADD_MODULE_BRANCH);
467 pr_info("Version: %s\n", QUADD_MODULE_VERSION);
468 pr_info("Samples version: %d\n", QUADD_SAMPLES_VERSION);
469 pr_info("IO version: %d\n", QUADD_IO_VERSION);
471 #ifdef QM_DEBUG_SAMPLES_ENABLE
472 pr_info("############## DEBUG VERSION! ##############\n");
475 atomic_set(&ctx.started, 0);
476 atomic_set(&ctx.tegra_profiler_lock, 0);
478 get_default_properties();
480 ctx.pmu_info.active = 0;
481 ctx.pl310_info.active = 0;
484 ctx.pmu = quadd_armv8_pmu_init();
486 ctx.pmu = quadd_armv7_pmu_init();
489 pr_err("PMU init failed\n");
492 events = ctx.pmu_info.supported_events;
493 nr_events = ctx.pmu->get_supported_events(events,
495 ctx.pmu_info.nr_supported_events = nr_events;
497 pr_info("PMU: amount of events: %d\n", nr_events);
499 for (i = 0; i < nr_events; i++)
500 pr_info("PMU event: %s\n",
501 quadd_get_event_str(events[i]));
504 #ifdef CONFIG_CACHE_L2X0
505 ctx.pl310 = quadd_l2x0_events_init();
510 events = ctx.pl310_info.supported_events;
511 nr_events = ctx.pl310->get_supported_events(events,
513 ctx.pl310_info.nr_supported_events = nr_events;
515 pr_info("pl310 success, amount of events: %d\n",
518 for (i = 0; i < nr_events; i++)
519 pr_info("pl310 event: %s\n",
520 quadd_get_event_str(events[i]));
522 pr_info("PL310 not found\n");
525 ctx.hrt = quadd_hrt_init(&ctx);
526 if (IS_ERR(ctx.hrt)) {
527 pr_err("error: HRT init failed\n");
528 return PTR_ERR(ctx.hrt);
531 err = quadd_power_clk_init(&ctx);
533 pr_err("error: POWER CLK init failed\n");
537 ctx.comm = quadd_comm_events_init(&control);
538 if (IS_ERR(ctx.comm)) {
539 pr_err("error: COMM init failed\n");
540 return PTR_ERR(ctx.comm);
543 err = quadd_auth_init(&ctx);
545 pr_err("error: auth failed\n");
549 err = quadd_unwind_init();
551 pr_err("error: EH unwinding init failed\n");
555 get_capabilities(&ctx.cap);
556 quadd_proc_init(&ctx);
561 static void __exit quadd_module_exit(void)
563 pr_info("QuadD module exit\n");
566 quadd_power_clk_deinit();
567 quadd_comm_events_exit();
570 quadd_unwind_deinit();
573 quadd_armv8_pmu_deinit();
575 quadd_armv7_pmu_deinit();
579 module_init(quadd_module_init);
580 module_exit(quadd_module_exit);
582 MODULE_LICENSE("GPL");
584 MODULE_AUTHOR("Nvidia Ltd");
585 MODULE_DESCRIPTION("Tegra profiler");