PageRenderTime 43ms CodeModel.GetById 14ms RepoModel.GetById 1ms app.codeStats 0ms

/tools/perf/arch/x86/util/perf_regs.c

https://github.com/kvaneesh/linux
C | 302 lines | 202 code | 28 blank | 72 comment | 18 complexity | 3f1f49eacf3d0c1d0dadb0047c641dcf MD5 | raw file
  1. // SPDX-License-Identifier: GPL-2.0
  2. #include <errno.h>
  3. #include <string.h>
  4. #include <regex.h>
  5. #include <linux/kernel.h>
  6. #include <linux/zalloc.h>
  7. #include "../../../perf-sys.h"
  8. #include "../../../util/perf_regs.h"
  9. #include "../../../util/debug.h"
  10. #include "../../../util/event.h"
  11. const struct sample_reg sample_reg_masks[] = {
  12. SMPL_REG(AX, PERF_REG_X86_AX),
  13. SMPL_REG(BX, PERF_REG_X86_BX),
  14. SMPL_REG(CX, PERF_REG_X86_CX),
  15. SMPL_REG(DX, PERF_REG_X86_DX),
  16. SMPL_REG(SI, PERF_REG_X86_SI),
  17. SMPL_REG(DI, PERF_REG_X86_DI),
  18. SMPL_REG(BP, PERF_REG_X86_BP),
  19. SMPL_REG(SP, PERF_REG_X86_SP),
  20. SMPL_REG(IP, PERF_REG_X86_IP),
  21. SMPL_REG(FLAGS, PERF_REG_X86_FLAGS),
  22. SMPL_REG(CS, PERF_REG_X86_CS),
  23. SMPL_REG(SS, PERF_REG_X86_SS),
  24. #ifdef HAVE_ARCH_X86_64_SUPPORT
  25. SMPL_REG(R8, PERF_REG_X86_R8),
  26. SMPL_REG(R9, PERF_REG_X86_R9),
  27. SMPL_REG(R10, PERF_REG_X86_R10),
  28. SMPL_REG(R11, PERF_REG_X86_R11),
  29. SMPL_REG(R12, PERF_REG_X86_R12),
  30. SMPL_REG(R13, PERF_REG_X86_R13),
  31. SMPL_REG(R14, PERF_REG_X86_R14),
  32. SMPL_REG(R15, PERF_REG_X86_R15),
  33. #endif
  34. SMPL_REG2(XMM0, PERF_REG_X86_XMM0),
  35. SMPL_REG2(XMM1, PERF_REG_X86_XMM1),
  36. SMPL_REG2(XMM2, PERF_REG_X86_XMM2),
  37. SMPL_REG2(XMM3, PERF_REG_X86_XMM3),
  38. SMPL_REG2(XMM4, PERF_REG_X86_XMM4),
  39. SMPL_REG2(XMM5, PERF_REG_X86_XMM5),
  40. SMPL_REG2(XMM6, PERF_REG_X86_XMM6),
  41. SMPL_REG2(XMM7, PERF_REG_X86_XMM7),
  42. SMPL_REG2(XMM8, PERF_REG_X86_XMM8),
  43. SMPL_REG2(XMM9, PERF_REG_X86_XMM9),
  44. SMPL_REG2(XMM10, PERF_REG_X86_XMM10),
  45. SMPL_REG2(XMM11, PERF_REG_X86_XMM11),
  46. SMPL_REG2(XMM12, PERF_REG_X86_XMM12),
  47. SMPL_REG2(XMM13, PERF_REG_X86_XMM13),
  48. SMPL_REG2(XMM14, PERF_REG_X86_XMM14),
  49. SMPL_REG2(XMM15, PERF_REG_X86_XMM15),
  50. SMPL_REG_END
  51. };
  52. struct sdt_name_reg {
  53. const char *sdt_name;
  54. const char *uprobe_name;
  55. };
  56. #define SDT_NAME_REG(n, m) {.sdt_name = "%" #n, .uprobe_name = "%" #m}
  57. #define SDT_NAME_REG_END {.sdt_name = NULL, .uprobe_name = NULL}
  58. static const struct sdt_name_reg sdt_reg_tbl[] = {
  59. SDT_NAME_REG(eax, ax),
  60. SDT_NAME_REG(rax, ax),
  61. SDT_NAME_REG(al, ax),
  62. SDT_NAME_REG(ah, ax),
  63. SDT_NAME_REG(ebx, bx),
  64. SDT_NAME_REG(rbx, bx),
  65. SDT_NAME_REG(bl, bx),
  66. SDT_NAME_REG(bh, bx),
  67. SDT_NAME_REG(ecx, cx),
  68. SDT_NAME_REG(rcx, cx),
  69. SDT_NAME_REG(cl, cx),
  70. SDT_NAME_REG(ch, cx),
  71. SDT_NAME_REG(edx, dx),
  72. SDT_NAME_REG(rdx, dx),
  73. SDT_NAME_REG(dl, dx),
  74. SDT_NAME_REG(dh, dx),
  75. SDT_NAME_REG(esi, si),
  76. SDT_NAME_REG(rsi, si),
  77. SDT_NAME_REG(sil, si),
  78. SDT_NAME_REG(edi, di),
  79. SDT_NAME_REG(rdi, di),
  80. SDT_NAME_REG(dil, di),
  81. SDT_NAME_REG(ebp, bp),
  82. SDT_NAME_REG(rbp, bp),
  83. SDT_NAME_REG(bpl, bp),
  84. SDT_NAME_REG(rsp, sp),
  85. SDT_NAME_REG(esp, sp),
  86. SDT_NAME_REG(spl, sp),
  87. /* rNN registers */
  88. SDT_NAME_REG(r8b, r8),
  89. SDT_NAME_REG(r8w, r8),
  90. SDT_NAME_REG(r8d, r8),
  91. SDT_NAME_REG(r9b, r9),
  92. SDT_NAME_REG(r9w, r9),
  93. SDT_NAME_REG(r9d, r9),
  94. SDT_NAME_REG(r10b, r10),
  95. SDT_NAME_REG(r10w, r10),
  96. SDT_NAME_REG(r10d, r10),
  97. SDT_NAME_REG(r11b, r11),
  98. SDT_NAME_REG(r11w, r11),
  99. SDT_NAME_REG(r11d, r11),
  100. SDT_NAME_REG(r12b, r12),
  101. SDT_NAME_REG(r12w, r12),
  102. SDT_NAME_REG(r12d, r12),
  103. SDT_NAME_REG(r13b, r13),
  104. SDT_NAME_REG(r13w, r13),
  105. SDT_NAME_REG(r13d, r13),
  106. SDT_NAME_REG(r14b, r14),
  107. SDT_NAME_REG(r14w, r14),
  108. SDT_NAME_REG(r14d, r14),
  109. SDT_NAME_REG(r15b, r15),
  110. SDT_NAME_REG(r15w, r15),
  111. SDT_NAME_REG(r15d, r15),
  112. SDT_NAME_REG_END,
  113. };
  114. /*
  115. * Perf only supports OP which is in +/-NUM(REG) form.
  116. * Here plus-minus sign, NUM and parenthesis are optional,
  117. * only REG is mandatory.
  118. *
  119. * SDT events also supports indirect addressing mode with a
  120. * symbol as offset, scaled mode and constants in OP. But
  121. * perf does not support them yet. Below are few examples.
  122. *
  123. * OP with scaled mode:
  124. * (%rax,%rsi,8)
  125. * 10(%ras,%rsi,8)
  126. *
  127. * OP with indirect addressing mode:
  128. * check_action(%rip)
  129. * mp_+52(%rip)
  130. * 44+mp_(%rip)
  131. *
  132. * OP with constant values:
  133. * $0
  134. * $123
  135. * $-1
  136. */
  137. #define SDT_OP_REGEX "^([+\\-]?)([0-9]*)(\\(?)(%[a-z][a-z0-9]+)(\\)?)$"
  138. static regex_t sdt_op_regex;
  139. static int sdt_init_op_regex(void)
  140. {
  141. static int initialized;
  142. int ret = 0;
  143. if (initialized)
  144. return 0;
  145. ret = regcomp(&sdt_op_regex, SDT_OP_REGEX, REG_EXTENDED);
  146. if (ret < 0) {
  147. pr_debug4("Regex compilation error.\n");
  148. return ret;
  149. }
  150. initialized = 1;
  151. return 0;
  152. }
  153. /*
  154. * Max x86 register name length is 5(ex: %r15d). So, 6th char
  155. * should always contain NULL. This helps to find register name
  156. * length using strlen, instead of maintaining one more variable.
  157. */
  158. #define SDT_REG_NAME_SIZE 6
  159. /*
  160. * The uprobe parser does not support all gas register names;
  161. * so, we have to replace them (ex. for x86_64: %rax -> %ax).
  162. * Note: If register does not require renaming, just copy
  163. * paste as it is, but don't leave it empty.
  164. */
  165. static void sdt_rename_register(char *sdt_reg, int sdt_len, char *uprobe_reg)
  166. {
  167. int i = 0;
  168. for (i = 0; sdt_reg_tbl[i].sdt_name != NULL; i++) {
  169. if (!strncmp(sdt_reg_tbl[i].sdt_name, sdt_reg, sdt_len)) {
  170. strcpy(uprobe_reg, sdt_reg_tbl[i].uprobe_name);
  171. return;
  172. }
  173. }
  174. strncpy(uprobe_reg, sdt_reg, sdt_len);
  175. }
  176. int arch_sdt_arg_parse_op(char *old_op, char **new_op)
  177. {
  178. char new_reg[SDT_REG_NAME_SIZE] = {0};
  179. int new_len = 0, ret;
  180. /*
  181. * rm[0]: +/-NUM(REG)
  182. * rm[1]: +/-
  183. * rm[2]: NUM
  184. * rm[3]: (
  185. * rm[4]: REG
  186. * rm[5]: )
  187. */
  188. regmatch_t rm[6];
  189. /*
  190. * Max prefix length is 2 as it may contains sign(+/-)
  191. * and displacement 0 (Both sign and displacement 0 are
  192. * optional so it may be empty). Use one more character
  193. * to hold last NULL so that strlen can be used to find
  194. * prefix length, instead of maintaining one more variable.
  195. */
  196. char prefix[3] = {0};
  197. ret = sdt_init_op_regex();
  198. if (ret < 0)
  199. return ret;
  200. /*
  201. * If unsupported OR does not match with regex OR
  202. * register name too long, skip it.
  203. */
  204. if (strchr(old_op, ',') || strchr(old_op, '$') ||
  205. regexec(&sdt_op_regex, old_op, 6, rm, 0) ||
  206. rm[4].rm_eo - rm[4].rm_so > SDT_REG_NAME_SIZE) {
  207. pr_debug4("Skipping unsupported SDT argument: %s\n", old_op);
  208. return SDT_ARG_SKIP;
  209. }
  210. /*
  211. * Prepare prefix.
  212. * If SDT OP has parenthesis but does not provide
  213. * displacement, add 0 for displacement.
  214. * SDT Uprobe Prefix
  215. * -----------------------------
  216. * +24(%rdi) +24(%di) +
  217. * 24(%rdi) +24(%di) +
  218. * %rdi %di
  219. * (%rdi) +0(%di) +0
  220. * -80(%rbx) -80(%bx) -
  221. */
  222. if (rm[3].rm_so != rm[3].rm_eo) {
  223. if (rm[1].rm_so != rm[1].rm_eo)
  224. prefix[0] = *(old_op + rm[1].rm_so);
  225. else if (rm[2].rm_so != rm[2].rm_eo)
  226. prefix[0] = '+';
  227. else
  228. scnprintf(prefix, sizeof(prefix), "+0");
  229. }
  230. /* Rename register */
  231. sdt_rename_register(old_op + rm[4].rm_so, rm[4].rm_eo - rm[4].rm_so,
  232. new_reg);
  233. /* Prepare final OP which should be valid for uprobe_events */
  234. new_len = strlen(prefix) +
  235. (rm[2].rm_eo - rm[2].rm_so) +
  236. (rm[3].rm_eo - rm[3].rm_so) +
  237. strlen(new_reg) +
  238. (rm[5].rm_eo - rm[5].rm_so) +
  239. 1; /* NULL */
  240. *new_op = zalloc(new_len);
  241. if (!*new_op)
  242. return -ENOMEM;
  243. scnprintf(*new_op, new_len, "%.*s%.*s%.*s%.*s%.*s",
  244. strlen(prefix), prefix,
  245. (int)(rm[2].rm_eo - rm[2].rm_so), old_op + rm[2].rm_so,
  246. (int)(rm[3].rm_eo - rm[3].rm_so), old_op + rm[3].rm_so,
  247. strlen(new_reg), new_reg,
  248. (int)(rm[5].rm_eo - rm[5].rm_so), old_op + rm[5].rm_so);
  249. return SDT_ARG_VALID;
  250. }
  251. uint64_t arch__intr_reg_mask(void)
  252. {
  253. struct perf_event_attr attr = {
  254. .type = PERF_TYPE_HARDWARE,
  255. .config = PERF_COUNT_HW_CPU_CYCLES,
  256. .sample_type = PERF_SAMPLE_REGS_INTR,
  257. .sample_regs_intr = PERF_REG_EXTENDED_MASK,
  258. .precise_ip = 1,
  259. .disabled = 1,
  260. .exclude_kernel = 1,
  261. };
  262. int fd;
  263. /*
  264. * In an unnamed union, init it here to build on older gcc versions
  265. */
  266. attr.sample_period = 1;
  267. event_attr_init(&attr);
  268. fd = sys_perf_event_open(&attr, 0, -1, -1, 0);
  269. if (fd != -1) {
  270. close(fd);
  271. return (PERF_REG_EXTENDED_MASK | PERF_REGS_MASK);
  272. }
  273. return PERF_REGS_MASK;
  274. }