nvidia_cspmu.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421
  1. // SPDX-License-Identifier: GPL-2.0
  2. /*
  3. * Copyright (c) 2022-2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
  4. *
  5. */
  6. /* Support for NVIDIA specific attributes. */
  7. #include <linux/module.h>
  8. #include <linux/topology.h>
  9. #include "arm_cspmu.h"
  10. #define NV_PCIE_PORT_COUNT 10ULL
  11. #define NV_PCIE_FILTER_ID_MASK GENMASK_ULL(NV_PCIE_PORT_COUNT - 1, 0)
  12. #define NV_NVL_C2C_PORT_COUNT 2ULL
  13. #define NV_NVL_C2C_FILTER_ID_MASK GENMASK_ULL(NV_NVL_C2C_PORT_COUNT - 1, 0)
  14. #define NV_CNVL_PORT_COUNT 4ULL
  15. #define NV_CNVL_FILTER_ID_MASK GENMASK_ULL(NV_CNVL_PORT_COUNT - 1, 0)
  16. #define NV_GENERIC_FILTER_ID_MASK GENMASK_ULL(31, 0)
  17. #define NV_PRODID_MASK GENMASK(31, 0)
  18. #define NV_FORMAT_NAME_GENERIC 0
  19. #define to_nv_cspmu_ctx(cspmu) ((struct nv_cspmu_ctx *)(cspmu->impl.ctx))
  20. #define NV_CSPMU_EVENT_ATTR_4_INNER(_pref, _num, _suff, _config) \
  21. ARM_CSPMU_EVENT_ATTR(_pref##_num##_suff, _config)
  22. #define NV_CSPMU_EVENT_ATTR_4(_pref, _suff, _config) \
  23. NV_CSPMU_EVENT_ATTR_4_INNER(_pref, _0_, _suff, _config), \
  24. NV_CSPMU_EVENT_ATTR_4_INNER(_pref, _1_, _suff, _config + 1), \
  25. NV_CSPMU_EVENT_ATTR_4_INNER(_pref, _2_, _suff, _config + 2), \
  26. NV_CSPMU_EVENT_ATTR_4_INNER(_pref, _3_, _suff, _config + 3)
  27. struct nv_cspmu_ctx {
  28. const char *name;
  29. u32 filter_mask;
  30. u32 filter_default_val;
  31. struct attribute **event_attr;
  32. struct attribute **format_attr;
  33. };
  34. static struct attribute *scf_pmu_event_attrs[] = {
  35. ARM_CSPMU_EVENT_ATTR(bus_cycles, 0x1d),
  36. ARM_CSPMU_EVENT_ATTR(scf_cache_allocate, 0xF0),
  37. ARM_CSPMU_EVENT_ATTR(scf_cache_refill, 0xF1),
  38. ARM_CSPMU_EVENT_ATTR(scf_cache, 0xF2),
  39. ARM_CSPMU_EVENT_ATTR(scf_cache_wb, 0xF3),
  40. NV_CSPMU_EVENT_ATTR_4(socket, rd_data, 0x101),
  41. NV_CSPMU_EVENT_ATTR_4(socket, dl_rsp, 0x105),
  42. NV_CSPMU_EVENT_ATTR_4(socket, wb_data, 0x109),
  43. NV_CSPMU_EVENT_ATTR_4(socket, ev_rsp, 0x10d),
  44. NV_CSPMU_EVENT_ATTR_4(socket, prb_data, 0x111),
  45. NV_CSPMU_EVENT_ATTR_4(socket, rd_outstanding, 0x115),
  46. NV_CSPMU_EVENT_ATTR_4(socket, dl_outstanding, 0x119),
  47. NV_CSPMU_EVENT_ATTR_4(socket, wb_outstanding, 0x11d),
  48. NV_CSPMU_EVENT_ATTR_4(socket, wr_outstanding, 0x121),
  49. NV_CSPMU_EVENT_ATTR_4(socket, ev_outstanding, 0x125),
  50. NV_CSPMU_EVENT_ATTR_4(socket, prb_outstanding, 0x129),
  51. NV_CSPMU_EVENT_ATTR_4(socket, rd_access, 0x12d),
  52. NV_CSPMU_EVENT_ATTR_4(socket, dl_access, 0x131),
  53. NV_CSPMU_EVENT_ATTR_4(socket, wb_access, 0x135),
  54. NV_CSPMU_EVENT_ATTR_4(socket, wr_access, 0x139),
  55. NV_CSPMU_EVENT_ATTR_4(socket, ev_access, 0x13d),
  56. NV_CSPMU_EVENT_ATTR_4(socket, prb_access, 0x141),
  57. NV_CSPMU_EVENT_ATTR_4(ocu, gmem_rd_data, 0x145),
  58. NV_CSPMU_EVENT_ATTR_4(ocu, gmem_rd_access, 0x149),
  59. NV_CSPMU_EVENT_ATTR_4(ocu, gmem_wb_access, 0x14d),
  60. NV_CSPMU_EVENT_ATTR_4(ocu, gmem_rd_outstanding, 0x151),
  61. NV_CSPMU_EVENT_ATTR_4(ocu, gmem_wr_outstanding, 0x155),
  62. NV_CSPMU_EVENT_ATTR_4(ocu, rem_rd_data, 0x159),
  63. NV_CSPMU_EVENT_ATTR_4(ocu, rem_rd_access, 0x15d),
  64. NV_CSPMU_EVENT_ATTR_4(ocu, rem_wb_access, 0x161),
  65. NV_CSPMU_EVENT_ATTR_4(ocu, rem_rd_outstanding, 0x165),
  66. NV_CSPMU_EVENT_ATTR_4(ocu, rem_wr_outstanding, 0x169),
  67. ARM_CSPMU_EVENT_ATTR(gmem_rd_data, 0x16d),
  68. ARM_CSPMU_EVENT_ATTR(gmem_rd_access, 0x16e),
  69. ARM_CSPMU_EVENT_ATTR(gmem_rd_outstanding, 0x16f),
  70. ARM_CSPMU_EVENT_ATTR(gmem_dl_rsp, 0x170),
  71. ARM_CSPMU_EVENT_ATTR(gmem_dl_access, 0x171),
  72. ARM_CSPMU_EVENT_ATTR(gmem_dl_outstanding, 0x172),
  73. ARM_CSPMU_EVENT_ATTR(gmem_wb_data, 0x173),
  74. ARM_CSPMU_EVENT_ATTR(gmem_wb_access, 0x174),
  75. ARM_CSPMU_EVENT_ATTR(gmem_wb_outstanding, 0x175),
  76. ARM_CSPMU_EVENT_ATTR(gmem_ev_rsp, 0x176),
  77. ARM_CSPMU_EVENT_ATTR(gmem_ev_access, 0x177),
  78. ARM_CSPMU_EVENT_ATTR(gmem_ev_outstanding, 0x178),
  79. ARM_CSPMU_EVENT_ATTR(gmem_wr_data, 0x179),
  80. ARM_CSPMU_EVENT_ATTR(gmem_wr_outstanding, 0x17a),
  81. ARM_CSPMU_EVENT_ATTR(gmem_wr_access, 0x17b),
  82. NV_CSPMU_EVENT_ATTR_4(socket, wr_data, 0x17c),
  83. NV_CSPMU_EVENT_ATTR_4(ocu, gmem_wr_data, 0x180),
  84. NV_CSPMU_EVENT_ATTR_4(ocu, gmem_wb_data, 0x184),
  85. NV_CSPMU_EVENT_ATTR_4(ocu, gmem_wr_access, 0x188),
  86. NV_CSPMU_EVENT_ATTR_4(ocu, gmem_wb_outstanding, 0x18c),
  87. NV_CSPMU_EVENT_ATTR_4(ocu, rem_wr_data, 0x190),
  88. NV_CSPMU_EVENT_ATTR_4(ocu, rem_wb_data, 0x194),
  89. NV_CSPMU_EVENT_ATTR_4(ocu, rem_wr_access, 0x198),
  90. NV_CSPMU_EVENT_ATTR_4(ocu, rem_wb_outstanding, 0x19c),
  91. ARM_CSPMU_EVENT_ATTR(gmem_wr_total_bytes, 0x1a0),
  92. ARM_CSPMU_EVENT_ATTR(remote_socket_wr_total_bytes, 0x1a1),
  93. ARM_CSPMU_EVENT_ATTR(remote_socket_rd_data, 0x1a2),
  94. ARM_CSPMU_EVENT_ATTR(remote_socket_rd_outstanding, 0x1a3),
  95. ARM_CSPMU_EVENT_ATTR(remote_socket_rd_access, 0x1a4),
  96. ARM_CSPMU_EVENT_ATTR(cmem_rd_data, 0x1a5),
  97. ARM_CSPMU_EVENT_ATTR(cmem_rd_access, 0x1a6),
  98. ARM_CSPMU_EVENT_ATTR(cmem_rd_outstanding, 0x1a7),
  99. ARM_CSPMU_EVENT_ATTR(cmem_dl_rsp, 0x1a8),
  100. ARM_CSPMU_EVENT_ATTR(cmem_dl_access, 0x1a9),
  101. ARM_CSPMU_EVENT_ATTR(cmem_dl_outstanding, 0x1aa),
  102. ARM_CSPMU_EVENT_ATTR(cmem_wb_data, 0x1ab),
  103. ARM_CSPMU_EVENT_ATTR(cmem_wb_access, 0x1ac),
  104. ARM_CSPMU_EVENT_ATTR(cmem_wb_outstanding, 0x1ad),
  105. ARM_CSPMU_EVENT_ATTR(cmem_ev_rsp, 0x1ae),
  106. ARM_CSPMU_EVENT_ATTR(cmem_ev_access, 0x1af),
  107. ARM_CSPMU_EVENT_ATTR(cmem_ev_outstanding, 0x1b0),
  108. ARM_CSPMU_EVENT_ATTR(cmem_wr_data, 0x1b1),
  109. ARM_CSPMU_EVENT_ATTR(cmem_wr_outstanding, 0x1b2),
  110. NV_CSPMU_EVENT_ATTR_4(ocu, cmem_rd_data, 0x1b3),
  111. NV_CSPMU_EVENT_ATTR_4(ocu, cmem_rd_access, 0x1b7),
  112. NV_CSPMU_EVENT_ATTR_4(ocu, cmem_wb_access, 0x1bb),
  113. NV_CSPMU_EVENT_ATTR_4(ocu, cmem_rd_outstanding, 0x1bf),
  114. NV_CSPMU_EVENT_ATTR_4(ocu, cmem_wr_outstanding, 0x1c3),
  115. ARM_CSPMU_EVENT_ATTR(ocu_prb_access, 0x1c7),
  116. ARM_CSPMU_EVENT_ATTR(ocu_prb_data, 0x1c8),
  117. ARM_CSPMU_EVENT_ATTR(ocu_prb_outstanding, 0x1c9),
  118. ARM_CSPMU_EVENT_ATTR(cmem_wr_access, 0x1ca),
  119. NV_CSPMU_EVENT_ATTR_4(ocu, cmem_wr_access, 0x1cb),
  120. NV_CSPMU_EVENT_ATTR_4(ocu, cmem_wb_data, 0x1cf),
  121. NV_CSPMU_EVENT_ATTR_4(ocu, cmem_wr_data, 0x1d3),
  122. NV_CSPMU_EVENT_ATTR_4(ocu, cmem_wb_outstanding, 0x1d7),
  123. ARM_CSPMU_EVENT_ATTR(cmem_wr_total_bytes, 0x1db),
  124. ARM_CSPMU_EVENT_ATTR(cycles, ARM_CSPMU_EVT_CYCLES_DEFAULT),
  125. NULL,
  126. };
  127. static struct attribute *mcf_pmu_event_attrs[] = {
  128. ARM_CSPMU_EVENT_ATTR(rd_bytes_loc, 0x0),
  129. ARM_CSPMU_EVENT_ATTR(rd_bytes_rem, 0x1),
  130. ARM_CSPMU_EVENT_ATTR(wr_bytes_loc, 0x2),
  131. ARM_CSPMU_EVENT_ATTR(wr_bytes_rem, 0x3),
  132. ARM_CSPMU_EVENT_ATTR(total_bytes_loc, 0x4),
  133. ARM_CSPMU_EVENT_ATTR(total_bytes_rem, 0x5),
  134. ARM_CSPMU_EVENT_ATTR(rd_req_loc, 0x6),
  135. ARM_CSPMU_EVENT_ATTR(rd_req_rem, 0x7),
  136. ARM_CSPMU_EVENT_ATTR(wr_req_loc, 0x8),
  137. ARM_CSPMU_EVENT_ATTR(wr_req_rem, 0x9),
  138. ARM_CSPMU_EVENT_ATTR(total_req_loc, 0xa),
  139. ARM_CSPMU_EVENT_ATTR(total_req_rem, 0xb),
  140. ARM_CSPMU_EVENT_ATTR(rd_cum_outs_loc, 0xc),
  141. ARM_CSPMU_EVENT_ATTR(rd_cum_outs_rem, 0xd),
  142. ARM_CSPMU_EVENT_ATTR(cycles, ARM_CSPMU_EVT_CYCLES_DEFAULT),
  143. NULL,
  144. };
  145. static struct attribute *generic_pmu_event_attrs[] = {
  146. ARM_CSPMU_EVENT_ATTR(cycles, ARM_CSPMU_EVT_CYCLES_DEFAULT),
  147. NULL,
  148. };
  149. static struct attribute *scf_pmu_format_attrs[] = {
  150. ARM_CSPMU_FORMAT_EVENT_ATTR,
  151. NULL,
  152. };
  153. static struct attribute *pcie_pmu_format_attrs[] = {
  154. ARM_CSPMU_FORMAT_EVENT_ATTR,
  155. ARM_CSPMU_FORMAT_ATTR(root_port, "config1:0-9"),
  156. NULL,
  157. };
  158. static struct attribute *nvlink_c2c_pmu_format_attrs[] = {
  159. ARM_CSPMU_FORMAT_EVENT_ATTR,
  160. NULL,
  161. };
  162. static struct attribute *cnvlink_pmu_format_attrs[] = {
  163. ARM_CSPMU_FORMAT_EVENT_ATTR,
  164. ARM_CSPMU_FORMAT_ATTR(rem_socket, "config1:0-3"),
  165. NULL,
  166. };
  167. static struct attribute *generic_pmu_format_attrs[] = {
  168. ARM_CSPMU_FORMAT_EVENT_ATTR,
  169. ARM_CSPMU_FORMAT_FILTER_ATTR,
  170. NULL,
  171. };
  172. static struct attribute **
  173. nv_cspmu_get_event_attrs(const struct arm_cspmu *cspmu)
  174. {
  175. const struct nv_cspmu_ctx *ctx = to_nv_cspmu_ctx(cspmu);
  176. return ctx->event_attr;
  177. }
  178. static struct attribute **
  179. nv_cspmu_get_format_attrs(const struct arm_cspmu *cspmu)
  180. {
  181. const struct nv_cspmu_ctx *ctx = to_nv_cspmu_ctx(cspmu);
  182. return ctx->format_attr;
  183. }
  184. static const char *
  185. nv_cspmu_get_name(const struct arm_cspmu *cspmu)
  186. {
  187. const struct nv_cspmu_ctx *ctx = to_nv_cspmu_ctx(cspmu);
  188. return ctx->name;
  189. }
  190. static u32 nv_cspmu_event_filter(const struct perf_event *event)
  191. {
  192. const struct nv_cspmu_ctx *ctx =
  193. to_nv_cspmu_ctx(to_arm_cspmu(event->pmu));
  194. if (ctx->filter_mask == 0)
  195. return ctx->filter_default_val;
  196. return event->attr.config1 & ctx->filter_mask;
  197. }
  198. enum nv_cspmu_name_fmt {
  199. NAME_FMT_GENERIC,
  200. NAME_FMT_SOCKET
  201. };
  202. struct nv_cspmu_match {
  203. u32 prodid;
  204. u32 prodid_mask;
  205. u64 filter_mask;
  206. u32 filter_default_val;
  207. const char *name_pattern;
  208. enum nv_cspmu_name_fmt name_fmt;
  209. struct attribute **event_attr;
  210. struct attribute **format_attr;
  211. };
  212. static const struct nv_cspmu_match nv_cspmu_match[] = {
  213. {
  214. .prodid = 0x103,
  215. .prodid_mask = NV_PRODID_MASK,
  216. .filter_mask = NV_PCIE_FILTER_ID_MASK,
  217. .filter_default_val = NV_PCIE_FILTER_ID_MASK,
  218. .name_pattern = "nvidia_pcie_pmu_%u",
  219. .name_fmt = NAME_FMT_SOCKET,
  220. .event_attr = mcf_pmu_event_attrs,
  221. .format_attr = pcie_pmu_format_attrs
  222. },
  223. {
  224. .prodid = 0x104,
  225. .prodid_mask = NV_PRODID_MASK,
  226. .filter_mask = 0x0,
  227. .filter_default_val = NV_NVL_C2C_FILTER_ID_MASK,
  228. .name_pattern = "nvidia_nvlink_c2c1_pmu_%u",
  229. .name_fmt = NAME_FMT_SOCKET,
  230. .event_attr = mcf_pmu_event_attrs,
  231. .format_attr = nvlink_c2c_pmu_format_attrs
  232. },
  233. {
  234. .prodid = 0x105,
  235. .prodid_mask = NV_PRODID_MASK,
  236. .filter_mask = 0x0,
  237. .filter_default_val = NV_NVL_C2C_FILTER_ID_MASK,
  238. .name_pattern = "nvidia_nvlink_c2c0_pmu_%u",
  239. .name_fmt = NAME_FMT_SOCKET,
  240. .event_attr = mcf_pmu_event_attrs,
  241. .format_attr = nvlink_c2c_pmu_format_attrs
  242. },
  243. {
  244. .prodid = 0x106,
  245. .prodid_mask = NV_PRODID_MASK,
  246. .filter_mask = NV_CNVL_FILTER_ID_MASK,
  247. .filter_default_val = NV_CNVL_FILTER_ID_MASK,
  248. .name_pattern = "nvidia_cnvlink_pmu_%u",
  249. .name_fmt = NAME_FMT_SOCKET,
  250. .event_attr = mcf_pmu_event_attrs,
  251. .format_attr = cnvlink_pmu_format_attrs
  252. },
  253. {
  254. .prodid = 0x2CF,
  255. .prodid_mask = NV_PRODID_MASK,
  256. .filter_mask = 0x0,
  257. .filter_default_val = 0x0,
  258. .name_pattern = "nvidia_scf_pmu_%u",
  259. .name_fmt = NAME_FMT_SOCKET,
  260. .event_attr = scf_pmu_event_attrs,
  261. .format_attr = scf_pmu_format_attrs
  262. },
  263. {
  264. .prodid = 0,
  265. .prodid_mask = 0,
  266. .filter_mask = NV_GENERIC_FILTER_ID_MASK,
  267. .filter_default_val = NV_GENERIC_FILTER_ID_MASK,
  268. .name_pattern = "nvidia_uncore_pmu_%u",
  269. .name_fmt = NAME_FMT_GENERIC,
  270. .event_attr = generic_pmu_event_attrs,
  271. .format_attr = generic_pmu_format_attrs
  272. },
  273. };
  274. static char *nv_cspmu_format_name(const struct arm_cspmu *cspmu,
  275. const struct nv_cspmu_match *match)
  276. {
  277. char *name;
  278. struct device *dev = cspmu->dev;
  279. static atomic_t pmu_generic_idx = {0};
  280. switch (match->name_fmt) {
  281. case NAME_FMT_SOCKET: {
  282. const int cpu = cpumask_first(&cspmu->associated_cpus);
  283. const int socket = cpu_to_node(cpu);
  284. name = devm_kasprintf(dev, GFP_KERNEL, match->name_pattern,
  285. socket);
  286. break;
  287. }
  288. case NAME_FMT_GENERIC:
  289. name = devm_kasprintf(dev, GFP_KERNEL, match->name_pattern,
  290. atomic_fetch_inc(&pmu_generic_idx));
  291. break;
  292. default:
  293. name = NULL;
  294. break;
  295. }
  296. return name;
  297. }
  298. static int nv_cspmu_init_ops(struct arm_cspmu *cspmu)
  299. {
  300. u32 prodid;
  301. struct nv_cspmu_ctx *ctx;
  302. struct device *dev = cspmu->dev;
  303. struct arm_cspmu_impl_ops *impl_ops = &cspmu->impl.ops;
  304. const struct nv_cspmu_match *match = nv_cspmu_match;
  305. ctx = devm_kzalloc(dev, sizeof(struct nv_cspmu_ctx), GFP_KERNEL);
  306. if (!ctx)
  307. return -ENOMEM;
  308. prodid = FIELD_GET(ARM_CSPMU_PMIIDR_PRODUCTID, cspmu->impl.pmiidr);
  309. /* Find matching PMU. */
  310. for (; match->prodid; match++) {
  311. const u32 prodid_mask = match->prodid_mask;
  312. if ((match->prodid & prodid_mask) == (prodid & prodid_mask))
  313. break;
  314. }
  315. ctx->name = nv_cspmu_format_name(cspmu, match);
  316. ctx->filter_mask = match->filter_mask;
  317. ctx->filter_default_val = match->filter_default_val;
  318. ctx->event_attr = match->event_attr;
  319. ctx->format_attr = match->format_attr;
  320. cspmu->impl.ctx = ctx;
  321. /* NVIDIA specific callbacks. */
  322. impl_ops->event_filter = nv_cspmu_event_filter;
  323. impl_ops->get_event_attrs = nv_cspmu_get_event_attrs;
  324. impl_ops->get_format_attrs = nv_cspmu_get_format_attrs;
  325. impl_ops->get_name = nv_cspmu_get_name;
  326. return 0;
  327. }
  328. /* Match all NVIDIA Coresight PMU devices */
  329. static const struct arm_cspmu_impl_match nv_cspmu_param = {
  330. .pmiidr_val = ARM_CSPMU_IMPL_ID_NVIDIA,
  331. .module = THIS_MODULE,
  332. .impl_init_ops = nv_cspmu_init_ops
  333. };
  334. static int __init nvidia_cspmu_init(void)
  335. {
  336. int ret;
  337. ret = arm_cspmu_impl_register(&nv_cspmu_param);
  338. if (ret)
  339. pr_err("nvidia_cspmu backend registration error: %d\n", ret);
  340. return ret;
  341. }
  342. static void __exit nvidia_cspmu_exit(void)
  343. {
  344. arm_cspmu_impl_unregister(&nv_cspmu_param);
  345. }
  346. module_init(nvidia_cspmu_init);
  347. module_exit(nvidia_cspmu_exit);
  348. MODULE_DESCRIPTION("NVIDIA Coresight Architecture Performance Monitor Driver");
  349. MODULE_LICENSE("GPL v2");