vas.h 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479
  1. /*
  2. * Copyright 2016-17 IBM Corp.
  3. *
  4. * This program is free software; you can redistribute it and/or
  5. * modify it under the terms of the GNU General Public License
  6. * as published by the Free Software Foundation; either version
  7. * 2 of the License, or (at your option) any later version.
  8. */
  9. #ifndef _VAS_H
  10. #define _VAS_H
  11. #include <linux/atomic.h>
  12. #include <linux/idr.h>
  13. #include <asm/vas.h>
  14. #include <linux/io.h>
  15. #include <linux/dcache.h>
  16. #include <linux/mutex.h>
  17. #include <linux/stringify.h>
  18. /*
  19. * Overview of Virtual Accelerator Switchboard (VAS).
  20. *
  21. * VAS is a hardware "switchboard" that allows senders and receivers to
  22. * exchange messages with _minimal_ kernel involvment. The receivers are
  23. * typically NX coprocessor engines that perform compression or encryption
  24. * in hardware, but receivers can also be other software threads.
  25. *
  26. * Senders are user/kernel threads that submit compression/encryption or
  27. * other requests to the receivers. Senders must format their messages as
  28. * Coprocessor Request Blocks (CRB)s and submit them using the "copy" and
  29. * "paste" instructions which were introduced in Power9.
  30. *
  31. * A Power node can have (upto?) 8 Power chips. There is one instance of
  32. * VAS in each Power9 chip. Each instance of VAS has 64K windows or ports,
  33. * Senders and receivers must each connect to a separate window before they
  34. * can exchange messages through the switchboard.
  35. *
  36. * Each window is described by two types of window contexts:
  37. *
  38. * Hypervisor Window Context (HVWC) of size VAS_HVWC_SIZE bytes
  39. *
  40. * OS/User Window Context (UWC) of size VAS_UWC_SIZE bytes.
  41. *
  42. * A window context can be viewed as a set of 64-bit registers. The settings
  43. * in these registers configure/control/determine the behavior of the VAS
  44. * hardware when messages are sent/received through the window. The registers
  45. * in the HVWC are configured by the kernel while the registers in the UWC can
  46. * be configured by the kernel or by the user space application that is using
  47. * the window.
  48. *
  49. * The HVWCs for all windows on a specific instance of VAS are in a contiguous
  50. * range of hardware addresses or Base address region (BAR) referred to as the
  51. * HVWC BAR for the instance. Similarly the UWCs for all windows on an instance
  52. * are referred to as the UWC BAR for the instance.
  53. *
  54. * The two BARs for each instance are defined Power9 MMIO Ranges spreadsheet
  55. * and available to the kernel in the VAS node's "reg" property in the device
  56. * tree:
  57. *
  58. * /proc/device-tree/vasm@.../reg
  59. *
  60. * (see vas_probe() for details on the reg property).
  61. *
  62. * The kernel maps the HVWC and UWC BAR regions into the kernel address
  63. * space (hvwc_map and uwc_map). The kernel can then access the window
  64. * contexts of a specific window using:
  65. *
  66. * hvwc = hvwc_map + winid * VAS_HVWC_SIZE.
  67. * uwc = uwc_map + winid * VAS_UWC_SIZE.
  68. *
  69. * where winid is the window index (0..64K).
  70. *
  71. * As mentioned, a window context is used to "configure" a window. Besides
  72. * this configuration address, each _send_ window also has a unique hardware
  73. * "paste" address that is used to submit requests/CRBs (see vas_paste_crb()).
  74. *
  75. * The hardware paste address for a window is computed using the "paste
  76. * base address" and "paste win id shift" reg properties in the VAS device
  77. * tree node using:
  78. *
  79. * paste_addr = paste_base + ((winid << paste_win_id_shift))
  80. *
  81. * (again, see vas_probe() for ->paste_base_addr and ->paste_win_id_shift).
  82. *
  83. * The kernel maps this hardware address into the sender's address space
  84. * after which they can use the 'paste' instruction (new in Power9) to
  85. * send a message (submit a request aka CRB) to the coprocessor.
  86. *
  87. * NOTE: In the initial version, senders can only in-kernel drivers/threads.
  88. * Support for user space threads will be added in follow-on patches.
  89. *
  90. * TODO: Do we need to map the UWC into user address space so they can return
  91. * credits? Its NA for NX but may be needed for other receive windows.
  92. *
  93. */
  94. #define VAS_WINDOWS_PER_CHIP (64 << 10)
  95. /*
  96. * Hypervisor and OS/USer Window Context sizes
  97. */
  98. #define VAS_HVWC_SIZE 512
  99. #define VAS_UWC_SIZE PAGE_SIZE
  100. /*
  101. * Initial per-process credits.
  102. * Max send window credits: 4K-1 (12-bits in VAS_TX_WCRED)
  103. * Max receive window credits: 64K-1 (16 bits in VAS_LRX_WCRED)
  104. *
  105. * TODO: Needs tuning for per-process credits
  106. */
  107. #define VAS_RX_WCREDS_MAX ((64 << 10) - 1)
  108. #define VAS_TX_WCREDS_MAX ((4 << 10) - 1)
  109. #define VAS_WCREDS_DEFAULT (1 << 10)
  110. /*
  111. * VAS Window Context Register Offsets and bitmasks.
  112. * See Section 3.1.4 of VAS Work book
  113. */
  114. #define VAS_LPID_OFFSET 0x010
  115. #define VAS_LPID PPC_BITMASK(0, 11)
  116. #define VAS_PID_OFFSET 0x018
  117. #define VAS_PID_ID PPC_BITMASK(0, 19)
  118. #define VAS_XLATE_MSR_OFFSET 0x020
  119. #define VAS_XLATE_MSR_DR PPC_BIT(0)
  120. #define VAS_XLATE_MSR_TA PPC_BIT(1)
  121. #define VAS_XLATE_MSR_PR PPC_BIT(2)
  122. #define VAS_XLATE_MSR_US PPC_BIT(3)
  123. #define VAS_XLATE_MSR_HV PPC_BIT(4)
  124. #define VAS_XLATE_MSR_SF PPC_BIT(5)
  125. #define VAS_XLATE_LPCR_OFFSET 0x028
  126. #define VAS_XLATE_LPCR_PAGE_SIZE PPC_BITMASK(0, 2)
  127. #define VAS_XLATE_LPCR_ISL PPC_BIT(3)
  128. #define VAS_XLATE_LPCR_TC PPC_BIT(4)
  129. #define VAS_XLATE_LPCR_SC PPC_BIT(5)
  130. #define VAS_XLATE_CTL_OFFSET 0x030
  131. #define VAS_XLATE_MODE PPC_BITMASK(0, 1)
  132. #define VAS_AMR_OFFSET 0x040
  133. #define VAS_AMR PPC_BITMASK(0, 63)
  134. #define VAS_SEIDR_OFFSET 0x048
  135. #define VAS_SEIDR PPC_BITMASK(0, 63)
  136. #define VAS_FAULT_TX_WIN_OFFSET 0x050
  137. #define VAS_FAULT_TX_WIN PPC_BITMASK(48, 63)
  138. #define VAS_OSU_INTR_SRC_RA_OFFSET 0x060
  139. #define VAS_OSU_INTR_SRC_RA PPC_BITMASK(8, 63)
  140. #define VAS_HV_INTR_SRC_RA_OFFSET 0x070
  141. #define VAS_HV_INTR_SRC_RA PPC_BITMASK(8, 63)
  142. #define VAS_PSWID_OFFSET 0x078
  143. #define VAS_PSWID_EA_HANDLE PPC_BITMASK(0, 31)
  144. #define VAS_SPARE1_OFFSET 0x080
  145. #define VAS_SPARE2_OFFSET 0x088
  146. #define VAS_SPARE3_OFFSET 0x090
  147. #define VAS_SPARE4_OFFSET 0x130
  148. #define VAS_SPARE5_OFFSET 0x160
  149. #define VAS_SPARE6_OFFSET 0x188
  150. #define VAS_LFIFO_BAR_OFFSET 0x0A0
  151. #define VAS_LFIFO_BAR PPC_BITMASK(8, 53)
  152. #define VAS_PAGE_MIGRATION_SELECT PPC_BITMASK(54, 56)
  153. #define VAS_LDATA_STAMP_CTL_OFFSET 0x0A8
  154. #define VAS_LDATA_STAMP PPC_BITMASK(0, 1)
  155. #define VAS_XTRA_WRITE PPC_BIT(2)
  156. #define VAS_LDMA_CACHE_CTL_OFFSET 0x0B0
  157. #define VAS_LDMA_TYPE PPC_BITMASK(0, 1)
  158. #define VAS_LDMA_FIFO_DISABLE PPC_BIT(2)
  159. #define VAS_LRFIFO_PUSH_OFFSET 0x0B8
  160. #define VAS_LRFIFO_PUSH PPC_BITMASK(0, 15)
  161. #define VAS_CURR_MSG_COUNT_OFFSET 0x0C0
  162. #define VAS_CURR_MSG_COUNT PPC_BITMASK(0, 7)
  163. #define VAS_LNOTIFY_AFTER_COUNT_OFFSET 0x0C8
  164. #define VAS_LNOTIFY_AFTER_COUNT PPC_BITMASK(0, 7)
  165. #define VAS_LRX_WCRED_OFFSET 0x0E0
  166. #define VAS_LRX_WCRED PPC_BITMASK(0, 15)
  167. #define VAS_LRX_WCRED_ADDER_OFFSET 0x190
  168. #define VAS_LRX_WCRED_ADDER PPC_BITMASK(0, 15)
  169. #define VAS_TX_WCRED_OFFSET 0x0F0
  170. #define VAS_TX_WCRED PPC_BITMASK(4, 15)
  171. #define VAS_TX_WCRED_ADDER_OFFSET 0x1A0
  172. #define VAS_TX_WCRED_ADDER PPC_BITMASK(4, 15)
  173. #define VAS_LFIFO_SIZE_OFFSET 0x100
  174. #define VAS_LFIFO_SIZE PPC_BITMASK(0, 3)
  175. #define VAS_WINCTL_OFFSET 0x108
  176. #define VAS_WINCTL_OPEN PPC_BIT(0)
  177. #define VAS_WINCTL_REJ_NO_CREDIT PPC_BIT(1)
  178. #define VAS_WINCTL_PIN PPC_BIT(2)
  179. #define VAS_WINCTL_TX_WCRED_MODE PPC_BIT(3)
  180. #define VAS_WINCTL_RX_WCRED_MODE PPC_BIT(4)
  181. #define VAS_WINCTL_TX_WORD_MODE PPC_BIT(5)
  182. #define VAS_WINCTL_RX_WORD_MODE PPC_BIT(6)
  183. #define VAS_WINCTL_RSVD_TXBUF PPC_BIT(7)
  184. #define VAS_WINCTL_THRESH_CTL PPC_BITMASK(8, 9)
  185. #define VAS_WINCTL_FAULT_WIN PPC_BIT(10)
  186. #define VAS_WINCTL_NX_WIN PPC_BIT(11)
  187. #define VAS_WIN_STATUS_OFFSET 0x110
  188. #define VAS_WIN_BUSY PPC_BIT(1)
  189. #define VAS_WIN_CTX_CACHING_CTL_OFFSET 0x118
  190. #define VAS_CASTOUT_REQ PPC_BIT(0)
  191. #define VAS_PUSH_TO_MEM PPC_BIT(1)
  192. #define VAS_WIN_CACHE_STATUS PPC_BIT(4)
  193. #define VAS_TX_RSVD_BUF_COUNT_OFFSET 0x120
  194. #define VAS_RXVD_BUF_COUNT PPC_BITMASK(58, 63)
  195. #define VAS_LRFIFO_WIN_PTR_OFFSET 0x128
  196. #define VAS_LRX_WIN_ID PPC_BITMASK(0, 15)
  197. /*
  198. * Local Notification Control Register controls what happens in _response_
  199. * to a paste command and hence applies only to receive windows.
  200. */
  201. #define VAS_LNOTIFY_CTL_OFFSET 0x138
  202. #define VAS_NOTIFY_DISABLE PPC_BIT(0)
  203. #define VAS_INTR_DISABLE PPC_BIT(1)
  204. #define VAS_NOTIFY_EARLY PPC_BIT(2)
  205. #define VAS_NOTIFY_OSU_INTR PPC_BIT(3)
  206. #define VAS_LNOTIFY_PID_OFFSET 0x140
  207. #define VAS_LNOTIFY_PID PPC_BITMASK(0, 19)
  208. #define VAS_LNOTIFY_LPID_OFFSET 0x148
  209. #define VAS_LNOTIFY_LPID PPC_BITMASK(0, 11)
  210. #define VAS_LNOTIFY_TID_OFFSET 0x150
  211. #define VAS_LNOTIFY_TID PPC_BITMASK(0, 15)
  212. #define VAS_LNOTIFY_SCOPE_OFFSET 0x158
  213. #define VAS_LNOTIFY_MIN_SCOPE PPC_BITMASK(0, 1)
  214. #define VAS_LNOTIFY_MAX_SCOPE PPC_BITMASK(2, 3)
  215. #define VAS_NX_UTIL_OFFSET 0x1B0
  216. #define VAS_NX_UTIL PPC_BITMASK(0, 63)
  217. /* SE: Side effects */
  218. #define VAS_NX_UTIL_SE_OFFSET 0x1B8
  219. #define VAS_NX_UTIL_SE PPC_BITMASK(0, 63)
  220. #define VAS_NX_UTIL_ADDER_OFFSET 0x180
  221. #define VAS_NX_UTIL_ADDER PPC_BITMASK(32, 63)
  222. /*
  223. * VREG(x):
  224. * Expand a register's short name (eg: LPID) into two parameters:
  225. * - the register's short name in string form ("LPID"), and
  226. * - the name of the macro (eg: VAS_LPID_OFFSET), defining the
  227. * register's offset in the window context
  228. */
  229. #define VREG_SFX(n, s) __stringify(n), VAS_##n##s
  230. #define VREG(r) VREG_SFX(r, _OFFSET)
  231. /*
  232. * Local Notify Scope Control Register. (Receive windows only).
  233. */
  234. enum vas_notify_scope {
  235. VAS_SCOPE_LOCAL,
  236. VAS_SCOPE_GROUP,
  237. VAS_SCOPE_VECTORED_GROUP,
  238. VAS_SCOPE_UNUSED,
  239. };
  240. /*
  241. * Local DMA Cache Control Register (Receive windows only).
  242. */
  243. enum vas_dma_type {
  244. VAS_DMA_TYPE_INJECT,
  245. VAS_DMA_TYPE_WRITE,
  246. };
  247. /*
  248. * Local Notify Scope Control Register. (Receive windows only).
  249. * Not applicable to NX receive windows.
  250. */
  251. enum vas_notify_after_count {
  252. VAS_NOTIFY_AFTER_256 = 0,
  253. VAS_NOTIFY_NONE,
  254. VAS_NOTIFY_AFTER_2
  255. };
  256. /*
  257. * One per instance of VAS. Each instance will have a separate set of
  258. * receive windows, one per coprocessor type.
  259. *
  260. * See also function header of set_vinst_win() for details on ->windows[]
  261. * and ->rxwin[] tables.
  262. */
  263. struct vas_instance {
  264. int vas_id;
  265. struct ida ida;
  266. struct list_head node;
  267. struct platform_device *pdev;
  268. u64 hvwc_bar_start;
  269. u64 uwc_bar_start;
  270. u64 paste_base_addr;
  271. u64 paste_win_id_shift;
  272. struct mutex mutex;
  273. struct vas_window *rxwin[VAS_COP_TYPE_MAX];
  274. struct vas_window *windows[VAS_WINDOWS_PER_CHIP];
  275. char *dbgname;
  276. struct dentry *dbgdir;
  277. };
  278. /*
  279. * In-kernel state a VAS window. One per window.
  280. */
  281. struct vas_window {
  282. /* Fields common to send and receive windows */
  283. struct vas_instance *vinst;
  284. int winid;
  285. bool tx_win; /* True if send window */
  286. bool nx_win; /* True if NX window */
  287. bool user_win; /* True if user space window */
  288. void *hvwc_map; /* HV window context */
  289. void *uwc_map; /* OS/User window context */
  290. pid_t pid; /* Linux process id of owner */
  291. int wcreds_max; /* Window credits */
  292. char *dbgname;
  293. struct dentry *dbgdir;
  294. /* Fields applicable only to send windows */
  295. void *paste_kaddr;
  296. char *paste_addr_name;
  297. struct vas_window *rxwin;
  298. /* Feilds applicable only to receive windows */
  299. enum vas_cop_type cop;
  300. atomic_t num_txwins;
  301. };
  302. /*
  303. * Container for the hardware state of a window. One per-window.
  304. *
  305. * A VAS Window context is a 512-byte area in the hardware that contains
  306. * a set of 64-bit registers. Individual bit-fields in these registers
  307. * determine the configuration/operation of the hardware. struct vas_winctx
  308. * is a container for the register fields in the window context.
  309. */
  310. struct vas_winctx {
  311. void *rx_fifo;
  312. int rx_fifo_size;
  313. int wcreds_max;
  314. int rsvd_txbuf_count;
  315. bool user_win;
  316. bool nx_win;
  317. bool fault_win;
  318. bool rsvd_txbuf_enable;
  319. bool pin_win;
  320. bool rej_no_credit;
  321. bool tx_wcred_mode;
  322. bool rx_wcred_mode;
  323. bool tx_word_mode;
  324. bool rx_word_mode;
  325. bool data_stamp;
  326. bool xtra_write;
  327. bool notify_disable;
  328. bool intr_disable;
  329. bool fifo_disable;
  330. bool notify_early;
  331. bool notify_os_intr_reg;
  332. int lpid;
  333. int pidr; /* value from SPRN_PID, not linux pid */
  334. int lnotify_lpid;
  335. int lnotify_pid;
  336. int lnotify_tid;
  337. u32 pswid;
  338. int rx_win_id;
  339. int fault_win_id;
  340. int tc_mode;
  341. u64 irq_port;
  342. enum vas_dma_type dma_type;
  343. enum vas_notify_scope min_scope;
  344. enum vas_notify_scope max_scope;
  345. enum vas_notify_after_count notify_after_count;
  346. };
  347. extern struct mutex vas_mutex;
  348. extern struct vas_instance *find_vas_instance(int vasid);
  349. extern void vas_init_dbgdir(void);
  350. extern void vas_instance_init_dbgdir(struct vas_instance *vinst);
  351. extern void vas_window_init_dbgdir(struct vas_window *win);
  352. extern void vas_window_free_dbgdir(struct vas_window *win);
  353. static inline void vas_log_write(struct vas_window *win, char *name,
  354. void *regptr, u64 val)
  355. {
  356. if (val)
  357. pr_debug("%swin #%d: %s reg %p, val 0x%016llx\n",
  358. win->tx_win ? "Tx" : "Rx", win->winid, name,
  359. regptr, val);
  360. }
  361. static inline void write_uwc_reg(struct vas_window *win, char *name,
  362. s32 reg, u64 val)
  363. {
  364. void *regptr;
  365. regptr = win->uwc_map + reg;
  366. vas_log_write(win, name, regptr, val);
  367. out_be64(regptr, val);
  368. }
  369. static inline void write_hvwc_reg(struct vas_window *win, char *name,
  370. s32 reg, u64 val)
  371. {
  372. void *regptr;
  373. regptr = win->hvwc_map + reg;
  374. vas_log_write(win, name, regptr, val);
  375. out_be64(regptr, val);
  376. }
  377. static inline u64 read_hvwc_reg(struct vas_window *win,
  378. char *name __maybe_unused, s32 reg)
  379. {
  380. return in_be64(win->hvwc_map+reg);
  381. }
  382. /*
  383. * Encode/decode the Partition Send Window ID (PSWID) for a window in
  384. * a way that we can uniquely identify any window in the system. i.e.
  385. * we should be able to locate the 'struct vas_window' given the PSWID.
  386. *
  387. * Bits Usage
  388. * 0:7 VAS id (8 bits)
  389. * 8:15 Unused, 0 (3 bits)
  390. * 16:31 Window id (16 bits)
  391. */
  392. static inline u32 encode_pswid(int vasid, int winid)
  393. {
  394. u32 pswid = 0;
  395. pswid |= vasid << (31 - 7);
  396. pswid |= winid;
  397. return pswid;
  398. }
  399. static inline void decode_pswid(u32 pswid, int *vasid, int *winid)
  400. {
  401. if (vasid)
  402. *vasid = pswid >> (31 - 7) & 0xFF;
  403. if (winid)
  404. *winid = pswid & 0xFFFF;
  405. }
  406. #endif /* _VAS_H */