hyperv_vmbus.h 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488
  1. /* SPDX-License-Identifier: GPL-2.0-only */
  2. /*
  3. *
  4. * Copyright (c) 2011, Microsoft Corporation.
  5. *
  6. * Authors:
  7. * Haiyang Zhang <haiyangz@microsoft.com>
  8. * Hank Janssen <hjanssen@microsoft.com>
  9. * K. Y. Srinivasan <kys@microsoft.com>
  10. */
  11. #ifndef _HYPERV_VMBUS_H
  12. #define _HYPERV_VMBUS_H
  13. #include <linux/list.h>
  14. #include <linux/bitops.h>
  15. #include <asm/sync_bitops.h>
  16. #include <asm/hyperv-tlfs.h>
  17. #include <linux/atomic.h>
  18. #include <linux/hyperv.h>
  19. #include <linux/interrupt.h>
  20. #include "hv_trace.h"
  /*
   * Timeout applied to utility services such as KVP and fcopy.
   */
  #define HV_UTIL_TIMEOUT 30

  /*
   * Timeout applied to the guest-host handshake (negotiation) of services.
   */
  #define HV_UTIL_NEGO_TIMEOUT 55
  29. /* Definitions for the monitored notification facility */
  30. union hv_monitor_trigger_group {
  31. u64 as_uint64;
  32. struct {
  33. u32 pending;
  34. u32 armed;
  35. };
  36. };
  37. struct hv_monitor_parameter {
  38. union hv_connection_id connectionid;
  39. u16 flagnumber;
  40. u16 rsvdz;
  41. };
  42. union hv_monitor_trigger_state {
  43. u32 asu32;
  44. struct {
  45. u32 group_enable:4;
  46. u32 rsvdz:28;
  47. };
  48. };
  49. /* struct hv_monitor_page Layout */
  50. /* ------------------------------------------------------ */
  51. /* | 0 | TriggerState (4 bytes) | Rsvd1 (4 bytes) | */
  52. /* | 8 | TriggerGroup[0] | */
  53. /* | 10 | TriggerGroup[1] | */
  54. /* | 18 | TriggerGroup[2] | */
  55. /* | 20 | TriggerGroup[3] | */
  56. /* | 28 | Rsvd2[0] | */
  57. /* | 30 | Rsvd2[1] | */
  58. /* | 38 | Rsvd2[2] | */
  59. /* | 40 | NextCheckTime[0][0] | NextCheckTime[0][1] | */
  60. /* | ... | */
  61. /* | 240 | Latency[0][0..3] | */
  62. /* | 340 | Rsvz3[0] | */
  63. /* | 440 | Parameter[0][0] | */
  64. /* | 448 | Parameter[0][1] | */
  65. /* | ... | */
  66. /* | 840 | Rsvd4[0] | */
  67. /* ------------------------------------------------------ */
  68. struct hv_monitor_page {
  69. union hv_monitor_trigger_state trigger_state;
  70. u32 rsvdz1;
  71. union hv_monitor_trigger_group trigger_group[4];
  72. u64 rsvdz2[3];
  73. s32 next_checktime[4][32];
  74. u16 latency[4][32];
  75. u64 rsvdz3[32];
  76. struct hv_monitor_parameter parameter[4][32];
  77. u8 rsvdz4[1984];
  78. };
  /* Hypercall parameter alignment, expressed as the size of a u64. */
  #define HV_HYPERCALL_PARAM_ALIGN sizeof(u64)
  80. /* Definition of the hv_post_message hypercall input structure. */
  81. struct hv_input_post_message {
  82. union hv_connection_id connectionid;
  83. u32 reserved;
  84. u32 message_type;
  85. u32 payload_size;
  86. u64 payload[HV_MESSAGE_PAYLOAD_QWORD_COUNT];
  87. };
  /*
   * VMBus id constants. Every enumerator carries an explicit value, so
   * the grouping below is purely for readability.
   */
  enum {
      /* *_CONNECTION_ID values */
      VMBUS_MESSAGE_CONNECTION_ID   = 1,
      VMBUS_MESSAGE_CONNECTION_ID_4 = 4,
      VMBUS_EVENT_CONNECTION_ID     = 2,
      VMBUS_MONITOR_CONNECTION_ID   = 3,

      /* *_PORT_ID values */
      VMBUS_MESSAGE_PORT_ID         = 1,
      VMBUS_EVENT_PORT_ID           = 2,
      VMBUS_MONITOR_PORT_ID         = 3,

      /* SINT value */
      VMBUS_MESSAGE_SINT            = 2,
  };
  98. /*
  99. * Per cpu state for channel handling
  100. */
  101. struct hv_per_cpu_context {
  102. void *synic_message_page;
  103. void *synic_event_page;
  104. /*
  105. * The page is only used in hv_post_message() for a TDX VM (with the
  106. * paravisor) to post a messages to Hyper-V: when such a VM calls
  107. * HVCALL_POST_MESSAGE, it can't use the hyperv_pcpu_input_arg (which
  108. * is encrypted in such a VM) as the hypercall input page, because
  109. * the input page for HVCALL_POST_MESSAGE must be decrypted in such a
  110. * VM, so post_msg_page (which is decrypted in hv_synic_alloc()) is
  111. * introduced for this purpose. See hyperv_init() for more comments.
  112. */
  113. void *post_msg_page;
  114. /*
  115. * Starting with win8, we can take channel interrupts on any CPU;
  116. * we will manage the tasklet that handles events messages on a per CPU
  117. * basis.
  118. */
  119. struct tasklet_struct msg_dpc;
  120. };
  121. struct hv_context {
  122. /* We only support running on top of Hyper-V
  123. * So at this point this really can only contain the Hyper-V ID
  124. */
  125. u64 guestid;
  126. struct hv_per_cpu_context __percpu *cpu_context;
  127. /*
  128. * To manage allocations in a NUMA node.
  129. * Array indexed by numa node ID.
  130. */
  131. struct cpumask *hv_numa_map;
  132. };
  133. extern struct hv_context hv_context;
  /*
   * Hv interface.
   *
   * Function declarations have external linkage by default, so these
   * prototypes are written without an explicit "extern".
   */
  int hv_init(void);

  int hv_post_message(union hv_connection_id connection_id,
                      enum hv_message_type message_type,
                      void *payload, size_t payload_size);

  int hv_synic_alloc(void);
  void hv_synic_free(void);

  void hv_synic_enable_regs(unsigned int cpu);
  int hv_synic_init(unsigned int cpu);

  void hv_synic_disable_regs(unsigned int cpu);
  int hv_synic_cleanup(unsigned int cpu);
  145. /* Interface */
  146. void hv_ringbuffer_pre_init(struct vmbus_channel *channel);
  147. int hv_ringbuffer_init(struct hv_ring_buffer_info *ring_info,
  148. struct page *pages, u32 pagecnt, u32 max_pkt_size);
  149. void hv_ringbuffer_cleanup(struct hv_ring_buffer_info *ring_info);
  150. int hv_ringbuffer_write(struct vmbus_channel *channel,
  151. const struct kvec *kv_list, u32 kv_count,
  152. u64 requestid, u64 *trans_id);
  153. int hv_ringbuffer_read(struct vmbus_channel *channel,
  154. void *buffer, u32 buflen, u32 *buffer_actual_len,
  155. u64 *requestid, bool raw);
  /*
   * The maximum number of channels (16384) follows from the size of the
   * interrupt page, which is HV_HYP_PAGE_SIZE: one half of the page is
   * used to send endpoint interrupts and the other half to receive them.
   * The macro takes half the page size and multiplies it by 8 (<< 3).
   */
  #define MAX_NUM_CHANNELS ((HV_HYP_PAGE_SIZE >> 1) << 3)

  /* This value must be a multiple of 32. */
  #define MAX_NUM_CHANNELS_SUPPORTED 256

  /* The larger of MAX_NUM_CHANNELS_SUPPORTED and HV_EVENT_FLAGS_COUNT. */
  #define MAX_CHANNEL_RELIDS \
      max(MAX_NUM_CHANNELS_SUPPORTED, HV_EVENT_FLAGS_COUNT)
  /*
   * Connection state values stored in vmbus_connection.conn_state.
   * Values are consecutive, starting at 0.
   */
  enum vmbus_connect_state {
      DISCONNECTED  = 0,
      CONNECTING    = 1,
      CONNECTED     = 2,
      DISCONNECTING = 3
  };
  /* Largest channel message size: equal to HV_MESSAGE_PAYLOAD_BYTE_COUNT. */
  #define MAX_SIZE_CHANNEL_MESSAGE HV_MESSAGE_PAYLOAD_BYTE_COUNT
  /*
   * CPU that Hyper-V interrupts for VMBUS messages such as
   * CHANNELMSG_OFFERCHANNEL and CHANNELMSG_RESCIND_CHANNELOFFER.
   */
  #define VMBUS_CONNECT_CPU 0
  178. struct vmbus_connection {
  179. u32 msg_conn_id;
  180. atomic_t offer_in_progress;
  181. enum vmbus_connect_state conn_state;
  182. atomic_t next_gpadl_handle;
  183. struct completion unload_event;
  184. /*
  185. * Represents channel interrupts. Each bit position represents a
  186. * channel. When a channel sends an interrupt via VMBUS, it finds its
  187. * bit in the sendInterruptPage, set it and calls Hv to generate a port
  188. * event. The other end receives the port event and parse the
  189. * recvInterruptPage to see which bit is set
  190. */
  191. void *int_page;
  192. void *send_int_page;
  193. void *recv_int_page;
  194. /*
  195. * 2 pages - 1st page for parent->child notification and 2nd
  196. * is child->parent notification
  197. */
  198. struct hv_monitor_page *monitor_pages[2];
  199. struct list_head chn_msg_list;
  200. spinlock_t channelmsg_lock;
  201. /* List of channels */
  202. struct list_head chn_list;
  203. struct mutex channel_mutex;
  204. /* Array of channels */
  205. struct vmbus_channel **channels;
  206. /*
  207. * An offer message is handled first on the work_queue, and then
  208. * is further handled on handle_primary_chan_wq or
  209. * handle_sub_chan_wq.
  210. */
  211. struct workqueue_struct *work_queue;
  212. struct workqueue_struct *handle_primary_chan_wq;
  213. struct workqueue_struct *handle_sub_chan_wq;
  214. struct workqueue_struct *rescind_work_queue;
  215. /*
  216. * On suspension of the vmbus, the accumulated offer messages
  217. * must be dropped.
  218. */
  219. bool ignore_any_offer_msg;
  220. /*
  221. * The number of sub-channels and hv_sock channels that should be
  222. * cleaned up upon suspend: sub-channels will be re-created upon
  223. * resume, and hv_sock channels should not survive suspend.
  224. */
  225. atomic_t nr_chan_close_on_suspend;
  226. /*
  227. * vmbus_bus_suspend() waits for "nr_chan_close_on_suspend" to
  228. * drop to zero.
  229. */
  230. struct completion ready_for_suspend_event;
  231. /*
  232. * The number of primary channels that should be "fixed up"
  233. * upon resume: these channels are re-offered upon resume, and some
  234. * fields of the channel offers (i.e. child_relid and connection_id)
  235. * can change, so the old offermsg must be fixed up, before the resume
  236. * callbacks of the VSC drivers start to further touch the channels.
  237. */
  238. atomic_t nr_chan_fixup_on_resume;
  239. /*
  240. * vmbus_bus_resume() waits for "nr_chan_fixup_on_resume" to
  241. * drop to zero.
  242. */
  243. struct completion ready_for_resume_event;
  244. };
  245. struct vmbus_msginfo {
  246. /* Bookkeeping stuff */
  247. struct list_head msglist_entry;
  248. /* The message itself */
  249. unsigned char msg[];
  250. };
  251. extern struct vmbus_connection vmbus_connection;
  252. int vmbus_negotiate_version(struct vmbus_channel_msginfo *msginfo, u32 version);
  253. static inline void vmbus_send_interrupt(u32 relid)
  254. {
  255. sync_set_bit(relid, vmbus_connection.send_int_page);
  256. }
  /* Says whether a message handler is allowed to sleep. */
  enum vmbus_message_handler_type {
      VMHT_BLOCKING     = 0,  /* the related handler can sleep */
      VMHT_NON_BLOCKING = 1,  /* the related handler must NOT sleep */
  };
  263. struct vmbus_channel_message_table_entry {
  264. enum vmbus_channel_message_type message_type;
  265. enum vmbus_message_handler_type handler_type;
  266. void (*message_handler)(struct vmbus_channel_message_header *msg);
  267. u32 min_payload_len;
  268. };
  269. extern const struct vmbus_channel_message_table_entry
  270. channel_message_table[CHANNELMSG_COUNT];
  271. /* General vmbus interface */
  272. struct hv_device *vmbus_device_create(const guid_t *type,
  273. const guid_t *instance,
  274. struct vmbus_channel *channel);
  275. int vmbus_device_register(struct hv_device *child_device_obj);
  276. void vmbus_device_unregister(struct hv_device *device_obj);
  277. int vmbus_add_channel_kobj(struct hv_device *device_obj,
  278. struct vmbus_channel *channel);
  279. void vmbus_remove_channel_attr_group(struct vmbus_channel *channel);
  280. void vmbus_channel_map_relid(struct vmbus_channel *channel);
  281. void vmbus_channel_unmap_relid(struct vmbus_channel *channel);
  282. struct vmbus_channel *relid2channel(u32 relid);
  283. void vmbus_free_channels(void);
  /* Connection interface */
  int vmbus_connect(void);
  void vmbus_disconnect(void);

  int vmbus_post_msg(void *buffer, size_t buflen, bool can_sleep);

  void vmbus_on_event(unsigned long data);
  void vmbus_on_msg_dpc(unsigned long data);
  /* KVP service entry points */
  int hv_kvp_init(struct hv_util_service *srv);
  int hv_kvp_init_transport(void);
  void hv_kvp_deinit(void);

  int hv_kvp_pre_suspend(void);
  int hv_kvp_pre_resume(void);

  void hv_kvp_onchannelcallback(void *context);
  /* VSS service entry points */
  int hv_vss_init(struct hv_util_service *srv);
  int hv_vss_init_transport(void);
  void hv_vss_deinit(void);

  int hv_vss_pre_suspend(void);
  int hv_vss_pre_resume(void);

  void hv_vss_onchannelcallback(void *context);
  /* Start a vmbus unload; @crash is passed through by the caller. */
  void vmbus_initiate_unload(bool crash);
  /*
   * Invoke @cb with @channel as its argument.
   *
   * Nothing is done (and @cb is not touched) when @channel is NULL.
   */
  static inline void hv_poll_channel(struct vmbus_channel *channel,
                                     void (*cb)(void *))
  {
      if (channel)
          cb(channel);
  }
  /* States of an hvutil device; values are consecutive, starting at 0. */
  enum hvutil_device_state {
      /* driver is loaded, waiting for userspace */
      HVUTIL_DEVICE_INIT = 0,
      /* userspace is registered */
      HVUTIL_READY,
      /* message from the host was received */
      HVUTIL_HOSTMSG_RECEIVED,
      /* request to userspace was sent */
      HVUTIL_USERSPACE_REQ,
      /* reply from userspace was received */
      HVUTIL_USERSPACE_RECV,
      /* driver unload is in progress */
      HVUTIL_DEVICE_DYING,
  };
  /* Delay type selector, taken as an argument by hv_debug_delay_test(). */
  enum delay {
      INTERRUPT_DELAY = 0,
      MESSAGE_DELAY   = 1,
  };
  322. extern const struct vmbus_device vmbus_devs[];
  323. static inline bool hv_is_perf_channel(struct vmbus_channel *channel)
  324. {
  325. return vmbus_devs[channel->device_id].perf_device;
  326. }
  327. static inline size_t hv_dev_ring_size(struct vmbus_channel *channel)
  328. {
  329. return vmbus_devs[channel->device_id].pref_ring_size;
  330. }
  331. static inline bool hv_is_allocated_cpu(unsigned int cpu)
  332. {
  333. struct vmbus_channel *channel, *sc;
  334. lockdep_assert_held(&vmbus_connection.channel_mutex);
  335. /*
  336. * List additions/deletions as well as updates of the target CPUs are
  337. * protected by channel_mutex.
  338. */
  339. list_for_each_entry(channel, &vmbus_connection.chn_list, listentry) {
  340. if (!hv_is_perf_channel(channel))
  341. continue;
  342. if (channel->target_cpu == cpu)
  343. return true;
  344. list_for_each_entry(sc, &channel->sc_list, sc_list) {
  345. if (sc->target_cpu == cpu)
  346. return true;
  347. }
  348. }
  349. return false;
  350. }
  351. static inline void hv_set_allocated_cpu(unsigned int cpu)
  352. {
  353. cpumask_set_cpu(cpu, &hv_context.hv_numa_map[cpu_to_node(cpu)]);
  354. }
  355. static inline void hv_clear_allocated_cpu(unsigned int cpu)
  356. {
  357. if (hv_is_allocated_cpu(cpu))
  358. return;
  359. cpumask_clear_cpu(cpu, &hv_context.hv_numa_map[cpu_to_node(cpu)]);
  360. }
  /*
   * Record a target CPU change from @old_cpu to @new_cpu: @new_cpu is
   * marked first, then @old_cpu goes through hv_clear_allocated_cpu().
   * The order of the two calls is kept as is.
   */
  static inline void hv_update_allocated_cpus(unsigned int old_cpu,
                                              unsigned int new_cpu)
  {
      /* Step 1: mark the new CPU. */
      hv_set_allocated_cpu(new_cpu);

      /* Step 2: release the old CPU (a no-op if it is still in use). */
      hv_clear_allocated_cpu(old_cpu);
  }
  367. #ifdef CONFIG_HYPERV_TESTING
  368. int hv_debug_add_dev_dir(struct hv_device *dev);
  369. void hv_debug_rm_dev_dir(struct hv_device *dev);
  370. void hv_debug_rm_all_dir(void);
  371. int hv_debug_init(void);
  372. void hv_debug_delay_test(struct vmbus_channel *channel, enum delay delay_type);
  373. #else /* CONFIG_HYPERV_TESTING */
  374. static inline void hv_debug_rm_dev_dir(struct hv_device *dev) {};
  375. static inline void hv_debug_rm_all_dir(void) {};
  376. static inline void hv_debug_delay_test(struct vmbus_channel *channel,
  377. enum delay delay_type) {};
  378. static inline int hv_debug_init(void)
  379. {
  380. return -1;
  381. }
  382. static inline int hv_debug_add_dev_dir(struct hv_device *dev)
  383. {
  384. return -1;
  385. }
  386. #endif /* CONFIG_HYPERV_TESTING */
  387. #endif /* _HYPERV_VMBUS_H */