balloon.c 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785
  1. /******************************************************************************
  2. * Xen balloon driver - enables returning/claiming memory to/from Xen.
  3. *
  4. * Copyright (c) 2003, B Dragovic
  5. * Copyright (c) 2003-2004, M Williamson, K Fraser
  6. * Copyright (c) 2005 Dan M. Smith, IBM Corporation
  7. * Copyright (c) 2010 Daniel Kiper
  8. *
  9. * Memory hotplug support was written by Daniel Kiper. Work on
  10. * it was sponsored by Google under Google Summer of Code 2010
  11. * program. Jeremy Fitzhardinge from Citrix was the mentor for
  12. * this project.
  13. *
  14. * This program is free software; you can redistribute it and/or
  15. * modify it under the terms of the GNU General Public License version 2
  16. * as published by the Free Software Foundation; or, when distributed
  17. * separately from the Linux kernel or incorporated into other
  18. * software packages, subject to the following license:
  19. *
  20. * Permission is hereby granted, free of charge, to any person obtaining a copy
  21. * of this source file (the "Software"), to deal in the Software without
  22. * restriction, including without limitation the rights to use, copy, modify,
  23. * merge, publish, distribute, sublicense, and/or sell copies of the Software,
  24. * and to permit persons to whom the Software is furnished to do so, subject to
  25. * the following conditions:
  26. *
  27. * The above copyright notice and this permission notice shall be included in
  28. * all copies or substantial portions of the Software.
  29. *
  30. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  31. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  32. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  33. * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  34. * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
  35. * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
  36. * IN THE SOFTWARE.
  37. */
  38. #define pr_fmt(fmt) "xen:" KBUILD_MODNAME ": " fmt
  39. #include <linux/cpu.h>
  40. #include <linux/kernel.h>
  41. #include <linux/sched.h>
  42. #include <linux/cred.h>
  43. #include <linux/errno.h>
  44. #include <linux/freezer.h>
  45. #include <linux/kthread.h>
  46. #include <linux/mm.h>
  47. #include <linux/memblock.h>
  48. #include <linux/pagemap.h>
  49. #include <linux/highmem.h>
  50. #include <linux/mutex.h>
  51. #include <linux/list.h>
  52. #include <linux/gfp.h>
  53. #include <linux/notifier.h>
  54. #include <linux/memory.h>
  55. #include <linux/memory_hotplug.h>
  56. #include <linux/percpu-defs.h>
  57. #include <linux/slab.h>
  58. #include <linux/sysctl.h>
  59. #include <linux/moduleparam.h>
  60. #include <linux/jiffies.h>
  61. #include <asm/page.h>
  62. #include <asm/tlb.h>
  63. #include <asm/xen/hypervisor.h>
  64. #include <asm/xen/hypercall.h>
  65. #include <xen/xen.h>
  66. #include <xen/interface/xen.h>
  67. #include <xen/interface/memory.h>
  68. #include <xen/balloon.h>
  69. #include <xen/features.h>
  70. #include <xen/page.h>
  71. #include <xen/mem-reservation.h>
  72. #undef MODULE_PARAM_PREFIX
  73. #define MODULE_PARAM_PREFIX "xen."
  74. static uint __read_mostly balloon_boot_timeout = 180;
  75. module_param(balloon_boot_timeout, uint, 0444);
  76. #ifdef CONFIG_XEN_BALLOON_MEMORY_HOTPLUG
  77. static int xen_hotplug_unpopulated;
  78. static struct ctl_table balloon_table[] = {
  79. {
  80. .procname = "hotplug_unpopulated",
  81. .data = &xen_hotplug_unpopulated,
  82. .maxlen = sizeof(int),
  83. .mode = 0644,
  84. .proc_handler = proc_dointvec_minmax,
  85. .extra1 = SYSCTL_ZERO,
  86. .extra2 = SYSCTL_ONE,
  87. },
  88. };
  89. #else
  90. #define xen_hotplug_unpopulated 0
  91. #endif
  92. /*
  93. * Use one extent per PAGE_SIZE to avoid to break down the page into
  94. * multiple frame.
  95. */
  96. #define EXTENT_ORDER (fls(XEN_PFN_PER_PAGE) - 1)
  97. /*
  98. * balloon_thread() state:
  99. *
  100. * BP_DONE: done or nothing to do,
  101. * BP_WAIT: wait to be rescheduled,
  102. * BP_EAGAIN: error, go to sleep,
  103. * BP_ECANCELED: error, balloon operation canceled.
  104. */
  105. static enum bp_state {
  106. BP_DONE,
  107. BP_WAIT,
  108. BP_EAGAIN,
  109. BP_ECANCELED
  110. } balloon_state = BP_DONE;
  111. /* Main waiting point for xen-balloon thread. */
  112. static DECLARE_WAIT_QUEUE_HEAD(balloon_thread_wq);
  113. static DEFINE_MUTEX(balloon_mutex);
  114. struct balloon_stats balloon_stats;
  115. EXPORT_SYMBOL_GPL(balloon_stats);
  116. /* We increase/decrease in batches which fit in a page */
  117. static xen_pfn_t frame_list[PAGE_SIZE / sizeof(xen_pfn_t)];
  118. /* List of ballooned pages, threaded through the mem_map array. */
  119. static LIST_HEAD(ballooned_pages);
  120. static DECLARE_WAIT_QUEUE_HEAD(balloon_wq);
  121. /* When ballooning out (allocating memory to return to Xen) we don't really
  122. want the kernel to try too hard since that can trigger the oom killer. */
  123. #define GFP_BALLOON \
  124. (GFP_HIGHUSER | __GFP_NOWARN | __GFP_NORETRY | __GFP_NOMEMALLOC)
  125. /* balloon_append: add the given page to the balloon. */
  126. static void balloon_append(struct page *page)
  127. {
  128. if (!PageOffline(page))
  129. __SetPageOffline(page);
  130. /* Lowmem is re-populated first, so highmem pages go at list tail. */
  131. if (PageHighMem(page)) {
  132. list_add_tail(&page->lru, &ballooned_pages);
  133. balloon_stats.balloon_high++;
  134. } else {
  135. list_add(&page->lru, &ballooned_pages);
  136. balloon_stats.balloon_low++;
  137. }
  138. wake_up(&balloon_wq);
  139. }
  140. /* balloon_retrieve: rescue a page from the balloon, if it is not empty. */
  141. static struct page *balloon_retrieve(bool require_lowmem)
  142. {
  143. struct page *page;
  144. if (list_empty(&ballooned_pages))
  145. return NULL;
  146. page = list_entry(ballooned_pages.next, struct page, lru);
  147. if (require_lowmem && PageHighMem(page))
  148. return NULL;
  149. list_del(&page->lru);
  150. if (PageHighMem(page))
  151. balloon_stats.balloon_high--;
  152. else
  153. balloon_stats.balloon_low--;
  154. __ClearPageOffline(page);
  155. return page;
  156. }
  157. static struct page *balloon_next_page(struct page *page)
  158. {
  159. struct list_head *next = page->lru.next;
  160. if (next == &ballooned_pages)
  161. return NULL;
  162. return list_entry(next, struct page, lru);
  163. }
  164. static void update_schedule(void)
  165. {
  166. if (balloon_state == BP_WAIT || balloon_state == BP_ECANCELED)
  167. return;
  168. if (balloon_state == BP_DONE) {
  169. balloon_stats.schedule_delay = 1;
  170. balloon_stats.retry_count = 1;
  171. return;
  172. }
  173. ++balloon_stats.retry_count;
  174. if (balloon_stats.max_retry_count != RETRY_UNLIMITED &&
  175. balloon_stats.retry_count > balloon_stats.max_retry_count) {
  176. balloon_stats.schedule_delay = 1;
  177. balloon_stats.retry_count = 1;
  178. balloon_state = BP_ECANCELED;
  179. return;
  180. }
  181. balloon_stats.schedule_delay <<= 1;
  182. if (balloon_stats.schedule_delay > balloon_stats.max_schedule_delay)
  183. balloon_stats.schedule_delay = balloon_stats.max_schedule_delay;
  184. balloon_state = BP_EAGAIN;
  185. }
  186. #ifdef CONFIG_XEN_BALLOON_MEMORY_HOTPLUG
  187. static void release_memory_resource(struct resource *resource)
  188. {
  189. if (!resource)
  190. return;
  191. /*
  192. * No need to reset region to identity mapped since we now
  193. * know that no I/O can be in this region
  194. */
  195. release_resource(resource);
  196. kfree(resource);
  197. }
  198. static struct resource *additional_memory_resource(phys_addr_t size)
  199. {
  200. struct resource *res;
  201. int ret;
  202. res = kzalloc(sizeof(*res), GFP_KERNEL);
  203. if (!res)
  204. return NULL;
  205. res->name = "System RAM";
  206. res->flags = IORESOURCE_SYSTEM_RAM | IORESOURCE_BUSY;
  207. ret = allocate_resource(&iomem_resource, res,
  208. size, 0, -1,
  209. PAGES_PER_SECTION * PAGE_SIZE, NULL, NULL);
  210. if (ret < 0) {
  211. pr_err("Cannot allocate new System RAM resource\n");
  212. kfree(res);
  213. return NULL;
  214. }
  215. return res;
  216. }
  217. static enum bp_state reserve_additional_memory(void)
  218. {
  219. long credit;
  220. struct resource *resource;
  221. int nid, rc;
  222. unsigned long balloon_hotplug;
  223. credit = balloon_stats.target_pages + balloon_stats.target_unpopulated
  224. - balloon_stats.total_pages;
  225. /*
  226. * Already hotplugged enough pages? Wait for them to be
  227. * onlined.
  228. */
  229. if (credit <= 0)
  230. return BP_WAIT;
  231. balloon_hotplug = round_up(credit, PAGES_PER_SECTION);
  232. resource = additional_memory_resource(balloon_hotplug * PAGE_SIZE);
  233. if (!resource)
  234. goto err;
  235. nid = memory_add_physaddr_to_nid(resource->start);
  236. #ifdef CONFIG_XEN_HAVE_PVMMU
  237. /*
  238. * We don't support PV MMU when Linux and Xen is using
  239. * different page granularity.
  240. */
  241. BUILD_BUG_ON(XEN_PAGE_SIZE != PAGE_SIZE);
  242. /*
  243. * add_memory() will build page tables for the new memory so
  244. * the p2m must contain invalid entries so the correct
  245. * non-present PTEs will be written.
  246. *
  247. * If a failure occurs, the original (identity) p2m entries
  248. * are not restored since this region is now known not to
  249. * conflict with any devices.
  250. */
  251. if (!xen_feature(XENFEAT_auto_translated_physmap)) {
  252. unsigned long pfn, i;
  253. pfn = PFN_DOWN(resource->start);
  254. for (i = 0; i < balloon_hotplug; i++) {
  255. if (!set_phys_to_machine(pfn + i, INVALID_P2M_ENTRY)) {
  256. pr_warn("set_phys_to_machine() failed, no memory added\n");
  257. goto err;
  258. }
  259. }
  260. }
  261. #endif
  262. /*
  263. * add_memory_resource() will call online_pages() which in its turn
  264. * will call xen_online_page() callback causing deadlock if we don't
  265. * release balloon_mutex here. Unlocking here is safe because the
  266. * callers drop the mutex before trying again.
  267. */
  268. mutex_unlock(&balloon_mutex);
  269. /* add_memory_resource() requires the device_hotplug lock */
  270. lock_device_hotplug();
  271. rc = add_memory_resource(nid, resource, MHP_MERGE_RESOURCE);
  272. unlock_device_hotplug();
  273. mutex_lock(&balloon_mutex);
  274. if (rc) {
  275. pr_warn("Cannot add additional memory (%i)\n", rc);
  276. goto err;
  277. }
  278. balloon_stats.total_pages += balloon_hotplug;
  279. return BP_WAIT;
  280. err:
  281. release_memory_resource(resource);
  282. return BP_ECANCELED;
  283. }
  284. static void xen_online_page(struct page *page, unsigned int order)
  285. {
  286. unsigned long i, size = (1 << order);
  287. unsigned long start_pfn = page_to_pfn(page);
  288. struct page *p;
  289. pr_debug("Online %lu pages starting at pfn 0x%lx\n", size, start_pfn);
  290. mutex_lock(&balloon_mutex);
  291. for (i = 0; i < size; i++) {
  292. p = pfn_to_page(start_pfn + i);
  293. balloon_append(p);
  294. }
  295. mutex_unlock(&balloon_mutex);
  296. }
  297. static int xen_memory_notifier(struct notifier_block *nb, unsigned long val, void *v)
  298. {
  299. if (val == MEM_ONLINE)
  300. wake_up(&balloon_thread_wq);
  301. return NOTIFY_OK;
  302. }
  303. static struct notifier_block xen_memory_nb = {
  304. .notifier_call = xen_memory_notifier,
  305. .priority = 0
  306. };
  307. #else
  308. static enum bp_state reserve_additional_memory(void)
  309. {
  310. balloon_stats.target_pages = balloon_stats.current_pages +
  311. balloon_stats.target_unpopulated;
  312. return BP_ECANCELED;
  313. }
  314. #endif /* CONFIG_XEN_BALLOON_MEMORY_HOTPLUG */
  315. static long current_credit(void)
  316. {
  317. return balloon_stats.target_pages - balloon_stats.current_pages;
  318. }
  319. static bool balloon_is_inflated(void)
  320. {
  321. return balloon_stats.balloon_low || balloon_stats.balloon_high;
  322. }
  323. static enum bp_state increase_reservation(unsigned long nr_pages)
  324. {
  325. int rc;
  326. unsigned long i;
  327. struct page *page;
  328. if (nr_pages > ARRAY_SIZE(frame_list))
  329. nr_pages = ARRAY_SIZE(frame_list);
  330. page = list_first_entry_or_null(&ballooned_pages, struct page, lru);
  331. for (i = 0; i < nr_pages; i++) {
  332. if (!page) {
  333. nr_pages = i;
  334. break;
  335. }
  336. frame_list[i] = page_to_xen_pfn(page);
  337. page = balloon_next_page(page);
  338. }
  339. rc = xenmem_reservation_increase(nr_pages, frame_list);
  340. if (rc <= 0)
  341. return BP_EAGAIN;
  342. for (i = 0; i < rc; i++) {
  343. page = balloon_retrieve(false);
  344. BUG_ON(page == NULL);
  345. xenmem_reservation_va_mapping_update(1, &page, &frame_list[i]);
  346. /*
  347. * Relinquish the page back to the allocator. Note that
  348. * some pages, including ones added via xen_online_page(), might
  349. * not be marked reserved; free_reserved_page() will handle that.
  350. */
  351. free_reserved_page(page);
  352. }
  353. balloon_stats.current_pages += rc;
  354. return BP_DONE;
  355. }
  356. static enum bp_state decrease_reservation(unsigned long nr_pages, gfp_t gfp)
  357. {
  358. enum bp_state state = BP_DONE;
  359. unsigned long i;
  360. struct page *page, *tmp;
  361. int ret;
  362. LIST_HEAD(pages);
  363. if (nr_pages > ARRAY_SIZE(frame_list))
  364. nr_pages = ARRAY_SIZE(frame_list);
  365. for (i = 0; i < nr_pages; i++) {
  366. page = alloc_page(gfp);
  367. if (page == NULL) {
  368. nr_pages = i;
  369. state = BP_EAGAIN;
  370. break;
  371. }
  372. adjust_managed_page_count(page, -1);
  373. xenmem_reservation_scrub_page(page);
  374. list_add(&page->lru, &pages);
  375. }
  376. /*
  377. * Ensure that ballooned highmem pages don't have kmaps.
  378. *
  379. * Do this before changing the p2m as kmap_flush_unused()
  380. * reads PTEs to obtain pages (and hence needs the original
  381. * p2m entry).
  382. */
  383. kmap_flush_unused();
  384. /*
  385. * Setup the frame, update direct mapping, invalidate P2M,
  386. * and add to balloon.
  387. */
  388. i = 0;
  389. list_for_each_entry_safe(page, tmp, &pages, lru) {
  390. frame_list[i++] = xen_page_to_gfn(page);
  391. xenmem_reservation_va_mapping_reset(1, &page);
  392. list_del(&page->lru);
  393. balloon_append(page);
  394. }
  395. flush_tlb_all();
  396. ret = xenmem_reservation_decrease(nr_pages, frame_list);
  397. BUG_ON(ret != nr_pages);
  398. balloon_stats.current_pages -= nr_pages;
  399. return state;
  400. }
  401. /*
  402. * Stop waiting if either state is BP_DONE and ballooning action is
  403. * needed, or if the credit has changed while state is not BP_DONE.
  404. */
  405. static bool balloon_thread_cond(long credit)
  406. {
  407. if (balloon_state == BP_DONE)
  408. credit = 0;
  409. return current_credit() != credit || kthread_should_stop();
  410. }
  411. /*
  412. * As this is a kthread it is guaranteed to run as a single instance only.
  413. * We may of course race updates of the target counts (which are protected
  414. * by the balloon lock), or with changes to the Xen hard limit, but we will
  415. * recover from these in time.
  416. */
  417. static int balloon_thread(void *unused)
  418. {
  419. long credit;
  420. unsigned long timeout;
  421. set_freezable();
  422. for (;;) {
  423. switch (balloon_state) {
  424. case BP_DONE:
  425. case BP_ECANCELED:
  426. timeout = 3600 * HZ;
  427. break;
  428. case BP_EAGAIN:
  429. timeout = balloon_stats.schedule_delay * HZ;
  430. break;
  431. case BP_WAIT:
  432. timeout = HZ;
  433. break;
  434. }
  435. credit = current_credit();
  436. wait_event_freezable_timeout(balloon_thread_wq,
  437. balloon_thread_cond(credit), timeout);
  438. if (kthread_should_stop())
  439. return 0;
  440. mutex_lock(&balloon_mutex);
  441. credit = current_credit();
  442. if (credit > 0) {
  443. if (balloon_is_inflated())
  444. balloon_state = increase_reservation(credit);
  445. else
  446. balloon_state = reserve_additional_memory();
  447. }
  448. if (credit < 0) {
  449. long n_pages;
  450. n_pages = min(-credit, si_mem_available());
  451. balloon_state = decrease_reservation(n_pages,
  452. GFP_BALLOON);
  453. if (balloon_state == BP_DONE && n_pages != -credit &&
  454. n_pages < totalreserve_pages)
  455. balloon_state = BP_EAGAIN;
  456. }
  457. update_schedule();
  458. mutex_unlock(&balloon_mutex);
  459. cond_resched();
  460. }
  461. }
  462. /* Resets the Xen limit, sets new target, and kicks off processing. */
  463. void balloon_set_new_target(unsigned long target)
  464. {
  465. /* No need for lock. Not read-modify-write updates. */
  466. balloon_stats.target_pages = target;
  467. wake_up(&balloon_thread_wq);
  468. }
  469. EXPORT_SYMBOL_GPL(balloon_set_new_target);
  470. static int add_ballooned_pages(unsigned int nr_pages)
  471. {
  472. enum bp_state st;
  473. if (xen_hotplug_unpopulated) {
  474. st = reserve_additional_memory();
  475. if (st != BP_ECANCELED) {
  476. int rc;
  477. mutex_unlock(&balloon_mutex);
  478. rc = wait_event_interruptible(balloon_wq,
  479. !list_empty(&ballooned_pages));
  480. mutex_lock(&balloon_mutex);
  481. return rc ? -ENOMEM : 0;
  482. }
  483. }
  484. if (si_mem_available() < nr_pages)
  485. return -ENOMEM;
  486. st = decrease_reservation(nr_pages, GFP_USER);
  487. if (st != BP_DONE)
  488. return -ENOMEM;
  489. return 0;
  490. }
  491. /**
  492. * xen_alloc_ballooned_pages - get pages that have been ballooned out
  493. * @nr_pages: Number of pages to get
  494. * @pages: pages returned
  495. * @return 0 on success, error otherwise
  496. */
  497. int xen_alloc_ballooned_pages(unsigned int nr_pages, struct page **pages)
  498. {
  499. unsigned int pgno = 0;
  500. struct page *page;
  501. int ret;
  502. mutex_lock(&balloon_mutex);
  503. balloon_stats.target_unpopulated += nr_pages;
  504. while (pgno < nr_pages) {
  505. page = balloon_retrieve(true);
  506. if (page) {
  507. pages[pgno++] = page;
  508. #ifdef CONFIG_XEN_HAVE_PVMMU
  509. /*
  510. * We don't support PV MMU when Linux and Xen is using
  511. * different page granularity.
  512. */
  513. BUILD_BUG_ON(XEN_PAGE_SIZE != PAGE_SIZE);
  514. if (!xen_feature(XENFEAT_auto_translated_physmap)) {
  515. ret = xen_alloc_p2m_entry(page_to_pfn(page));
  516. if (ret < 0)
  517. goto out_undo;
  518. }
  519. #endif
  520. } else {
  521. ret = add_ballooned_pages(nr_pages - pgno);
  522. if (ret < 0)
  523. goto out_undo;
  524. }
  525. }
  526. mutex_unlock(&balloon_mutex);
  527. return 0;
  528. out_undo:
  529. mutex_unlock(&balloon_mutex);
  530. xen_free_ballooned_pages(pgno, pages);
  531. /*
  532. * NB: xen_free_ballooned_pages will only subtract pgno pages, but since
  533. * target_unpopulated is incremented with nr_pages at the start we need
  534. * to remove the remaining ones also, or accounting will be screwed.
  535. */
  536. balloon_stats.target_unpopulated -= nr_pages - pgno;
  537. return ret;
  538. }
  539. EXPORT_SYMBOL(xen_alloc_ballooned_pages);
  540. /**
  541. * xen_free_ballooned_pages - return pages retrieved with get_ballooned_pages
  542. * @nr_pages: Number of pages
  543. * @pages: pages to return
  544. */
  545. void xen_free_ballooned_pages(unsigned int nr_pages, struct page **pages)
  546. {
  547. unsigned int i;
  548. mutex_lock(&balloon_mutex);
  549. for (i = 0; i < nr_pages; i++) {
  550. if (pages[i])
  551. balloon_append(pages[i]);
  552. }
  553. balloon_stats.target_unpopulated -= nr_pages;
  554. /* The balloon may be too large now. Shrink it if needed. */
  555. if (current_credit())
  556. wake_up(&balloon_thread_wq);
  557. mutex_unlock(&balloon_mutex);
  558. }
  559. EXPORT_SYMBOL(xen_free_ballooned_pages);
  560. static void __init balloon_add_regions(void)
  561. {
  562. unsigned long start_pfn, pages;
  563. unsigned long pfn, extra_pfn_end;
  564. unsigned int i;
  565. for (i = 0; i < XEN_EXTRA_MEM_MAX_REGIONS; i++) {
  566. pages = xen_extra_mem[i].n_pfns;
  567. if (!pages)
  568. continue;
  569. start_pfn = xen_extra_mem[i].start_pfn;
  570. /*
  571. * If the amount of usable memory has been limited (e.g., with
  572. * the 'mem' command line parameter), don't add pages beyond
  573. * this limit.
  574. */
  575. extra_pfn_end = min(max_pfn, start_pfn + pages);
  576. for (pfn = start_pfn; pfn < extra_pfn_end; pfn++)
  577. balloon_append(pfn_to_page(pfn));
  578. balloon_stats.total_pages += extra_pfn_end - start_pfn;
  579. }
  580. }
  581. static int __init balloon_init(void)
  582. {
  583. struct task_struct *task;
  584. if (!xen_domain())
  585. return -ENODEV;
  586. pr_info("Initialising balloon driver\n");
  587. #ifdef CONFIG_XEN_PV
  588. balloon_stats.current_pages = xen_pv_domain()
  589. ? min(xen_start_info->nr_pages - xen_released_pages, max_pfn)
  590. : get_num_physpages();
  591. #else
  592. balloon_stats.current_pages = get_num_physpages();
  593. #endif
  594. balloon_stats.target_pages = balloon_stats.current_pages;
  595. balloon_stats.balloon_low = 0;
  596. balloon_stats.balloon_high = 0;
  597. balloon_stats.total_pages = balloon_stats.current_pages;
  598. balloon_stats.schedule_delay = 1;
  599. balloon_stats.max_schedule_delay = 32;
  600. balloon_stats.retry_count = 1;
  601. balloon_stats.max_retry_count = 4;
  602. #ifdef CONFIG_XEN_BALLOON_MEMORY_HOTPLUG
  603. set_online_page_callback(&xen_online_page);
  604. register_memory_notifier(&xen_memory_nb);
  605. register_sysctl_init("xen/balloon", balloon_table);
  606. #endif
  607. balloon_add_regions();
  608. task = kthread_run(balloon_thread, NULL, "xen-balloon");
  609. if (IS_ERR(task)) {
  610. pr_err("xen-balloon thread could not be started, ballooning will not work!\n");
  611. return PTR_ERR(task);
  612. }
  613. /* Init the xen-balloon driver. */
  614. xen_balloon_init();
  615. return 0;
  616. }
  617. subsys_initcall(balloon_init);
  618. static int __init balloon_wait_finish(void)
  619. {
  620. long credit, last_credit = 0;
  621. unsigned long last_changed = 0;
  622. if (!xen_domain())
  623. return -ENODEV;
  624. /* PV guests don't need to wait. */
  625. if (xen_pv_domain() || !current_credit())
  626. return 0;
  627. pr_notice("Waiting for initial ballooning down having finished.\n");
  628. while ((credit = current_credit()) < 0) {
  629. if (credit != last_credit) {
  630. last_changed = jiffies;
  631. last_credit = credit;
  632. }
  633. if (balloon_state == BP_ECANCELED) {
  634. pr_warn_once("Initial ballooning failed, %ld pages need to be freed.\n",
  635. -credit);
  636. if (time_is_before_eq_jiffies(last_changed + HZ * balloon_boot_timeout))
  637. panic("Initial ballooning failed!\n");
  638. }
  639. schedule_timeout_interruptible(HZ / 10);
  640. }
  641. pr_notice("Initial ballooning down finished.\n");
  642. return 0;
  643. }
  644. late_initcall_sync(balloon_wait_finish);