|  | /* | 
|  | * mm/balloon_compaction.c | 
|  | * | 
|  | * Common interface for making balloon pages movable by compaction. | 
|  | * | 
|  | * Copyright (C) 2012, Red Hat, Inc.  Rafael Aquini <aquini@redhat.com> | 
|  | */ | 
|  | #include <linux/mm.h> | 
|  | #include <linux/slab.h> | 
|  | #include <linux/export.h> | 
|  | #include <linux/balloon_compaction.h> | 
|  |  | 
|  | /* | 
|  | * balloon_devinfo_alloc - allocates a balloon device information descriptor. | 
|  | * @balloon_dev_descriptor: pointer to reference the balloon device which | 
|  | *                          this struct balloon_dev_info will be servicing. | 
|  | * | 
|  | * Driver must call it to properly allocate and initialize an instance of | 
|  | * struct balloon_dev_info which will be used to reference a balloon device | 
|  | * as well as to keep track of the balloon device page list. | 
|  | */ | 
|  | struct balloon_dev_info *balloon_devinfo_alloc(void *balloon_dev_descriptor) | 
|  | { | 
|  | struct balloon_dev_info *b_dev_info; | 
|  | b_dev_info = kmalloc(sizeof(*b_dev_info), GFP_KERNEL); | 
|  | if (!b_dev_info) | 
|  | return ERR_PTR(-ENOMEM); | 
|  |  | 
|  | b_dev_info->balloon_device = balloon_dev_descriptor; | 
|  | b_dev_info->mapping = NULL; | 
|  | b_dev_info->isolated_pages = 0; | 
|  | spin_lock_init(&b_dev_info->pages_lock); | 
|  | INIT_LIST_HEAD(&b_dev_info->pages); | 
|  |  | 
|  | return b_dev_info; | 
|  | } | 
|  | EXPORT_SYMBOL_GPL(balloon_devinfo_alloc); | 
|  |  | 
|  | /* | 
|  | * balloon_page_enqueue - allocates a new page and inserts it into the balloon | 
|  | *			  page list. | 
|  | * @b_dev_info: balloon device decriptor where we will insert a new page to | 
|  | * | 
|  | * Driver must call it to properly allocate a new enlisted balloon page | 
|  | * before definetively removing it from the guest system. | 
|  | * This function returns the page address for the recently enqueued page or | 
|  | * NULL in the case we fail to allocate a new page this turn. | 
|  | */ | 
|  | struct page *balloon_page_enqueue(struct balloon_dev_info *b_dev_info) | 
|  | { | 
|  | unsigned long flags; | 
|  | struct page *page = alloc_page(balloon_mapping_gfp_mask() | | 
|  | __GFP_NOMEMALLOC | __GFP_NORETRY); | 
|  | if (!page) | 
|  | return NULL; | 
|  |  | 
|  | /* | 
|  | * Block others from accessing the 'page' when we get around to | 
|  | * establishing additional references. We should be the only one | 
|  | * holding a reference to the 'page' at this point. | 
|  | */ | 
|  | BUG_ON(!trylock_page(page)); | 
|  | spin_lock_irqsave(&b_dev_info->pages_lock, flags); | 
|  | balloon_page_insert(page, b_dev_info->mapping, &b_dev_info->pages); | 
|  | spin_unlock_irqrestore(&b_dev_info->pages_lock, flags); | 
|  | unlock_page(page); | 
|  | return page; | 
|  | } | 
|  | EXPORT_SYMBOL_GPL(balloon_page_enqueue); | 
|  |  | 
|  | /* | 
|  | * balloon_page_dequeue - removes a page from balloon's page list and returns | 
|  | *			  the its address to allow the driver release the page. | 
|  | * @b_dev_info: balloon device decriptor where we will grab a page from. | 
|  | * | 
|  | * Driver must call it to properly de-allocate a previous enlisted balloon page | 
|  | * before definetively releasing it back to the guest system. | 
|  | * This function returns the page address for the recently dequeued page or | 
|  | * NULL in the case we find balloon's page list temporarily empty due to | 
|  | * compaction isolated pages. | 
|  | */ | 
|  | struct page *balloon_page_dequeue(struct balloon_dev_info *b_dev_info) | 
|  | { | 
|  | struct page *page, *tmp; | 
|  | unsigned long flags; | 
|  | bool dequeued_page; | 
|  |  | 
|  | dequeued_page = false; | 
|  | list_for_each_entry_safe(page, tmp, &b_dev_info->pages, lru) { | 
|  | /* | 
|  | * Block others from accessing the 'page' while we get around | 
|  | * establishing additional references and preparing the 'page' | 
|  | * to be released by the balloon driver. | 
|  | */ | 
|  | if (trylock_page(page)) { | 
|  | spin_lock_irqsave(&b_dev_info->pages_lock, flags); | 
|  | /* | 
|  | * Raise the page refcount here to prevent any wrong | 
|  | * attempt to isolate this page, in case of coliding | 
|  | * with balloon_page_isolate() just after we release | 
|  | * the page lock. | 
|  | * | 
|  | * balloon_page_free() will take care of dropping | 
|  | * this extra refcount later. | 
|  | */ | 
|  | get_page(page); | 
|  | balloon_page_delete(page); | 
|  | spin_unlock_irqrestore(&b_dev_info->pages_lock, flags); | 
|  | unlock_page(page); | 
|  | dequeued_page = true; | 
|  | break; | 
|  | } | 
|  | } | 
|  |  | 
|  | if (!dequeued_page) { | 
|  | /* | 
|  | * If we are unable to dequeue a balloon page because the page | 
|  | * list is empty and there is no isolated pages, then something | 
|  | * went out of track and some balloon pages are lost. | 
|  | * BUG() here, otherwise the balloon driver may get stuck into | 
|  | * an infinite loop while attempting to release all its pages. | 
|  | */ | 
|  | spin_lock_irqsave(&b_dev_info->pages_lock, flags); | 
|  | if (unlikely(list_empty(&b_dev_info->pages) && | 
|  | !b_dev_info->isolated_pages)) | 
|  | BUG(); | 
|  | spin_unlock_irqrestore(&b_dev_info->pages_lock, flags); | 
|  | page = NULL; | 
|  | } | 
|  | return page; | 
|  | } | 
|  | EXPORT_SYMBOL_GPL(balloon_page_dequeue); | 
|  |  | 
|  | #ifdef CONFIG_BALLOON_COMPACTION | 
|  | /* | 
|  | * balloon_mapping_alloc - allocates a special ->mapping for ballooned pages. | 
|  | * @b_dev_info: holds the balloon device information descriptor. | 
|  | * @a_ops: balloon_mapping address_space_operations descriptor. | 
|  | * | 
|  | * Driver must call it to properly allocate and initialize an instance of | 
|  | * struct address_space which will be used as the special page->mapping for | 
|  | * balloon device enlisted page instances. | 
|  | */ | 
|  | struct address_space *balloon_mapping_alloc(struct balloon_dev_info *b_dev_info, | 
|  | const struct address_space_operations *a_ops) | 
|  | { | 
|  | struct address_space *mapping; | 
|  |  | 
|  | mapping = kmalloc(sizeof(*mapping), GFP_KERNEL); | 
|  | if (!mapping) | 
|  | return ERR_PTR(-ENOMEM); | 
|  |  | 
|  | /* | 
|  | * Give a clean 'zeroed' status to all elements of this special | 
|  | * balloon page->mapping struct address_space instance. | 
|  | */ | 
|  | address_space_init_once(mapping); | 
|  |  | 
|  | /* | 
|  | * Set mapping->flags appropriately, to allow balloon pages | 
|  | * ->mapping identification. | 
|  | */ | 
|  | mapping_set_balloon(mapping); | 
|  | mapping_set_gfp_mask(mapping, balloon_mapping_gfp_mask()); | 
|  |  | 
|  | /* balloon's page->mapping->a_ops callback descriptor */ | 
|  | mapping->a_ops = a_ops; | 
|  |  | 
|  | /* | 
|  | * Establish a pointer reference back to the balloon device descriptor | 
|  | * this particular page->mapping will be servicing. | 
|  | * This is used by compaction / migration procedures to identify and | 
|  | * access the balloon device pageset while isolating / migrating pages. | 
|  | * | 
|  | * As some balloon drivers can register multiple balloon devices | 
|  | * for a single guest, this also helps compaction / migration to | 
|  | * properly deal with multiple balloon pagesets, when required. | 
|  | */ | 
|  | mapping->private_data = b_dev_info; | 
|  | b_dev_info->mapping = mapping; | 
|  |  | 
|  | return mapping; | 
|  | } | 
|  | EXPORT_SYMBOL_GPL(balloon_mapping_alloc); | 
|  |  | 
|  | static inline void __isolate_balloon_page(struct page *page) | 
|  | { | 
|  | struct balloon_dev_info *b_dev_info = page->mapping->private_data; | 
|  | unsigned long flags; | 
|  | spin_lock_irqsave(&b_dev_info->pages_lock, flags); | 
|  | list_del(&page->lru); | 
|  | b_dev_info->isolated_pages++; | 
|  | spin_unlock_irqrestore(&b_dev_info->pages_lock, flags); | 
|  | } | 
|  |  | 
|  | static inline void __putback_balloon_page(struct page *page) | 
|  | { | 
|  | struct balloon_dev_info *b_dev_info = page->mapping->private_data; | 
|  | unsigned long flags; | 
|  | spin_lock_irqsave(&b_dev_info->pages_lock, flags); | 
|  | list_add(&page->lru, &b_dev_info->pages); | 
|  | b_dev_info->isolated_pages--; | 
|  | spin_unlock_irqrestore(&b_dev_info->pages_lock, flags); | 
|  | } | 
|  |  | 
|  | static inline int __migrate_balloon_page(struct address_space *mapping, | 
|  | struct page *newpage, struct page *page, enum migrate_mode mode) | 
|  | { | 
|  | return page->mapping->a_ops->migratepage(mapping, newpage, page, mode); | 
|  | } | 
|  |  | 
|  | /* __isolate_lru_page() counterpart for a ballooned page */ | 
|  | bool balloon_page_isolate(struct page *page) | 
|  | { | 
|  | /* | 
|  | * Avoid burning cycles with pages that are yet under __free_pages(), | 
|  | * or just got freed under us. | 
|  | * | 
|  | * In case we 'win' a race for a balloon page being freed under us and | 
|  | * raise its refcount preventing __free_pages() from doing its job | 
|  | * the put_page() at the end of this block will take care of | 
|  | * release this page, thus avoiding a nasty leakage. | 
|  | */ | 
|  | if (likely(get_page_unless_zero(page))) { | 
|  | /* | 
|  | * As balloon pages are not isolated from LRU lists, concurrent | 
|  | * compaction threads can race against page migration functions | 
|  | * as well as race against the balloon driver releasing a page. | 
|  | * | 
|  | * In order to avoid having an already isolated balloon page | 
|  | * being (wrongly) re-isolated while it is under migration, | 
|  | * or to avoid attempting to isolate pages being released by | 
|  | * the balloon driver, lets be sure we have the page lock | 
|  | * before proceeding with the balloon page isolation steps. | 
|  | */ | 
|  | if (likely(trylock_page(page))) { | 
|  | /* | 
|  | * A ballooned page, by default, has just one refcount. | 
|  | * Prevent concurrent compaction threads from isolating | 
|  | * an already isolated balloon page by refcount check. | 
|  | */ | 
|  | if (__is_movable_balloon_page(page) && | 
|  | page_count(page) == 2) { | 
|  | __isolate_balloon_page(page); | 
|  | unlock_page(page); | 
|  | return true; | 
|  | } | 
|  | unlock_page(page); | 
|  | } | 
|  | put_page(page); | 
|  | } | 
|  | return false; | 
|  | } | 
|  |  | 
|  | /* putback_lru_page() counterpart for a ballooned page */ | 
|  | void balloon_page_putback(struct page *page) | 
|  | { | 
|  | /* | 
|  | * 'lock_page()' stabilizes the page and prevents races against | 
|  | * concurrent isolation threads attempting to re-isolate it. | 
|  | */ | 
|  | lock_page(page); | 
|  |  | 
|  | if (__is_movable_balloon_page(page)) { | 
|  | __putback_balloon_page(page); | 
|  | /* drop the extra ref count taken for page isolation */ | 
|  | put_page(page); | 
|  | } else { | 
|  | WARN_ON(1); | 
|  | dump_page(page, "not movable balloon page"); | 
|  | } | 
|  | unlock_page(page); | 
|  | } | 
|  |  | 
|  | /* move_to_new_page() counterpart for a ballooned page */ | 
|  | int balloon_page_migrate(struct page *newpage, | 
|  | struct page *page, enum migrate_mode mode) | 
|  | { | 
|  | struct address_space *mapping; | 
|  | int rc = -EAGAIN; | 
|  |  | 
|  | /* | 
|  | * Block others from accessing the 'newpage' when we get around to | 
|  | * establishing additional references. We should be the only one | 
|  | * holding a reference to the 'newpage' at this point. | 
|  | */ | 
|  | BUG_ON(!trylock_page(newpage)); | 
|  |  | 
|  | if (WARN_ON(!__is_movable_balloon_page(page))) { | 
|  | dump_page(page, "not movable balloon page"); | 
|  | unlock_page(newpage); | 
|  | return rc; | 
|  | } | 
|  |  | 
|  | mapping = page->mapping; | 
|  | if (mapping) | 
|  | rc = __migrate_balloon_page(mapping, newpage, page, mode); | 
|  |  | 
|  | unlock_page(newpage); | 
|  | return rc; | 
|  | } | 
|  | #endif /* CONFIG_BALLOON_COMPACTION */ |