303 lines
		
	
	
	
		
			9.6 KiB
			
		
	
	
	
		
			C
		
	
	
	
	
	
		
		
			
		
	
	
			303 lines
		
	
	
	
		
			9.6 KiB
			
		
	
	
	
		
			C
		
	
	
	
	
	
|   | /*
 | ||
|  |  * mm/balloon_compaction.c | ||
|  |  * | ||
|  |  * Common interface for making balloon pages movable by compaction. | ||
|  |  * | ||
|  |  * Copyright (C) 2012, Red Hat, Inc.  Rafael Aquini <aquini@redhat.com> | ||
|  |  */ | ||
|  | #include <linux/mm.h>
 | ||
|  | #include <linux/slab.h>
 | ||
|  | #include <linux/export.h>
 | ||
|  | #include <linux/balloon_compaction.h>
 | ||
|  | 
 | ||
|  | /*
 | ||
|  |  * balloon_devinfo_alloc - allocates a balloon device information descriptor. | ||
|  |  * @balloon_dev_descriptor: pointer to reference the balloon device which | ||
|  |  *                          this struct balloon_dev_info will be servicing. | ||
|  |  * | ||
|  |  * Driver must call it to properly allocate and initialize an instance of | ||
|  |  * struct balloon_dev_info which will be used to reference a balloon device | ||
|  |  * as well as to keep track of the balloon device page list. | ||
|  |  */ | ||
|  | struct balloon_dev_info *balloon_devinfo_alloc(void *balloon_dev_descriptor) | ||
|  | { | ||
|  | 	struct balloon_dev_info *b_dev_info; | ||
|  | 	b_dev_info = kmalloc(sizeof(*b_dev_info), GFP_KERNEL); | ||
|  | 	if (!b_dev_info) | ||
|  | 		return ERR_PTR(-ENOMEM); | ||
|  | 
 | ||
|  | 	b_dev_info->balloon_device = balloon_dev_descriptor; | ||
|  | 	b_dev_info->mapping = NULL; | ||
|  | 	b_dev_info->isolated_pages = 0; | ||
|  | 	spin_lock_init(&b_dev_info->pages_lock); | ||
|  | 	INIT_LIST_HEAD(&b_dev_info->pages); | ||
|  | 
 | ||
|  | 	return b_dev_info; | ||
|  | } | ||
|  | EXPORT_SYMBOL_GPL(balloon_devinfo_alloc); | ||
|  | 
 | ||
|  | /*
 | ||
|  |  * balloon_page_enqueue - allocates a new page and inserts it into the balloon | ||
|  |  *			  page list. | ||
|  |  * @b_dev_info: balloon device decriptor where we will insert a new page to | ||
|  |  * | ||
|  |  * Driver must call it to properly allocate a new enlisted balloon page | ||
|  |  * before definetively removing it from the guest system. | ||
|  |  * This function returns the page address for the recently enqueued page or | ||
|  |  * NULL in the case we fail to allocate a new page this turn. | ||
|  |  */ | ||
|  | struct page *balloon_page_enqueue(struct balloon_dev_info *b_dev_info) | ||
|  | { | ||
|  | 	unsigned long flags; | ||
|  | 	struct page *page = alloc_page(balloon_mapping_gfp_mask() | | ||
|  | 					__GFP_NOMEMALLOC | __GFP_NORETRY); | ||
|  | 	if (!page) | ||
|  | 		return NULL; | ||
|  | 
 | ||
|  | 	/*
 | ||
|  | 	 * Block others from accessing the 'page' when we get around to | ||
|  | 	 * establishing additional references. We should be the only one | ||
|  | 	 * holding a reference to the 'page' at this point. | ||
|  | 	 */ | ||
|  | 	BUG_ON(!trylock_page(page)); | ||
|  | 	spin_lock_irqsave(&b_dev_info->pages_lock, flags); | ||
|  | 	balloon_page_insert(page, b_dev_info->mapping, &b_dev_info->pages); | ||
|  | 	spin_unlock_irqrestore(&b_dev_info->pages_lock, flags); | ||
|  | 	unlock_page(page); | ||
|  | 	return page; | ||
|  | } | ||
|  | EXPORT_SYMBOL_GPL(balloon_page_enqueue); | ||
|  | 
 | ||
|  | /*
 | ||
|  |  * balloon_page_dequeue - removes a page from balloon's page list and returns | ||
|  |  *			  the its address to allow the driver release the page. | ||
|  |  * @b_dev_info: balloon device decriptor where we will grab a page from. | ||
|  |  * | ||
|  |  * Driver must call it to properly de-allocate a previous enlisted balloon page | ||
|  |  * before definetively releasing it back to the guest system. | ||
|  |  * This function returns the page address for the recently dequeued page or | ||
|  |  * NULL in the case we find balloon's page list temporarily empty due to | ||
|  |  * compaction isolated pages. | ||
|  |  */ | ||
|  | struct page *balloon_page_dequeue(struct balloon_dev_info *b_dev_info) | ||
|  | { | ||
|  | 	struct page *page, *tmp; | ||
|  | 	unsigned long flags; | ||
|  | 	bool dequeued_page; | ||
|  | 
 | ||
|  | 	dequeued_page = false; | ||
|  | 	list_for_each_entry_safe(page, tmp, &b_dev_info->pages, lru) { | ||
|  | 		/*
 | ||
|  | 		 * Block others from accessing the 'page' while we get around | ||
|  | 		 * establishing additional references and preparing the 'page' | ||
|  | 		 * to be released by the balloon driver. | ||
|  | 		 */ | ||
|  | 		if (trylock_page(page)) { | ||
|  | 			spin_lock_irqsave(&b_dev_info->pages_lock, flags); | ||
|  | 			/*
 | ||
|  | 			 * Raise the page refcount here to prevent any wrong | ||
|  | 			 * attempt to isolate this page, in case of coliding | ||
|  | 			 * with balloon_page_isolate() just after we release | ||
|  | 			 * the page lock. | ||
|  | 			 * | ||
|  | 			 * balloon_page_free() will take care of dropping | ||
|  | 			 * this extra refcount later. | ||
|  | 			 */ | ||
|  | 			get_page(page); | ||
|  | 			balloon_page_delete(page); | ||
|  | 			spin_unlock_irqrestore(&b_dev_info->pages_lock, flags); | ||
|  | 			unlock_page(page); | ||
|  | 			dequeued_page = true; | ||
|  | 			break; | ||
|  | 		} | ||
|  | 	} | ||
|  | 
 | ||
|  | 	if (!dequeued_page) { | ||
|  | 		/*
 | ||
|  | 		 * If we are unable to dequeue a balloon page because the page | ||
|  | 		 * list is empty and there is no isolated pages, then something | ||
|  | 		 * went out of track and some balloon pages are lost. | ||
|  | 		 * BUG() here, otherwise the balloon driver may get stuck into | ||
|  | 		 * an infinite loop while attempting to release all its pages. | ||
|  | 		 */ | ||
|  | 		spin_lock_irqsave(&b_dev_info->pages_lock, flags); | ||
|  | 		if (unlikely(list_empty(&b_dev_info->pages) && | ||
|  | 			     !b_dev_info->isolated_pages)) | ||
|  | 			BUG(); | ||
|  | 		spin_unlock_irqrestore(&b_dev_info->pages_lock, flags); | ||
|  | 		page = NULL; | ||
|  | 	} | ||
|  | 	return page; | ||
|  | } | ||
|  | EXPORT_SYMBOL_GPL(balloon_page_dequeue); | ||
|  | 
 | ||
|  | #ifdef CONFIG_BALLOON_COMPACTION
 | ||
|  | /*
 | ||
|  |  * balloon_mapping_alloc - allocates a special ->mapping for ballooned pages. | ||
|  |  * @b_dev_info: holds the balloon device information descriptor. | ||
|  |  * @a_ops: balloon_mapping address_space_operations descriptor. | ||
|  |  * | ||
|  |  * Driver must call it to properly allocate and initialize an instance of | ||
|  |  * struct address_space which will be used as the special page->mapping for | ||
|  |  * balloon device enlisted page instances. | ||
|  |  */ | ||
|  | struct address_space *balloon_mapping_alloc(struct balloon_dev_info *b_dev_info, | ||
|  | 				const struct address_space_operations *a_ops) | ||
|  | { | ||
|  | 	struct address_space *mapping; | ||
|  | 
 | ||
|  | 	mapping = kmalloc(sizeof(*mapping), GFP_KERNEL); | ||
|  | 	if (!mapping) | ||
|  | 		return ERR_PTR(-ENOMEM); | ||
|  | 
 | ||
|  | 	/*
 | ||
|  | 	 * Give a clean 'zeroed' status to all elements of this special | ||
|  | 	 * balloon page->mapping struct address_space instance. | ||
|  | 	 */ | ||
|  | 	address_space_init_once(mapping); | ||
|  | 
 | ||
|  | 	/*
 | ||
|  | 	 * Set mapping->flags appropriately, to allow balloon pages | ||
|  | 	 * ->mapping identification. | ||
|  | 	 */ | ||
|  | 	mapping_set_balloon(mapping); | ||
|  | 	mapping_set_gfp_mask(mapping, balloon_mapping_gfp_mask()); | ||
|  | 
 | ||
|  | 	/* balloon's page->mapping->a_ops callback descriptor */ | ||
|  | 	mapping->a_ops = a_ops; | ||
|  | 
 | ||
|  | 	/*
 | ||
|  | 	 * Establish a pointer reference back to the balloon device descriptor | ||
|  | 	 * this particular page->mapping will be servicing. | ||
|  | 	 * This is used by compaction / migration procedures to identify and | ||
|  | 	 * access the balloon device pageset while isolating / migrating pages. | ||
|  | 	 * | ||
|  | 	 * As some balloon drivers can register multiple balloon devices | ||
|  | 	 * for a single guest, this also helps compaction / migration to | ||
|  | 	 * properly deal with multiple balloon pagesets, when required. | ||
|  | 	 */ | ||
|  | 	mapping->private_data = b_dev_info; | ||
|  | 	b_dev_info->mapping = mapping; | ||
|  | 
 | ||
|  | 	return mapping; | ||
|  | } | ||
|  | EXPORT_SYMBOL_GPL(balloon_mapping_alloc); | ||
|  | 
 | ||
|  | static inline void __isolate_balloon_page(struct page *page) | ||
|  | { | ||
|  | 	struct balloon_dev_info *b_dev_info = page->mapping->private_data; | ||
|  | 	unsigned long flags; | ||
|  | 	spin_lock_irqsave(&b_dev_info->pages_lock, flags); | ||
|  | 	list_del(&page->lru); | ||
|  | 	b_dev_info->isolated_pages++; | ||
|  | 	spin_unlock_irqrestore(&b_dev_info->pages_lock, flags); | ||
|  | } | ||
|  | 
 | ||
|  | static inline void __putback_balloon_page(struct page *page) | ||
|  | { | ||
|  | 	struct balloon_dev_info *b_dev_info = page->mapping->private_data; | ||
|  | 	unsigned long flags; | ||
|  | 	spin_lock_irqsave(&b_dev_info->pages_lock, flags); | ||
|  | 	list_add(&page->lru, &b_dev_info->pages); | ||
|  | 	b_dev_info->isolated_pages--; | ||
|  | 	spin_unlock_irqrestore(&b_dev_info->pages_lock, flags); | ||
|  | } | ||
|  | 
 | ||
|  | static inline int __migrate_balloon_page(struct address_space *mapping, | ||
|  | 		struct page *newpage, struct page *page, enum migrate_mode mode) | ||
|  | { | ||
|  | 	return page->mapping->a_ops->migratepage(mapping, newpage, page, mode); | ||
|  | } | ||
|  | 
 | ||
|  | /* __isolate_lru_page() counterpart for a ballooned page */ | ||
|  | bool balloon_page_isolate(struct page *page) | ||
|  | { | ||
|  | 	/*
 | ||
|  | 	 * Avoid burning cycles with pages that are yet under __free_pages(), | ||
|  | 	 * or just got freed under us. | ||
|  | 	 * | ||
|  | 	 * In case we 'win' a race for a balloon page being freed under us and | ||
|  | 	 * raise its refcount preventing __free_pages() from doing its job | ||
|  | 	 * the put_page() at the end of this block will take care of | ||
|  | 	 * release this page, thus avoiding a nasty leakage. | ||
|  | 	 */ | ||
|  | 	if (likely(get_page_unless_zero(page))) { | ||
|  | 		/*
 | ||
|  | 		 * As balloon pages are not isolated from LRU lists, concurrent | ||
|  | 		 * compaction threads can race against page migration functions | ||
|  | 		 * as well as race against the balloon driver releasing a page. | ||
|  | 		 * | ||
|  | 		 * In order to avoid having an already isolated balloon page | ||
|  | 		 * being (wrongly) re-isolated while it is under migration, | ||
|  | 		 * or to avoid attempting to isolate pages being released by | ||
|  | 		 * the balloon driver, lets be sure we have the page lock | ||
|  | 		 * before proceeding with the balloon page isolation steps. | ||
|  | 		 */ | ||
|  | 		if (likely(trylock_page(page))) { | ||
|  | 			/*
 | ||
|  | 			 * A ballooned page, by default, has just one refcount. | ||
|  | 			 * Prevent concurrent compaction threads from isolating | ||
|  | 			 * an already isolated balloon page by refcount check. | ||
|  | 			 */ | ||
|  | 			if (__is_movable_balloon_page(page) && | ||
|  | 			    page_count(page) == 2) { | ||
|  | 				__isolate_balloon_page(page); | ||
|  | 				unlock_page(page); | ||
|  | 				return true; | ||
|  | 			} | ||
|  | 			unlock_page(page); | ||
|  | 		} | ||
|  | 		put_page(page); | ||
|  | 	} | ||
|  | 	return false; | ||
|  | } | ||
|  | 
 | ||
/*
 * balloon_page_putback - putback_lru_page() counterpart for a ballooned page.
 * @page: previously isolated balloon page to return to its page list.
 *
 * If @page does not look like a movable balloon page, a warning is raised and
 * the page is dumped; it is neither put back nor has its refcount dropped.
 */
void balloon_page_putback(struct page *page)
{
	/*
	 * 'lock_page()' stabilizes the page and prevents races against
	 * concurrent isolation threads attempting to re-isolate it.
	 */
	lock_page(page);

	if (WARN_ON(!__is_movable_balloon_page(page))) {
		dump_page(page);
	} else {
		__putback_balloon_page(page);
		/* drop the extra ref count taken for page isolation */
		put_page(page);
	}

	unlock_page(page);
}
|  | 
 | ||
|  | /* move_to_new_page() counterpart for a ballooned page */ | ||
|  | int balloon_page_migrate(struct page *newpage, | ||
|  | 			 struct page *page, enum migrate_mode mode) | ||
|  | { | ||
|  | 	struct address_space *mapping; | ||
|  | 	int rc = -EAGAIN; | ||
|  | 
 | ||
|  | 	/*
 | ||
|  | 	 * Block others from accessing the 'newpage' when we get around to | ||
|  | 	 * establishing additional references. We should be the only one | ||
|  | 	 * holding a reference to the 'newpage' at this point. | ||
|  | 	 */ | ||
|  | 	BUG_ON(!trylock_page(newpage)); | ||
|  | 
 | ||
|  | 	if (WARN_ON(!__is_movable_balloon_page(page))) { | ||
|  | 		dump_page(page); | ||
|  | 		unlock_page(newpage); | ||
|  | 		return rc; | ||
|  | 	} | ||
|  | 
 | ||
|  | 	mapping = page->mapping; | ||
|  | 	if (mapping) | ||
|  | 		rc = __migrate_balloon_page(mapping, newpage, page, mode); | ||
|  | 
 | ||
|  | 	unlock_page(newpage); | ||
|  | 	return rc; | ||
|  | } | ||
|  | #endif /* CONFIG_BALLOON_COMPACTION */
 |