Bias the placement of kernel pages at lower PFNs
author Mel Gorman <mel@csn.ul.ie>
Tue, 16 Oct 2007 08:25:54 +0000 (01:25 -0700)
committer Linus Torvalds <torvalds@woody.linux-foundation.org>
Tue, 16 Oct 2007 16:43:00 +0000 (09:43 -0700)
This patch chooses blocks with lower PFNs when placing kernel allocations.
This is particularly important during fallback in low memory situations to
stop unmovable pages being placed throughout the entire address space.

Signed-off-by: Mel Gorman <mel@csn.ul.ie>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
mm/page_alloc.c

index 676aec9..e1d87ee 100644 (file)
@@ -765,6 +765,23 @@ int move_freepages_block(struct zone *zone, struct page *page, int migratetype)
        return move_freepages(zone, start_page, end_page, migratetype);
 }
 
+/* Return the page with the lowest PFN in the list (NULL if empty) */
+static struct page *min_page(struct list_head *list)
+{
+       unsigned long min_pfn = -1UL;   /* ULONG_MAX sentinel */
+       struct page *lowest = NULL, *page;
+
+       list_for_each_entry(page, list, lru) {
+               unsigned long pfn = page_to_pfn(page);
+               if (pfn < min_pfn) {
+                       min_pfn = pfn;
+                       lowest = page;
+               }
+       }
+
+       return lowest;
+}
+
 /* Remove an element from the buddy allocator from the fallback list */
 static struct page *__rmqueue_fallback(struct zone *zone, int order,
                                                int start_migratetype)
@@ -795,8 +812,11 @@ retry:
                        if (list_empty(&area->free_list[migratetype]))
                                continue;
 
+                       /* Bias kernel allocations towards low pfns */
                        page = list_entry(area->free_list[migratetype].next,
                                        struct page, lru);
+                       if (unlikely(start_migratetype != MIGRATE_MOVABLE))
+                               page = min_page(&area->free_list[migratetype]);
                        area->nr_free--;
 
                        /*