set_page_private(page, 0);
}
-/*
- * Locate the struct page for both the matching buddy in our
- * pair (buddy1) and the combined O(n+1) page they form (page).
- *
- * 1) Any buddy B1 will have an order O twin B2 which satisfies
- * the following equation:
- * B2 = B1 ^ (1 << O)
- * For example, if the starting buddy (buddy2) is #8 its order
- * 1 buddy is #10:
- * B2 = 8 ^ (1 << 1) = 8 ^ 2 = 10
- *
- * 2) Any buddy B will have an order O+1 parent P which
- * satisfies the following equation:
- * P = B & ~(1 << O)
- *
- * Assumption: *_mem_map is contiguous at least up to MAX_ORDER
- */
-static inline unsigned long
-__find_buddy_index(unsigned long page_idx, unsigned int order)
-{
- return page_idx ^ (1 << order);
-}
-
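/*
 * Illustrative sketch, not part of the patch: the buddy arithmetic from
 * the comment removed above, as a standalone userspace program.
 * find_buddy_index() mirrors __find_buddy_index(); the parent computation
 * follows the "P = B & ~(1 << O)" rule.
 */
#include <stdio.h>

static unsigned long find_buddy_index(unsigned long page_idx, unsigned int order)
{
	/* Flip bit 'order': buddies of order O differ only in that bit. */
	return page_idx ^ (1UL << order);
}

static unsigned long find_parent_index(unsigned long page_idx, unsigned int order)
{
	/* Clear bit 'order': the merged order O+1 block starts here. */
	return page_idx & ~(1UL << order);
}

int main(void)
{
	/* The example from the comment: page #8 at order 1 pairs with #10. */
	printf("buddy of 8 at order 1:   %lu\n", find_buddy_index(8, 1));   /* 10 */
	printf("parent of 10 at order 1: %lu\n", find_parent_index(10, 1)); /* 8 */
	return 0;
}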
/*
* This function checks whether a page is free && is the buddy
* we can coalesce a page and its buddy if
unsigned long combined_idx;
unsigned long uninitialized_var(buddy_idx);
struct page *buddy;
+ int max_order = MAX_ORDER;
VM_BUG_ON(!zone_is_initialized(zone));
return;
VM_BUG_ON(migratetype == -1);
+ if (is_migrate_isolate(migratetype)) {
+ /*
+ * We restrict the max order of merging to prevent merging
+ * between free pages on an isolated pageblock and a normal
+ * pageblock. Without this, pageblock isolation could cause
+ * incorrect freepage accounting.
+ */
+ max_order = min(MAX_ORDER, pageblock_order + 1);
+ } else {
+ __mod_zone_freepage_state(zone, 1 << order, migratetype);
+ }
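/*
 * Worked example, not part of the patch: assuming the common configuration
 * MAX_ORDER = 11 and pageblock_order = 9 (x86_64 with huge pages), the cap
 * above yields max_order = 10. The merge loop below runs
 * while (order < max_order - 1), so the largest buddy formed from an
 * isolated pageblock is order 9, exactly one pageblock, and a merge that
 * spans the isolated/normal pageblock boundary is never attempted.
 */
#include <stdio.h>

#define MAX_ORDER        11
#define pageblock_order  9
#define min(a, b)        ((a) < (b) ? (a) : (b))

int main(void)
{
	int max_order = min(MAX_ORDER, pageblock_order + 1);

	printf("max_order = %d, largest merged order = %d\n",
	       max_order, max_order - 1);
	return 0;
}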
- page_idx = pfn & ((1 << MAX_ORDER) - 1);
+ page_idx = pfn & ((1 << max_order) - 1);
VM_BUG_ON_PAGE(page_idx & ((1 << order) - 1), page);
VM_BUG_ON_PAGE(bad_range(zone, page), page);
- while (order < MAX_ORDER-1) {
+ while (order < max_order - 1) {
buddy_idx = __find_buddy_index(page_idx, order);
buddy = page + (buddy_idx - page_idx);
if (!page_is_buddy(page, buddy, order))
*/
if (page_is_guard(buddy)) {
clear_page_guard_flag(buddy);
- set_page_private(page, 0);
- __mod_zone_freepage_state(zone, 1 << order,
- migratetype);
+ set_page_private(buddy, 0);
+ if (!is_migrate_isolate(migratetype)) {
+ __mod_zone_freepage_state(zone, 1 << order,
+ migratetype);
+ }
} else {
list_del(&buddy->lru);
zone->free_area[order].nr_free--;
/* must delete as __free_one_page list manipulates */
list_del(&page->lru);
mt = get_freepage_migratetype(page);
+ if (unlikely(has_isolate_pageblock(zone)))
+ mt = get_pageblock_migratetype(page);
+
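/*
 * Note, not part of the patch: pages on the pcplists carry the migratetype
 * cached when they were freed to the list; once a pageblock has been
 * isolated that cached value can be stale, so the pageblock's current
 * migratetype is rechecked here before the page goes back to the buddy
 * freelists.
 */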
/* MIGRATE_MOVABLE list may include MIGRATE_RESERVEs */
__free_one_page(page, page_to_pfn(page), zone, 0, mt);
trace_mm_page_pcpu_drain(page, 0, mt);
- if (likely(!is_migrate_isolate_page(page))) {
- __mod_zone_page_state(zone, NR_FREE_PAGES, 1);
- if (is_migrate_cma(mt))
- __mod_zone_page_state(zone, NR_FREE_CMA_PAGES, 1);
- }
} while (--to_free && --batch_free && !list_empty(list));
}
spin_unlock(&zone->lock);
if (nr_scanned)
__mod_zone_page_state(zone, NR_PAGES_SCANNED, -nr_scanned);
+ if (unlikely(has_isolate_pageblock(zone) ||
+ is_migrate_isolate(migratetype))) {
+ migratetype = get_pfnblock_migratetype(page, pfn);
+ }
__free_one_page(page, pfn, zone, order, migratetype);
- if (unlikely(!is_migrate_isolate(migratetype)))
- __mod_zone_freepage_state(zone, 1 << order, migratetype);
spin_unlock(&zone->lock);
}
int i;
int bad = 0;
+ VM_BUG_ON_PAGE(PageTail(page), page);
+ VM_BUG_ON_PAGE(PageHead(page) && compound_order(page) != order, page);
+
trace_mm_page_free(page, order);
kmemcheck_free_shadow(page, order);
#endif
/*
- * Drain pages of the indicated processor.
+ * Drain pcplists of the indicated processor and zone.
*
* The processor must either be the current processor and the
* thread pinned to the current processor or a processor that
* is not online.
*/
-static void drain_pages(unsigned int cpu)
+static void drain_pages_zone(unsigned int cpu, struct zone *zone)
{
unsigned long flags;
- struct zone *zone;
+ struct per_cpu_pageset *pset;
+ struct per_cpu_pages *pcp;
- for_each_populated_zone(zone) {
- struct per_cpu_pageset *pset;
- struct per_cpu_pages *pcp;
+ local_irq_save(flags);
+ pset = per_cpu_ptr(zone->pageset, cpu);
- local_irq_save(flags);
- pset = per_cpu_ptr(zone->pageset, cpu);
+ pcp = &pset->pcp;
+ if (pcp->count) {
+ free_pcppages_bulk(zone, pcp->count, pcp);
+ pcp->count = 0;
+ }
+ local_irq_restore(flags);
+}
- pcp = &pset->pcp;
- if (pcp->count) {
- free_pcppages_bulk(zone, pcp->count, pcp);
- pcp->count = 0;
- }
- local_irq_restore(flags);
+/*
+ * Drain pcplists of all zones on the indicated processor.
+ *
+ * The processor must either be the current processor and the
+ * thread pinned to the current processor or a processor that
+ * is not online.
+ */
+static void drain_pages(unsigned int cpu)
+{
+ struct zone *zone;
+
+ for_each_populated_zone(zone) {
+ drain_pages_zone(cpu, zone);
}
}
/*
* Spill all of this CPU's per-cpu pages back into the buddy allocator.
+ *
+ * The CPU has to be pinned. When zone parameter is non-NULL, spill just
+ * the single zone's pages.
*/
-void drain_local_pages(void *arg)
+void drain_local_pages(struct zone *zone)
{
- drain_pages(smp_processor_id());
+ int cpu = smp_processor_id();
+
+ if (zone)
+ drain_pages_zone(cpu, zone);
+ else
+ drain_pages(cpu);
}
/*
* Spill all the per-cpu pages from all CPUs back into the buddy allocator.
*
+ * When zone parameter is non-NULL, spill just the single zone's pages.
+ *
* Note that this code is protected against sending an IPI to an offline
* CPU but does not guarantee sending an IPI to newly hotplugged CPUs:
* on_each_cpu_mask() blocks hotplug and won't talk to offlined CPUs but
* nothing keeps CPUs from showing up after we populated the cpumask and
* before the call to on_each_cpu_mask().
*/
-void drain_all_pages(void)
+void drain_all_pages(struct zone *zone)
{
int cpu;
- struct per_cpu_pageset *pcp;
- struct zone *zone;
/*
* Allocate in the BSS so we won't require allocation in
* disables preemption as part of its processing
*/
for_each_online_cpu(cpu) {
+ struct per_cpu_pageset *pcp;
+ struct zone *z;
bool has_pcps = false;
- for_each_populated_zone(zone) {
+
+ if (zone) {
pcp = per_cpu_ptr(zone->pageset, cpu);
- if (pcp->pcp.count) {
+ if (pcp->pcp.count)
has_pcps = true;
- break;
+ } else {
+ for_each_populated_zone(z) {
+ pcp = per_cpu_ptr(z->pageset, cpu);
+ if (pcp->pcp.count) {
+ has_pcps = true;
+ break;
+ }
}
}
+
if (has_pcps)
cpumask_set_cpu(cpu, &cpus_with_pcps);
else
cpumask_clear_cpu(cpu, &cpus_with_pcps);
}
- on_each_cpu_mask(&cpus_with_pcps, drain_local_pages, NULL, 1);
+ on_each_cpu_mask(&cpus_with_pcps, (smp_call_func_t) drain_local_pages,
+ zone, 1);
}
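/*
 * Usage note, not part of the patch: drain_local_pages() now takes a
 * struct zone *, and on_each_cpu_mask() hands that pointer back as the
 * void *info argument, hence the smp_call_func_t cast above. Callers
 * updated below pass NULL to drain every populated zone (see
 * drain_all_pages(NULL) in the direct-reclaim retry path) or a specific
 * zone (see drain_all_pages(cc.zone) in alloc_contig_range()).
 */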
#ifdef CONFIG_HIBERNATION
}
EXPORT_SYMBOL_GPL(split_page);
-static int __isolate_free_page(struct page *page, unsigned int order)
+int __isolate_free_page(struct page *page, unsigned int order)
{
unsigned long watermark;
struct zone *zone;
compact_result = try_to_compact_pages(zonelist, order, gfp_mask,
nodemask, mode,
contended_compaction,
+ alloc_flags, classzone_idx,
&last_compact_zone);
current->flags &= ~PF_MEMALLOC;
* pages are pinned on the per-cpu lists. Drain them and try again
*/
if (!page && !drained) {
- drain_all_pages();
+ drain_all_pages(NULL);
drained = true;
goto retry;
}
else
page_group_by_mobility_disabled = 0;
- printk("Built %i zonelists in %s order, mobility grouping %s. "
+ pr_info("Built %i zonelists in %s order, mobility grouping %s. "
"Total pages: %ld\n",
nr_online_nodes,
zonelist_order_name[current_zonelist_order],
page_group_by_mobility_disabled ? "off" : "on",
vm_total_pages);
#ifdef CONFIG_NUMA
- printk("Policy zone: %s\n", zone_names[policy_zone]);
+ pr_info("Policy zone: %s\n", zone_names[policy_zone]);
#endif
}
find_zone_movable_pfns_for_nodes();
/* Print out the zone ranges */
- printk("Zone ranges:\n");
+ pr_info("Zone ranges:\n");
for (i = 0; i < MAX_NR_ZONES; i++) {
if (i == ZONE_MOVABLE)
continue;
- printk(KERN_CONT " %-8s ", zone_names[i]);
+ pr_info(" %-8s ", zone_names[i]);
if (arch_zone_lowest_possible_pfn[i] ==
arch_zone_highest_possible_pfn[i])
- printk(KERN_CONT "empty\n");
+ pr_cont("empty\n");
else
- printk(KERN_CONT "[mem %0#10lx-%0#10lx]\n",
+ pr_cont("[mem %0#10lx-%0#10lx]\n",
arch_zone_lowest_possible_pfn[i] << PAGE_SHIFT,
(arch_zone_highest_possible_pfn[i]
<< PAGE_SHIFT) - 1);
}
/* Print out the PFNs ZONE_MOVABLE begins at in each node */
- printk("Movable zone start for each node\n");
+ pr_info("Movable zone start for each node\n");
for (i = 0; i < MAX_NUMNODES; i++) {
if (zone_movable_pfn[i])
- printk(" Node %d: %#010lx\n", i,
+ pr_info(" Node %d: %#010lx\n", i,
zone_movable_pfn[i] << PAGE_SHIFT);
}
/* Print out the early node map */
- printk("Early memory node ranges\n");
+ pr_info("Early memory node ranges\n");
for_each_mem_pfn_range(i, MAX_NUMNODES, &start_pfn, &end_pfn, &nid)
- printk(" node %3d: [mem %#010lx-%#010lx]\n", nid,
+ pr_info(" node %3d: [mem %#010lx-%#010lx]\n", nid,
start_pfn << PAGE_SHIFT, (end_pfn << PAGE_SHIFT) - 1);
/* Initialise every node */
#undef adj_init_size
- printk("Memory: %luK/%luK available "
+ pr_info("Memory: %luK/%luK available "
"(%luK kernel code, %luK rwdata, %luK rodata, "
"%luK init, %luK bss, %luK reserved"
#ifdef CONFIG_HIGHMEM
*/
lru_add_drain_all();
- drain_all_pages();
+ drain_all_pages(cc.zone);
order = 0;
outer_start = start;
/* Make sure the range is really isolated. */
if (test_pages_isolated(outer_start, end, false)) {
- pr_warn("alloc_contig_range test_pages_isolated(%lx, %lx) failed\n",
- outer_start, end);
+ pr_info("%s: [%lx, %lx) PFNs busy\n",
+ __func__, outer_start, end);
ret = -EBUSY;
goto done;
}
-
/* Grab isolated pages from freelists. */
outer_end = isolate_freepages_range(&cc, outer_start, end);
if (!outer_end) {