[PATCH] fix a bogus OOM condition for __GFP_NOFS allocations

author Andrew Morton <akpm@digeo.com>

Sun, 15 Sep 2002 15:50:53 +0000 (08:50 -0700)

committer Christoph Hellwig <hch@hera.kernel.org>

Sun, 15 Sep 2002 15:50:53 +0000 (08:50 -0700)
author Andrew Morton <akpm@digeo.com>
Sun, 15 Sep 2002 15:50:53 +0000 (08:50 -0700)
committer Christoph Hellwig <hch@hera.kernel.org>
Sun, 15 Sep 2002 15:50:53 +0000 (08:50 -0700)
diff --git a/mm/mempool.c b/mm/mempool.c

index 94a5352feb8cc5f91b07e523d0df6b1d3703ca60..b92e72b211d3f55bfeb9d5111f6c4f5369ff284b 100644 (file)
--- a/mm/mempool.c
+++ b/mm/mempool.c
@@ -196,10 +196,11 @@ repeat_alloc:
                 return element;
  
         /*
-        * If the pool is less than 50% full then try harder
-        * to allocate an element:
+        * If the pool is less than 50% full and we can perform effective
+        * page reclaim then try harder to allocate an element.
          */
-       if ((gfp_mask != gfp_nowait) && (pool->curr_nr <= pool->min_nr/2)) {
+       if ((gfp_mask & __GFP_FS) && (gfp_mask != gfp_nowait) &&
+                               (pool->curr_nr <= pool->min_nr/2)) {
                 element = pool->alloc(gfp_mask, pool->pool_data);
                 if (likely(element != NULL))
                         return element;
diff --git a/mm/vmscan.c b/mm/vmscan.c

index a0979a8cb88cf45df9b7ef093143de65a46e1fb6..f220b40fc9c1b4e92378c08b45e5bc1a1cb7f38a 100644 (file)
--- a/mm/vmscan.c
+++ b/mm/vmscan.c
@@ -536,6 +536,20 @@ shrink_caches(struct zone *classzone, int priority,
  
  /*
   * This is the main entry point to page reclaim.
+ *
+ * If a full scan of the inactive list fails to free enough memory then we
+ * are "out of memory" and something needs to be killed.
+ *
+ * If the caller is !__GFP_FS then the probability of a failure is reasonably
+ * high - the zone may be full of dirty or under-writeback pages, which this
+ * caller can't do much about.  So for !__GFP_FS callers, we just perform a
+ * small LRU walk and if that didn't work out, fail the allocation back to the
+ * caller.  GFP_NOFS allocators need to know how to deal with it.  Kicking
+ * bdflush, waiting and retrying will work.
+ *
+ * This is a fairly lame algorithm - it can result in excessive CPU burning and
+ * excessive rotation of the inactive list, which is _supposed_ to be an LRU,
+ * yes?
   */
  int
  try_to_free_pages(struct zone *classzone,
@@ -546,13 +560,16 @@ try_to_free_pages(struct zone *classzone,
  
         KERNEL_STAT_INC(pageoutrun);
  
-       do {
+       for (priority = DEF_PRIORITY; priority; priority--) {
                 nr_pages = shrink_caches(classzone, priority,
                                         gfp_mask, nr_pages);
                 if (nr_pages <= 0)
                         return 1;
-       } while (--priority);
-       out_of_memory();
+               if (!(gfp_mask & __GFP_FS))
+                       break;
+       }
+       if (gfp_mask & __GFP_FS)
+               out_of_memory();
         return 0;
  }
author	Andrew Morton <akpm@digeo.com>
	Sun, 15 Sep 2002 15:50:53 +0000 (08:50 -0700)
committer	Christoph Hellwig <hch@hera.kernel.org>
	Sun, 15 Sep 2002 15:50:53 +0000 (08:50 -0700)
mm/mempool.c		patch | blob | history
mm/vmscan.c		patch | blob | history