These changes are the raw update to linux-4.4.6-rt14. Kernel sources

[kvmfornfv.git] / kernel / mm / slab.c
diff --git a/kernel/mm/slab.c b/kernel/mm/slab.c

index 3dd2d1f..4765c97 100644 (file)
--- a/kernel/mm/slab.c
+++ b/kernel/mm/slab.c
@@ -282,6 +282,7 @@ static void kmem_cache_node_init(struct kmem_cache_node *parent)
  
  #define CFLGS_OFF_SLAB         (0x80000000UL)
  #define        OFF_SLAB(x)     ((x)->flags & CFLGS_OFF_SLAB)
+#define OFF_SLAB_MIN_SIZE (max_t(size_t, PAGE_SIZE >> 5, KMALLOC_MIN_SIZE + 1))
  
  #define BATCHREFILL_LIMIT      16
  /*
@@ -1030,12 +1031,12 @@ static inline int cache_free_alien(struct kmem_cache *cachep, void *objp)
  }
  
  /*
- * Construct gfp mask to allocate from a specific node but do not invoke reclaim
- * or warn about failures.
+ * Construct gfp mask to allocate from a specific node but do not direct reclaim
+ * or warn about failures. kswapd may still wake to reclaim in the background.
   */
  static inline gfp_t gfp_exact_node(gfp_t flags)
  {
-       return (flags | __GFP_THISNODE | __GFP_NOWARN) & ~__GFP_WAIT;
+       return (flags | __GFP_THISNODE | __GFP_NOWARN) & ~__GFP_DIRECT_RECLAIM;
  }
  #endif
  
@@ -1454,6 +1455,7 @@ void __init kmem_cache_init(void)
         kmalloc_caches[INDEX_NODE] = create_kmalloc_cache("kmalloc-node",
                                 kmalloc_size(INDEX_NODE), ARCH_KMALLOC_FLAGS);
         slab_state = PARTIAL_NODE;
+       setup_kmalloc_cache_index_table();
  
         slab_early_init = 0;
  
@@ -1591,16 +1593,17 @@ static struct page *kmem_getpages(struct kmem_cache *cachep, gfp_t flags,
         if (cachep->flags & SLAB_RECLAIM_ACCOUNT)
                 flags |= __GFP_RECLAIMABLE;
  
-       if (memcg_charge_slab(cachep, flags, cachep->gfporder))
-               return NULL;
-
-       page = alloc_pages_exact_node(nodeid, flags | __GFP_NOTRACK, cachep->gfporder);
+       page = __alloc_pages_node(nodeid, flags | __GFP_NOTRACK, cachep->gfporder);
         if (!page) {
-               memcg_uncharge_slab(cachep, cachep->gfporder);
                 slab_out_of_memory(cachep, flags, nodeid);
                 return NULL;
         }
  
+       if (memcg_charge_slab(page, flags, cachep->gfporder, cachep)) {
+               __free_pages(page, cachep->gfporder);
+               return NULL;
+       }
+
         /* Record if ALLOC_NO_WATERMARKS was set when allocating the slab */
         if (page_is_pfmemalloc(page))
                 pfmemalloc_active = true;
@@ -1652,8 +1655,7 @@ static void kmem_freepages(struct kmem_cache *cachep, struct page *page)
  
         if (current->reclaim_state)
                 current->reclaim_state->reclaimed_slab += nr_freed;
-       __free_pages(page, cachep->gfporder);
-       memcg_uncharge_slab(cachep, cachep->gfporder);
+       __free_kmem_pages(page, cachep->gfporder);
  }
  
  static void kmem_rcu_free(struct rcu_head *head)
@@ -1887,21 +1889,10 @@ static void slab_destroy(struct kmem_cache *cachep, struct page *page)
  
         freelist = page->freelist;
         slab_destroy_debugcheck(cachep, page);
-       if (unlikely(cachep->flags & SLAB_DESTROY_BY_RCU)) {
-               struct rcu_head *head;
-
-               /*
-                * RCU free overloads the RCU head over the LRU.
-                * slab_page has been overloeaded over the LRU,
-                * however it is not used from now on so that
-                * we can use it safely.
-                */
-               head = (void *)&page->rcu_head;
-               call_rcu(head, kmem_rcu_free);
-
-       } else {
+       if (unlikely(cachep->flags & SLAB_DESTROY_BY_RCU))
+               call_rcu(&page->rcu_head, kmem_rcu_free);
+       else
                 kmem_freepages(cachep, page);
-       }
  
         /*
          * From now on, we don't use freelist
@@ -2189,9 +2180,16 @@ __kmem_cache_create (struct kmem_cache *cachep, unsigned long flags)
                         size += BYTES_PER_WORD;
         }
  #if FORCED_DEBUG && defined(CONFIG_DEBUG_PAGEALLOC)
-       if (size >= kmalloc_size(INDEX_NODE + 1)
-           && cachep->object_size > cache_line_size()
-           && ALIGN(size, cachep->align) < PAGE_SIZE) {
+       /*
+        * To activate debug pagealloc, off-slab management is necessary
+        * requirement. In early phase of initialization, small sized slab
+        * doesn't get initialized so it would not be possible. So, we need
+        * to check size >= 256. It guarantees that all necessary small
+        * sized slab is initialized in current slab initialization sequence.
+        */
+       if (!slab_early_init && size >= kmalloc_size(INDEX_NODE) &&
+               size >= 256 && cachep->object_size > cache_line_size() &&
+               ALIGN(size, cachep->align) < PAGE_SIZE) {
                 cachep->obj_offset += PAGE_SIZE - ALIGN(size, cachep->align);
                 size = PAGE_SIZE;
         }
@@ -2204,7 +2202,7 @@ __kmem_cache_create (struct kmem_cache *cachep, unsigned long flags)
          * it too early on. Always use on-slab management when
          * SLAB_NOLEAKTRACE to avoid recursive calls into kmemleak)
          */
-       if ((size >= (PAGE_SIZE >> 5)) && !slab_early_init &&
+       if (size >= OFF_SLAB_MIN_SIZE && !slab_early_init &&
             !(flags & SLAB_NOLEAKTRACE))
                 /*
                  * Size is large, assume best to place the slab management obj
@@ -2268,7 +2266,7 @@ __kmem_cache_create (struct kmem_cache *cachep, unsigned long flags)
                 /*
                  * This is a possibility for one of the kmalloc_{dma,}_caches.
                  * But since we go off slab only for object size greater than
-                * PAGE_SIZE/8, and kmalloc_{dma,}_caches get created
+                * OFF_SLAB_MIN_SIZE, and kmalloc_{dma,}_caches get created
                  * in ascending order,this should not happen at all.
                  * But leave a BUG_ON for some lucky dude.
                  */
@@ -2624,7 +2622,7 @@ static int cache_grow(struct kmem_cache *cachep,
  
         offset *= cachep->colour_off;
  
-       if (local_flags & __GFP_WAIT)
+       if (gfpflags_allow_blocking(local_flags))
                 local_irq_enable();
  
         /*
@@ -2654,7 +2652,7 @@ static int cache_grow(struct kmem_cache *cachep,
  
         cache_init_objs(cachep, page);
  
-       if (local_flags & __GFP_WAIT)
+       if (gfpflags_allow_blocking(local_flags))
                 local_irq_disable();
         check_irq_off();
         spin_lock(&n->list_lock);
@@ -2668,7 +2666,7 @@ static int cache_grow(struct kmem_cache *cachep,
  opps1:
         kmem_freepages(cachep, page);
  failed:
-       if (local_flags & __GFP_WAIT)
+       if (gfpflags_allow_blocking(local_flags))
                 local_irq_disable();
         return 0;
  }
@@ -2860,7 +2858,7 @@ force_grow:
  static inline void cache_alloc_debugcheck_before(struct kmem_cache *cachep,
                                                 gfp_t flags)
  {
-       might_sleep_if(flags & __GFP_WAIT);
+       might_sleep_if(gfpflags_allow_blocking(flags));
  #if DEBUG
         kmem_flagcheck(cachep, flags);
  #endif
@@ -3048,11 +3046,11 @@ retry:
                  */
                 struct page *page;
  
-               if (local_flags & __GFP_WAIT)
+               if (gfpflags_allow_blocking(local_flags))
                         local_irq_enable();
                 kmem_flagcheck(cache, flags);
                 page = kmem_getpages(cache, local_flags, numa_mem_id());
-               if (local_flags & __GFP_WAIT)
+               if (gfpflags_allow_blocking(local_flags))
                         local_irq_disable();
                 if (page) {
                         /*
@@ -3415,6 +3413,19 @@ void *kmem_cache_alloc(struct kmem_cache *cachep, gfp_t flags)
  }
  EXPORT_SYMBOL(kmem_cache_alloc);
  
+void kmem_cache_free_bulk(struct kmem_cache *s, size_t size, void **p)
+{
+       __kmem_cache_free_bulk(s, size, p);
+}
+EXPORT_SYMBOL(kmem_cache_free_bulk);
+
+int kmem_cache_alloc_bulk(struct kmem_cache *s, gfp_t flags, size_t size,
+                                                               void **p)
+{
+       return __kmem_cache_alloc_bulk(s, flags, size, p);
+}
+EXPORT_SYMBOL(kmem_cache_alloc_bulk);
+
  #ifdef CONFIG_TRACING
  void *
  kmem_cache_alloc_trace(struct kmem_cache *cachep, gfp_t flags, size_t size)