kmalloc() and kmalloc_node() in SLUB are not inlined when @flags includes
__GFP_DMA. This patch optimizes that case, so that these calls are inlined
into the generic code even when @flags includes __GFP_DMA.

Cc: Christoph Lameter <c...@linux.com>
Signed-off-by: Joonsoo Kim <js1...@gmail.com>
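
As a minimal illustration (not part of the patch; GFP_DMA expands to
__GFP_DMA, which SLUB_DMA aliases when CONFIG_ZONE_DMA is set), a
constant-size DMA allocation now takes the inline fast path:

	/* kmalloc_index(64) is computed at compile time, so with this
	 * patch the call below resolves to an inline lookup of
	 * kmalloc_dma_caches[index] plus a direct call to
	 * kmem_cache_alloc_trace(), instead of falling back to
	 * __kmalloc() as it did before.
	 */
	void *buf = kmalloc(64, GFP_KERNEL | GFP_DMA);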

diff --git a/include/linux/slub_def.h b/include/linux/slub_def.h
index 4c75f2b..4adf50b 100644
--- a/include/linux/slub_def.h
+++ b/include/linux/slub_def.h
@@ -147,6 +147,7 @@ struct kmem_cache {
  * 2^x bytes of allocations.
  */
 extern struct kmem_cache *kmalloc_caches[SLUB_PAGE_SHIFT];
+extern struct kmem_cache *kmalloc_dma_caches[SLUB_PAGE_SHIFT];
 
 /*
  * Sorry that the following has to be that ugly but some versions of GCC
@@ -266,19 +267,24 @@ static __always_inline void *kmalloc_large(size_t size, gfp_t flags)
 
 static __always_inline void *kmalloc(size_t size, gfp_t flags)
 {
+       struct kmem_cache *s;
+       int index;
+
        if (__builtin_constant_p(size)) {
                if (size > SLUB_MAX_SIZE)
                        return kmalloc_large(size, flags);
 
-               if (!(flags & SLUB_DMA)) {
-                       int index = kmalloc_index(size);
-                       struct kmem_cache *s = kmalloc_caches[index];
-
-                       if (!index)
-                               return ZERO_SIZE_PTR;
+               index = kmalloc_index(size);
+               if (!index)
+                       return ZERO_SIZE_PTR;
+#ifdef CONFIG_ZONE_DMA
+               if (unlikely(flags & SLUB_DMA)) {
+                       s = kmalloc_dma_caches[index];
+               } else
+#endif
+                       s = kmalloc_caches[index];
 
-                       return kmem_cache_alloc_trace(s, flags, size);
-               }
+               return kmem_cache_alloc_trace(s, flags, size);
        }
        return __kmalloc(size, flags);
 }
@@ -303,13 +309,19 @@ kmem_cache_alloc_node_trace(struct kmem_cache *s,
 
 static __always_inline void *kmalloc_node(size_t size, gfp_t flags, int node)
 {
-       if (__builtin_constant_p(size) &&
-               size <= SLUB_MAX_SIZE && !(flags & SLUB_DMA)) {
-               int index = kmalloc_index(size);
-               struct kmem_cache *s = kmalloc_caches[index];
+       struct kmem_cache *s;
+       int index;
 
+       if (__builtin_constant_p(size) && size <= SLUB_MAX_SIZE) {
+               index = kmalloc_index(size);
                if (!index)
                        return ZERO_SIZE_PTR;
+#ifdef CONFIG_ZONE_DMA
+               if (unlikely(flags & SLUB_DMA)) {
+                       s = kmalloc_dma_caches[index];
+               } else
+#endif
+                       s = kmalloc_caches[index];
 
                return kmem_cache_alloc_node_trace(s, flags, node, size);
        }
diff --git a/mm/slub.c b/mm/slub.c
index a0d6984..a94533c 100644
--- a/mm/slub.c
+++ b/mm/slub.c
@@ -3222,7 +3222,8 @@ struct kmem_cache *kmalloc_caches[SLUB_PAGE_SHIFT];
 EXPORT_SYMBOL(kmalloc_caches);
 
 #ifdef CONFIG_ZONE_DMA
-static struct kmem_cache *kmalloc_dma_caches[SLUB_PAGE_SHIFT];
+struct kmem_cache *kmalloc_dma_caches[SLUB_PAGE_SHIFT];
+EXPORT_SYMBOL(kmalloc_dma_caches);
 #endif
 
 static int __init setup_slub_min_order(char *str)
-- 
1.7.9.5
