cpuset: PF_SPREAD_PAGE and PF_SPREAD_SLAB should be atomic flags

author Zefan Li <lizefan@huawei.com>
Thu, 25 Sep 2014 01:41:02 +0000 (09:41 +0800)

committer Ben Hutchings <ben@decadent.org.uk>
Thu, 12 Oct 2017 14:27:22 +0000 (15:27 +0100)

diff --git a/Documentation/cgroups/cpusets.txt b/Documentation/cgroups/cpusets.txt

index 5c51ed4..eedecbb 100644 (file)
--- a/Documentation/cgroups/cpusets.txt
+++ b/Documentation/cgroups/cpusets.txt
@@ -345,14 +345,14 @@ the named feature on.
  The implementation is simple.
  
  Setting the flag 'cpuset.memory_spread_page' turns on a per-process flag
-PF_SPREAD_PAGE for each task that is in that cpuset or subsequently
+PFA_SPREAD_PAGE for each task that is in that cpuset or subsequently
  joins that cpuset.  The page allocation calls for the page cache
-is modified to perform an inline check for this PF_SPREAD_PAGE task
+is modified to perform an inline check for this PFA_SPREAD_PAGE task
  flag, and if set, a call to a new routine cpuset_mem_spread_node()
  returns the node to prefer for the allocation.
  
  Similarly, setting 'cpuset.memory_spread_slab' turns on the flag
-PF_SPREAD_SLAB, and appropriately marked slab caches will allocate
+PFA_SPREAD_SLAB, and appropriately marked slab caches will allocate
  pages from the node returned by cpuset_mem_spread_node().
  
  The cpuset_mem_spread_node() routine is also simple.  It uses the
diff --git a/include/linux/cpuset.h b/include/linux/cpuset.h

index 7a7e5fd..1dc9427 100644 (file)
--- a/include/linux/cpuset.h
+++ b/include/linux/cpuset.h
@@ -74,12 +74,12 @@ extern int cpuset_slab_spread_node(void);
  
  static inline int cpuset_do_page_mem_spread(void)
  {
-       return current->flags & PF_SPREAD_PAGE;
+       return task_spread_page(current);
  }
  
  static inline int cpuset_do_slab_mem_spread(void)
  {
-       return current->flags & PF_SPREAD_SLAB;
+       return task_spread_slab(current);
  }
  
  extern int current_cpuset_is_being_rebound(void);
diff --git a/include/linux/sched.h b/include/linux/sched.h

index a0ec634..2d4ab76 100644 (file)
--- a/include/linux/sched.h
+++ b/include/linux/sched.h
@@ -1812,8 +1812,6 @@ extern void thread_group_times(struct task_struct *p, cputime_t *ut, cputime_t *
  #define PF_KTHREAD     0x00200000      /* I am a kernel thread */
  #define PF_RANDOMIZE   0x00400000      /* randomize virtual address space */
  #define PF_SWAPWRITE   0x00800000      /* Allowed to write to swap */
-#define PF_SPREAD_PAGE 0x01000000      /* Spread page cache over cpuset */
-#define PF_SPREAD_SLAB 0x02000000      /* Spread some slab caches over cpuset */
  #define PF_THREAD_BOUND        0x04000000      /* Thread bound to specific cpu */
  #define PF_MCE_EARLY    0x08000000      /* Early kill for mce process policy */
  #define PF_MEMPOLICY   0x10000000      /* Non-default NUMA mempolicy */
@@ -1847,6 +1845,8 @@ extern void thread_group_times(struct task_struct *p, cputime_t *ut, cputime_t *
  #define used_math() tsk_used_math(current)
  
  /* Per-process atomic flags. */
+#define PFA_SPREAD_PAGE  1      /* Spread page cache over cpuset */
+#define PFA_SPREAD_SLAB  2      /* Spread some slab caches over cpuset */
  
  #define TASK_PFA_TEST(name, func)                                      \
         static inline bool task_##func(struct task_struct *p)           \
@@ -1950,6 +1950,14 @@ static inline int set_cpus_allowed(struct task_struct *p, cpumask_t new_mask)
  }
  #endif
  
+TASK_PFA_TEST(SPREAD_PAGE, spread_page)
+TASK_PFA_SET(SPREAD_PAGE, spread_page)
+TASK_PFA_CLEAR(SPREAD_PAGE, spread_page)
+
+TASK_PFA_TEST(SPREAD_SLAB, spread_slab)
+TASK_PFA_SET(SPREAD_SLAB, spread_slab)
+TASK_PFA_CLEAR(SPREAD_SLAB, spread_slab)
+
  /*
   * Do not use outside of architecture code which knows its limitations.
   *
diff --git a/kernel/cpuset.c b/kernel/cpuset.c

index 4346f9a..5cc0eec 100644 (file)
--- a/kernel/cpuset.c
+++ b/kernel/cpuset.c
@@ -326,13 +326,14 @@ static void cpuset_update_task_spread_flag(struct cpuset *cs,
                                         struct task_struct *tsk)
  {
         if (is_spread_page(cs))
-               tsk->flags |= PF_SPREAD_PAGE;
+               task_set_spread_page(tsk);
         else
-               tsk->flags &= ~PF_SPREAD_PAGE;
+               task_clear_spread_page(tsk);
+
         if (is_spread_slab(cs))
-               tsk->flags |= PF_SPREAD_SLAB;
+               task_set_spread_slab(tsk);
         else
-               tsk->flags &= ~PF_SPREAD_SLAB;
+               task_clear_spread_slab(tsk);
  }
  
  /*
diff --git a/mm/slab.c b/mm/slab.c

index aea5e42..bb39255 100644 (file)
--- a/mm/slab.c
+++ b/mm/slab.c
@@ -3255,7 +3255,7 @@ static inline void *____cache_alloc(struct kmem_cache *cachep, gfp_t flags)
  
  #ifdef CONFIG_NUMA
  /*
- * Try allocating on another node if PF_SPREAD_SLAB|PF_MEMPOLICY.
+ * Try allocating on another node if PFA_SPREAD_SLAB|PF_MEMPOLICY.
   *
   * If we are in_interrupt, then process context, including cpusets and
   * mempolicy, may not apply and should not be used for allocation policy.
@@ -3496,7 +3496,7 @@ __do_cache_alloc(struct kmem_cache *cache, gfp_t flags)
  {
         void *objp;
  
-       if (unlikely(current->flags & (PF_SPREAD_SLAB | PF_MEMPOLICY))) {
+       if (unlikely((current->flags & PF_MEMPOLICY) || cpuset_do_slab_mem_spread())) {
                 objp = alternate_node_alloc(cache, flags);
                 if (objp)
                         goto out;
author	Zefan Li <lizefan@huawei.com>
	Thu, 25 Sep 2014 01:41:02 +0000 (09:41 +0800)
committer	Ben Hutchings <ben@decadent.org.uk>
	Thu, 12 Oct 2017 14:27:22 +0000 (15:27 +0100)
Documentation/cgroups/cpusets.txt		patch | blob | history
include/linux/cpuset.h		patch | blob | history
include/linux/sched.h		patch | blob | history
kernel/cpuset.c		patch | blob | history
mm/slab.c		patch | blob | history