ARM: dts: at91: sama5d3: define clock rate range for tcb1

[sagit-ice-cold/kernel_xiaomi_msm8998.git] / kernel / cpuset.c
diff --git a/kernel/cpuset.c b/kernel/cpuset.c

index 02a8ea5..dd3ae6e 100644 (file)
--- a/kernel/cpuset.c
+++ b/kernel/cpuset.c
@@ -57,10 +57,10 @@
  #include <asm/uaccess.h>
  #include <linux/atomic.h>
  #include <linux/mutex.h>
-#include <linux/workqueue.h>
  #include <linux/cgroup.h>
  #include <linux/wait.h>
  
+struct static_key cpusets_pre_enable_key __read_mostly = STATIC_KEY_INIT_FALSE;
  struct static_key cpusets_enabled_key __read_mostly = STATIC_KEY_INIT_FALSE;
  
  /* See "Frequency meter" comments, below. */
@@ -174,9 +174,9 @@ typedef enum {
  } cpuset_flagbits_t;
  
  /* convenient tests for these bits */
-static inline bool is_cpuset_online(const struct cpuset *cs)
+static inline bool is_cpuset_online(struct cpuset *cs)
  {
-       return test_bit(CS_ONLINE, &cs->flags);
+       return test_bit(CS_ONLINE, &cs->flags) && !css_is_dying(&cs->css); /* a dying css is reported as not online */
  }
  
  static inline int is_cpu_exclusive(const struct cpuset *cs)
@@ -286,6 +286,8 @@ static struct cpuset top_cpuset = {
  static DEFINE_MUTEX(cpuset_mutex);
  static DEFINE_SPINLOCK(callback_lock);
  
+static struct workqueue_struct *cpuset_migrate_mm_wq; /* allocated in cpuset_init_smp() */
+
  /*
   * CPU / memory hotplug is handled asynchronously.
   */
@@ -323,8 +325,7 @@ static struct file_system_type cpuset_fs_type = {
  /*
   * Return in pmask the portion of a cpusets's cpus_allowed that
   * are online.  If none are online, walk up the cpuset hierarchy
- * until we find one that does have some online cpus.  The top
- * cpuset always has some cpus online.
+ * until we find one that does have some online cpus.
   *
   * One way or another, we guarantee to return some non-empty subset
   * of cpu_online_mask.
@@ -333,8 +334,20 @@ static struct file_system_type cpuset_fs_type = {
   */
  static void guarantee_online_cpus(struct cpuset *cs, struct cpumask *pmask)
  {
-       while (!cpumask_intersects(cs->effective_cpus, cpu_online_mask))
+       while (!cpumask_intersects(cs->effective_cpus, cpu_online_mask)) {
                 cs = parent_cs(cs);
+               if (unlikely(!cs)) {
+                       /*
+                        * The top cpuset doesn't have any online cpu as a
+                        * consequence of a race between cpuset_hotplug_work
+                        * and cpu hotplug notifier.  But we know the top
+                        * cpuset's effective_cpus is on its way to be
+                        * identical to cpu_online_mask.
+                        */
+                       cpumask_copy(pmask, cpu_online_mask);
+                       return;
+               }
+       }
         cpumask_and(pmask, cs->effective_cpus, cpu_online_mask);
  }
  
@@ -971,31 +984,51 @@ static int update_cpumask(struct cpuset *cs, struct cpuset *trialcs,
  }
  
  /*
- * cpuset_migrate_mm
- *
- *    Migrate memory region from one set of nodes to another.
- *
- *    Temporarilly set tasks mems_allowed to target nodes of migration,
- *    so that the migration code can allocate pages on these nodes.
- *
- *    While the mm_struct we are migrating is typically from some
- *    other task, the task_struct mems_allowed that we are hacking
- *    is for our current task, which must allocate new pages for that
- *    migrating memory region.
+ * Migrate memory region from one set of nodes to another.  This is
+ * performed asynchronously as it can be called from process migration path
+ * holding locks involved in process management.  All mm migrations are
+ * performed in the queued order and can be waited for by flushing
+ * cpuset_migrate_mm_wq.
   */
  
+struct cpuset_migrate_mm_work {
+       struct work_struct      work;   /* queued on cpuset_migrate_mm_wq */
+       struct mm_struct        *mm;    /* released with mmput() by the work function */
+       nodemask_t              from;   /* copy of the source node set */
+       nodemask_t              to;     /* copy of the destination node set */
+};
+
+static void cpuset_migrate_mm_workfn(struct work_struct *work)
+{
+       struct cpuset_migrate_mm_work *mwork =
+               container_of(work, struct cpuset_migrate_mm_work, work);
+
+       /* on a wq worker, no need to worry about %current's mems_allowed */
+       do_migrate_pages(mwork->mm, &mwork->from, &mwork->to, MPOL_MF_MOVE_ALL);
+       mmput(mwork->mm);       /* drop the mm reference carried by the work item */
+       kfree(mwork);           /* allocated in cpuset_migrate_mm() */
+}
+
  static void cpuset_migrate_mm(struct mm_struct *mm, const nodemask_t *from,
                                                         const nodemask_t *to)
  {
-       struct task_struct *tsk = current;
+       struct cpuset_migrate_mm_work *mwork;
  
-       tsk->mems_allowed = *to;
-
-       do_migrate_pages(mm, from, to, MPOL_MF_MOVE_ALL);
+       mwork = kzalloc(sizeof(*mwork), GFP_KERNEL);
+       if (mwork) {
+               mwork->mm = mm; /* the work item now owns the caller's mm reference */
+               mwork->from = *from;    /* copied by value: the work runs after we return */
+               mwork->to = *to;
+               INIT_WORK(&mwork->work, cpuset_migrate_mm_workfn);
+               queue_work(cpuset_migrate_mm_wq, &mwork->work);
+       } else {
+               mmput(mm);      /* no memory: migration is skipped, reference still dropped */
+       }
+}
  
-       rcu_read_lock();
-       guarantee_online_mems(task_cs(tsk), &tsk->mems_allowed);
-       rcu_read_unlock();
+static void cpuset_post_attach(void)
+{
+       flush_workqueue(cpuset_migrate_mm_wq);  /* wait for the queued mm migrations */
  }
  
  /*
@@ -1096,7 +1129,8 @@ static void update_tasks_nodemask(struct cpuset *cs)
                 mpol_rebind_mm(mm, &cs->mems_allowed);
                 if (migrate)
                         cpuset_migrate_mm(mm, &cs->old_mems_allowed, &newmems);
-               mmput(mm);
+               else
+                       mmput(mm);
         }
         css_task_iter_end(&it);
  
@@ -1541,11 +1575,11 @@ static void cpuset_attach(struct cgroup_taskset *tset)
                          * @old_mems_allowed is the right nodesets that we
                          * migrate mm from.
                          */
-                       if (is_memory_migrate(cs)) {
+                       if (is_memory_migrate(cs))
                                 cpuset_migrate_mm(mm, &oldcs->old_mems_allowed,
                                                   &cpuset_attach_nodemask_to);
-                       }
-                       mmput(mm);
+                       else
+                               mmput(mm);
                 }
         }
  
@@ -1710,6 +1744,7 @@ out_unlock:
         mutex_unlock(&cpuset_mutex);
         kernfs_unbreak_active_protection(of->kn);
         css_put(&cs->css);
+       flush_workqueue(cpuset_migrate_mm_wq);
         return retval ?: nbytes;
  }
  
@@ -1875,6 +1910,7 @@ static struct cftype files[] = {
         {
                 .name = "memory_pressure",
                 .read_u64 = cpuset_read_u64,
+               .private = FILE_MEMORY_PRESSURE,
         },
  
         {
@@ -2051,6 +2087,20 @@ static void cpuset_bind(struct cgroup_subsys_state *root_css)
         mutex_unlock(&cpuset_mutex);
  }
  
+/*
+ * Make sure the new task conforms to the current state of its parent,
+ * which could have been changed by cpuset just after it inherits the
+ * state from the parent and before it sits on the cgroup's task list.
+ */
+void cpuset_fork(struct task_struct *task, void *priv) /* @priv is not used here */
+{
+       if (task_css_is_root(task, cpuset_cgrp_id))
+               return;
+
+       set_cpus_allowed_ptr(task, &current->cpus_allowed);
+       task->mems_allowed = current->mems_allowed;
+}
+
  struct cgroup_subsys cpuset_cgrp_subsys = {
         .css_alloc      = cpuset_css_alloc,
         .css_online     = cpuset_css_online,
@@ -2059,7 +2109,9 @@ struct cgroup_subsys cpuset_cgrp_subsys = {
         .can_attach     = cpuset_can_attach,
         .cancel_attach  = cpuset_cancel_attach,
         .attach         = cpuset_attach,
+       .post_attach    = cpuset_post_attach,
         .bind           = cpuset_bind,
+       .fork           = cpuset_fork,
         .legacy_cftypes = files,
         .early_init     = 1,
  };
@@ -2229,6 +2281,13 @@ retry:
         mutex_unlock(&cpuset_mutex);
  }
  
+static bool force_rebuild;     /* tested and cleared in cpuset_hotplug_workfn() */
+
+void cpuset_force_rebuild(void)
+{
+       force_rebuild = true;   /* request rebuild_sched_domains() on the next hotplug work run */
+}
+
  /**
   * cpuset_hotplug_workfn - handle CPU/memory hotunplug for a cpuset
   *
@@ -2303,8 +2362,10 @@ static void cpuset_hotplug_workfn(struct work_struct *work)
         }
  
         /* rebuild sched domains if cpus_allowed has changed */
-       if (cpus_updated)
+       if (cpus_updated || force_rebuild) {
+               force_rebuild = false;
                 rebuild_sched_domains();
+       }
  }
  
  void cpuset_update_active_cpus(bool cpu_online)
@@ -2323,6 +2384,11 @@ void cpuset_update_active_cpus(bool cpu_online)
         schedule_work(&cpuset_hotplug_work);
  }
  
+void cpuset_wait_for_hotplug(void)
+{
+       flush_work(&cpuset_hotplug_work);       /* wait for pending cpuset_hotplug_work to complete */
+}
+
  /*
   * Keep top_cpuset.mems_allowed tracking node_states[N_MEMORY].
   * Call this routine anytime after node_states[N_MEMORY] changes.
@@ -2355,6 +2421,9 @@ void __init cpuset_init_smp(void)
         top_cpuset.effective_mems = node_states[N_MEMORY];
  
         register_hotmemory_notifier(&cpuset_track_online_nodes_nb);
+
+       cpuset_migrate_mm_wq = alloc_ordered_workqueue("cpuset_migrate_mm", 0);
+       BUG_ON(!cpuset_migrate_mm_wq);
  }
  
  /**