Merge 4.14.22 into android-4.14
[GitHub: LineageOS/android_kernel_motorola_exynos9610.git]
diff --git a/drivers/android/binder.c b/drivers/android/binder.c
index fddf76ef5bd6d824e2017fedb9110418b45270de..ac976864b3d1401cd89ea5628f589d510e7a5832 100644
--- a/drivers/android/binder.c
+++ b/drivers/android/binder.c
@@ -77,6 +77,7 @@
 #endif
 
 #include <uapi/linux/android/binder.h>
+#include <uapi/linux/sched/types.h>
 #include "binder_alloc.h"
 #include "binder_trace.h"
 
@@ -351,10 +352,14 @@ struct binder_error {
  *                        and by @lock)
  * @has_async_transaction: async transaction to node in progress
  *                        (protected by @lock)
+ * @sched_policy:         minimum scheduling policy for node
+ *                        (invariant after initialized)
  * @accept_fds:           file descriptor operations supported for node
  *                        (invariant after initialized)
  * @min_priority:         minimum scheduling priority
  *                        (invariant after initialized)
+ * @inherit_rt:           inherit RT scheduling policy from caller
+ *                        (invariant after initialized)
  * @async_todo:           list of async work items
  *                        (protected by @proc->inner_lock)
  *
@@ -390,6 +395,8 @@ struct binder_node {
                /*
                 * invariant after initialization
                 */
+               u8 sched_policy:2;
+               u8 inherit_rt:1;
                u8 accept_fds:1;
                u8 min_priority;
        };
@@ -463,6 +470,22 @@ enum binder_deferred_state {
        BINDER_DEFERRED_RELEASE      = 0x04,
 };
 
+/**
+ * struct binder_priority - scheduler policy and priority
+ * @sched_policy:           scheduler policy
+ * @prio:                   [100..139] for SCHED_NORMAL, [0..99] for FIFO/RT
+ *
+ * The binder driver supports inheriting the following scheduler policies:
+ * SCHED_NORMAL
+ * SCHED_BATCH
+ * SCHED_FIFO
+ * SCHED_RR
+ */
+struct binder_priority {
+       unsigned int sched_policy;
+       int prio;
+};
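To make the @prio ranges documented above concrete, here is a small illustration (not part of the patch). It relies only on the kernel's existing NICE_TO_PRIO()/MAX_USER_RT_PRIO definitions; lower kernel prio values always mean higher scheduling priority.

    /*
     * SCHED_NORMAL, nice -20  ->  prio 100   (NICE_TO_PRIO(-20))
     * SCHED_NORMAL, nice   0  ->  prio 120   (NICE_TO_PRIO(0), the default)
     * SCHED_NORMAL, nice  19  ->  prio 139   (NICE_TO_PRIO(19))
     * SCHED_FIFO,   rtprio  1 ->  prio  98   (MAX_USER_RT_PRIO - 1 - 1)
     * SCHED_FIFO,   rtprio 99 ->  prio   0   (highest possible priority)
     */
    struct binder_priority default_fair = {
            .sched_policy = SCHED_NORMAL,
            .prio         = NICE_TO_PRIO(0),            /* 120 */
    };
    struct binder_priority mid_rt = {
            .sched_policy = SCHED_FIFO,
            .prio         = MAX_USER_RT_PRIO - 1 - 50,  /* rtprio 50 -> 49 */
    };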
+
 /**
  * struct binder_proc - binder process bookkeeping
  * @proc_node:            element for binder_procs list
@@ -482,7 +505,8 @@ enum binder_deferred_state {
  * @tsk                   task_struct for group_leader of process
  *                        (invariant after initialized)
  * @files                 files_struct for process
- *                        (invariant after initialized)
+ *                        (protected by @files_lock)
+ * @files_lock            mutex to protect @files
  * @deferred_work_node:   element for binder_deferred_list
  *                        (protected by binder_deferred_lock)
  * @deferred_work:        bitmap of deferred work to perform
@@ -492,8 +516,6 @@ enum binder_deferred_state {
  *                        (protected by @inner_lock)
  * @todo:                 list of work for this process
  *                        (protected by @inner_lock)
- * @wait:                 wait queue head to wait for proc work
- *                        (invariant after initialized)
  * @stats:                per-process binder statistics
  *                        (atomics, no lock needed)
  * @delivered_death:      list of delivered death notification
@@ -530,19 +552,19 @@ struct binder_proc {
        int pid;
        struct task_struct *tsk;
        struct files_struct *files;
+       struct mutex files_lock;
        struct hlist_node deferred_work_node;
        int deferred_work;
        bool is_dead;
 
        struct list_head todo;
-       wait_queue_head_t wait;
        struct binder_stats stats;
        struct list_head delivered_death;
        int max_threads;
        int requested_threads;
        int requested_threads_started;
        int tmp_ref;
-       long default_priority;
+       struct binder_priority default_priority;
        struct dentry *debugfs_entry;
        struct binder_alloc alloc;
        struct binder_context *context;
@@ -577,6 +599,8 @@ enum {
  *                        (protected by @proc->inner_lock)
  * @todo:                 list of work to do for this thread
  *                        (protected by @proc->inner_lock)
+ * @process_todo:         whether work in @todo should be processed
+ *                        (protected by @proc->inner_lock)
  * @return_error:         transaction errors reported by this thread
  *                        (only accessed by this thread)
  * @reply_error:          transaction errors reported by target thread
@@ -590,6 +614,7 @@ enum {
  * @is_dead:              thread is dead and awaiting free
  *                        when outstanding transactions are cleaned up
  *                        (protected by @proc->inner_lock)
+ * @task:                 struct task_struct for this thread
  *
  * Bookkeeping structure for binder threads.
  */
@@ -602,12 +627,14 @@ struct binder_thread {
        bool looper_need_return; /* can be written by other thread */
        struct binder_transaction *transaction_stack;
        struct list_head todo;
+       bool process_todo;
        struct binder_error return_error;
        struct binder_error reply_error;
        wait_queue_head_t wait;
        struct binder_stats stats;
        atomic_t tmp_ref;
        bool is_dead;
+       struct task_struct *task;
 };
 
 struct binder_transaction {
@@ -624,8 +651,9 @@ struct binder_transaction {
        struct binder_buffer *buffer;
        unsigned int    code;
        unsigned int    flags;
-       long    priority;
-       long    saved_priority;
+       struct binder_priority  priority;
+       struct binder_priority  saved_priority;
+       bool    set_priority_called;
        kuid_t  sender_euid;
        /**
         * @lock:  protects @from, @to_proc, and @to_thread
@@ -787,6 +815,16 @@ static bool binder_worklist_empty(struct binder_proc *proc,
        return ret;
 }
 
+/**
+ * binder_enqueue_work_ilocked() - Add an item to the work list
+ * @work:         struct binder_work to add to list
+ * @target_list:  list to add work to
+ *
+ * Adds the work to the specified list. Asserts that work
+ * is not already on a list.
+ *
+ * Requires the proc->inner_lock to be held.
+ */
 static void
 binder_enqueue_work_ilocked(struct binder_work *work,
                           struct list_head *target_list)
@@ -797,22 +835,56 @@ binder_enqueue_work_ilocked(struct binder_work *work,
 }
 
 /**
- * binder_enqueue_work() - Add an item to the work list
- * @proc:         binder_proc associated with list
+ * binder_enqueue_deferred_thread_work_ilocked() - Add deferred thread work
+ * @thread:       thread to queue work to
  * @work:         struct binder_work to add to list
- * @target_list:  list to add work to
  *
- * Adds the work to the specified list. Asserts that work
- * is not already on a list.
+ * Adds the work to the todo list of the thread. Doesn't set the process_todo
+ * flag, which means that (if it wasn't already set) the thread will go to
+ * sleep without handling this work when it calls read.
+ *
+ * Requires the proc->inner_lock to be held.
  */
 static void
-binder_enqueue_work(struct binder_proc *proc,
-                   struct binder_work *work,
-                   struct list_head *target_list)
+binder_enqueue_deferred_thread_work_ilocked(struct binder_thread *thread,
+                                           struct binder_work *work)
 {
-       binder_inner_proc_lock(proc);
-       binder_enqueue_work_ilocked(work, target_list);
-       binder_inner_proc_unlock(proc);
+       binder_enqueue_work_ilocked(work, &thread->todo);
+}
+
+/**
+ * binder_enqueue_thread_work_ilocked() - Add an item to the thread work list
+ * @thread:       thread to queue work to
+ * @work:         struct binder_work to add to list
+ *
+ * Adds the work to the todo list of the thread, and enables processing
+ * of the todo queue.
+ *
+ * Requires the proc->inner_lock to be held.
+ */
+static void
+binder_enqueue_thread_work_ilocked(struct binder_thread *thread,
+                                  struct binder_work *work)
+{
+       binder_enqueue_work_ilocked(work, &thread->todo);
+       thread->process_todo = true;
+}
+
+/**
+ * binder_enqueue_thread_work() - Add an item to the thread work list
+ * @thread:       thread to queue work to
+ * @work:         struct binder_work to add to list
+ *
+ * Adds the work to the todo list of the thread, and enables processing
+ * of the todo queue.
+ */
+static void
+binder_enqueue_thread_work(struct binder_thread *thread,
+                          struct binder_work *work)
+{
+       binder_inner_proc_lock(thread->proc);
+       binder_enqueue_thread_work_ilocked(thread, work);
+       binder_inner_proc_unlock(thread->proc);
 }
 
 static void
@@ -877,20 +949,26 @@ static void binder_inc_node_tmpref_ilocked(struct binder_node *node);
 
 static int task_get_unused_fd_flags(struct binder_proc *proc, int flags)
 {
-       struct files_struct *files = proc->files;
        unsigned long rlim_cur;
        unsigned long irqs;
+       int ret;
 
-       if (files == NULL)
-               return -ESRCH;
-
-       if (!lock_task_sighand(proc->tsk, &irqs))
-               return -EMFILE;
-
+       mutex_lock(&proc->files_lock);
+       if (proc->files == NULL) {
+               ret = -ESRCH;
+               goto err;
+       }
+       if (!lock_task_sighand(proc->tsk, &irqs)) {
+               ret = -EMFILE;
+               goto err;
+       }
        rlim_cur = task_rlimit(proc->tsk, RLIMIT_NOFILE);
        unlock_task_sighand(proc->tsk, &irqs);
 
-       return __alloc_fd(files, 0, rlim_cur, flags);
+       ret = __alloc_fd(proc->files, 0, rlim_cur, flags);
+err:
+       mutex_unlock(&proc->files_lock);
+       return ret;
 }
 
 /*
@@ -899,8 +977,10 @@ static int task_get_unused_fd_flags(struct binder_proc *proc, int flags)
 static void task_fd_install(
        struct binder_proc *proc, unsigned int fd, struct file *file)
 {
+       mutex_lock(&proc->files_lock);
        if (proc->files)
                __fd_install(proc->files, fd, file);
+       mutex_unlock(&proc->files_lock);
 }
 
 /*
@@ -910,9 +990,11 @@ static long task_close_fd(struct binder_proc *proc, unsigned int fd)
 {
        int retval;
 
-       if (proc->files == NULL)
-               return -ESRCH;
-
+       mutex_lock(&proc->files_lock);
+       if (proc->files == NULL) {
+               retval = -ESRCH;
+               goto err;
+       }
        retval = __close_fd(proc->files, fd);
        /* can't restart close syscall because file table entry was cleared */
        if (unlikely(retval == -ERESTARTSYS ||
@@ -920,14 +1002,15 @@ static long task_close_fd(struct binder_proc *proc, unsigned int fd)
                     retval == -ERESTARTNOHAND ||
                     retval == -ERESTART_RESTARTBLOCK))
                retval = -EINTR;
-
+err:
+       mutex_unlock(&proc->files_lock);
        return retval;
 }
 
 static bool binder_has_work_ilocked(struct binder_thread *thread,
                                    bool do_proc_work)
 {
-       return !binder_worklist_empty_ilocked(&thread->todo) ||
+       return thread->process_todo ||
                thread->looper_need_return ||
                (do_proc_work &&
                 !binder_worklist_empty_ilocked(&thread->proc->todo));
@@ -1051,22 +1134,145 @@ static void binder_wakeup_proc_ilocked(struct binder_proc *proc)
        binder_wakeup_thread_ilocked(proc, thread, /* sync = */false);
 }
 
-static void binder_set_nice(long nice)
+static bool is_rt_policy(int policy)
 {
-       long min_nice;
+       return policy == SCHED_FIFO || policy == SCHED_RR;
+}
 
-       if (can_nice(current, nice)) {
-               set_user_nice(current, nice);
+static bool is_fair_policy(int policy)
+{
+       return policy == SCHED_NORMAL || policy == SCHED_BATCH;
+}
+
+static bool binder_supported_policy(int policy)
+{
+       return is_fair_policy(policy) || is_rt_policy(policy);
+}
+
+static int to_userspace_prio(int policy, int kernel_priority)
+{
+       if (is_fair_policy(policy))
+               return PRIO_TO_NICE(kernel_priority);
+       else
+               return MAX_USER_RT_PRIO - 1 - kernel_priority;
+}
+
+static int to_kernel_prio(int policy, int user_priority)
+{
+       if (is_fair_policy(policy))
+               return NICE_TO_PRIO(user_priority);
+       else
+               return MAX_USER_RT_PRIO - 1 - user_priority;
+}
+
+static void binder_do_set_priority(struct task_struct *task,
+                                  struct binder_priority desired,
+                                  bool verify)
+{
+       int priority; /* user-space prio value */
+       bool has_cap_nice;
+       unsigned int policy = desired.sched_policy;
+
+       if (task->policy == policy && task->normal_prio == desired.prio)
                return;
+
+       has_cap_nice = has_capability_noaudit(task, CAP_SYS_NICE);
+
+       priority = to_userspace_prio(policy, desired.prio);
+
+       if (verify && is_rt_policy(policy) && !has_cap_nice) {
+               long max_rtprio = task_rlimit(task, RLIMIT_RTPRIO);
+
+               if (max_rtprio == 0) {
+                       policy = SCHED_NORMAL;
+                       priority = MIN_NICE;
+               } else if (priority > max_rtprio) {
+                       priority = max_rtprio;
+               }
+       }
+
+       if (verify && is_fair_policy(policy) && !has_cap_nice) {
+               long min_nice = rlimit_to_nice(task_rlimit(task, RLIMIT_NICE));
+
+               if (min_nice > MAX_NICE) {
+                       binder_user_error("%d RLIMIT_NICE not set\n",
+                                         task->pid);
+                       return;
+               } else if (priority < min_nice) {
+                       priority = min_nice;
+               }
+       }
+
+       if (policy != desired.sched_policy ||
+           to_kernel_prio(policy, priority) != desired.prio)
+               binder_debug(BINDER_DEBUG_PRIORITY_CAP,
+                            "%d: priority %d not allowed, using %d instead\n",
+                             task->pid, desired.prio,
+                             to_kernel_prio(policy, priority));
+
+       trace_binder_set_priority(task->tgid, task->pid, task->normal_prio,
+                                 to_kernel_prio(policy, priority),
+                                 desired.prio);
+
+       /* Set the actual priority */
+       if (task->policy != policy || is_rt_policy(policy)) {
+               struct sched_param params;
+
+               params.sched_priority = is_rt_policy(policy) ? priority : 0;
+
+               sched_setscheduler_nocheck(task,
+                                          policy | SCHED_RESET_ON_FORK,
+                                          &params);
        }
-       min_nice = rlimit_to_nice(rlimit(RLIMIT_NICE));
-       binder_debug(BINDER_DEBUG_PRIORITY_CAP,
-                    "%d: nice value %ld not allowed use %ld instead\n",
-                     current->pid, nice, min_nice);
-       set_user_nice(current, min_nice);
-       if (min_nice <= MAX_NICE)
+       if (is_fair_policy(policy))
+               set_user_nice(task, priority);
+}
+
+static void binder_set_priority(struct task_struct *task,
+                               struct binder_priority desired)
+{
+       binder_do_set_priority(task, desired, /* verify = */ true);
+}
+
+static void binder_restore_priority(struct task_struct *task,
+                                   struct binder_priority desired)
+{
+       binder_do_set_priority(task, desired, /* verify = */ false);
+}
+
+static void binder_transaction_priority(struct task_struct *task,
+                                       struct binder_transaction *t,
+                                       struct binder_priority node_prio,
+                                       bool inherit_rt)
+{
+       struct binder_priority desired_prio = t->priority;
+
+       if (t->set_priority_called)
                return;
-       binder_user_error("%d RLIMIT_NICE not set\n", current->pid);
+
+       t->set_priority_called = true;
+       t->saved_priority.sched_policy = task->policy;
+       t->saved_priority.prio = task->normal_prio;
+
+       if (!inherit_rt && is_rt_policy(desired_prio.sched_policy)) {
+               desired_prio.prio = NICE_TO_PRIO(0);
+               desired_prio.sched_policy = SCHED_NORMAL;
+       }
+
+       if (node_prio.prio < t->priority.prio ||
+           (node_prio.prio == t->priority.prio &&
+            node_prio.sched_policy == SCHED_FIFO)) {
+               /*
+                * In case the minimum priority on the node is
+                * higher (lower value), use that priority. If
+                * the priority is the same, but the node uses
+                * SCHED_FIFO, prefer SCHED_FIFO, since it can
+                * run unbounded, unlike SCHED_RR.
+                */
+               desired_prio = node_prio;
+       }
+
+       binder_set_priority(task, desired_prio);
 }
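A short worked example (illustrative only, not part of the patch) ties the selection in binder_transaction_priority() to the capping in binder_do_set_priority():

    /*
     * Caller thread:  SCHED_FIFO, rtprio 10   ->  t->priority = {SCHED_FIFO, 89}
     * Target node:    min nice 0, !inherit_rt ->  node_prio   = {SCHED_NORMAL, 120}
     *
     * 1. inherit_rt is false and the desired policy is RT, so the request is
     *    demoted to {SCHED_NORMAL, NICE_TO_PRIO(0)} = {SCHED_NORMAL, 120}.
     * 2. node_prio.prio (120) is not lower than t->priority.prio (89), so the
     *    node minimum does not override the demoted priority.
     * 3. binder_set_priority() then verifies the result on the target task:
     *    without CAP_SYS_NICE the nice value is clamped against RLIMIT_NICE,
     *    and an RT request would be clamped against RLIMIT_RTPRIO (falling
     *    back to SCHED_NORMAL at MIN_NICE when that limit is 0).
     */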
 
 static struct binder_node *binder_get_node_ilocked(struct binder_proc *proc,
@@ -1119,6 +1325,7 @@ static struct binder_node *binder_init_node_ilocked(
        binder_uintptr_t ptr = fp ? fp->binder : 0;
        binder_uintptr_t cookie = fp ? fp->cookie : 0;
        __u32 flags = fp ? fp->flags : 0;
+       s8 priority;
 
        assert_spin_locked(&proc->inner_lock);
 
@@ -1151,8 +1358,12 @@ static struct binder_node *binder_init_node_ilocked(
        node->ptr = ptr;
        node->cookie = cookie;
        node->work.type = BINDER_WORK_NODE;
-       node->min_priority = flags & FLAT_BINDER_FLAG_PRIORITY_MASK;
+       priority = flags & FLAT_BINDER_FLAG_PRIORITY_MASK;
+       node->sched_policy = (flags & FLAT_BINDER_FLAG_SCHED_POLICY_MASK) >>
+               FLAT_BINDER_FLAG_SCHED_POLICY_SHIFT;
+       node->min_priority = to_kernel_prio(node->sched_policy, priority);
        node->accept_fds = !!(flags & FLAT_BINDER_FLAG_ACCEPTS_FDS);
+       node->inherit_rt = !!(flags & FLAT_BINDER_FLAG_INHERIT_RT);
        spin_lock_init(&node->lock);
        INIT_LIST_HEAD(&node->work.entry);
        INIT_LIST_HEAD(&node->async_todo);
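For reference, here is an illustrative user-space side (not part of the patch) of how a server could encode the fields decoded above into flat_binder_object.flags. This assumes the matching uapi/linux/android/binder.h change from this series, which defines FLAT_BINDER_FLAG_SCHED_POLICY_SHIFT/_MASK and FLAT_BINDER_FLAG_INHERIT_RT; the object address (0x1000) is made up.

    #include <sched.h>                      /* SCHED_FIFO */
    #include <linux/android/binder.h>

    struct flat_binder_object obj = {
            .hdr.type = BINDER_TYPE_BINDER,
            .flags    = 10                  /* minimum priority: rtprio 10 */
                      | (SCHED_FIFO << FLAT_BINDER_FLAG_SCHED_POLICY_SHIFT)
                      | FLAT_BINDER_FLAG_INHERIT_RT
                      | FLAT_BINDER_FLAG_ACCEPTS_FDS,
            .binder   = (binder_uintptr_t)0x1000,   /* made-up local object */
            .cookie   = 0,
    };
    /* binder_init_node_ilocked() would then store sched_policy = SCHED_FIFO,
     * min_priority = to_kernel_prio(SCHED_FIFO, 10) = 89, inherit_rt = 1. */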
@@ -1215,6 +1426,17 @@ static int binder_inc_node_nilocked(struct binder_node *node, int strong,
                        node->local_strong_refs++;
                if (!node->has_strong_ref && target_list) {
                        binder_dequeue_work_ilocked(&node->work);
+                       /*
+                        * Note: this function is the only place where we queue
+                        * directly to a thread->todo without using the
+                        * corresponding binder_enqueue_thread_work() helper
+                        * functions; in this case it's ok to not set the
+                        * process_todo flag, since we know this node work will
+                        * always be followed by other work that starts queue
+                        * processing: in case of synchronous transactions, a
+                        * BR_REPLY or BR_ERROR; in case of oneway
+                        * transactions, a BR_TRANSACTION_COMPLETE.
+                        */
                        binder_enqueue_work_ilocked(&node->work, target_list);
                }
        } else {
@@ -1226,6 +1448,9 @@ static int binder_inc_node_nilocked(struct binder_node *node, int strong,
                                        node->debug_id);
                                return -EINVAL;
                        }
+                       /*
+                        * See comment above
+                        */
                        binder_enqueue_work_ilocked(&node->work, target_list);
                }
        }
@@ -1915,13 +2140,19 @@ static void binder_send_failed_reply(struct binder_transaction *t,
                        binder_pop_transaction_ilocked(target_thread, t);
                        if (target_thread->reply_error.cmd == BR_OK) {
                                target_thread->reply_error.cmd = error_code;
-                               binder_enqueue_work_ilocked(
-                                       &target_thread->reply_error.work,
-                                       &target_thread->todo);
+                               binder_enqueue_thread_work_ilocked(
+                                       target_thread,
+                                       &target_thread->reply_error.work);
                                wake_up_interruptible(&target_thread->wait);
                        } else {
-                               WARN(1, "Unexpected reply error: %u\n",
-                                               target_thread->reply_error.cmd);
+                               /*
+                                * Cannot get here for normal operation, but
+                                * we can if multiple synchronous transactions
+                                * are sent without blocking for responses.
+                                * Just ignore the 2nd error in this case.
+                                */
+                               pr_warn("Unexpected reply error: %u\n",
+                                       target_thread->reply_error.cmd);
                        }
                        binder_inner_proc_unlock(target_thread->proc);
                        binder_thread_dec_tmpref(target_thread);
@@ -1947,6 +2178,26 @@ static void binder_send_failed_reply(struct binder_transaction *t,
        }
 }
 
+/**
+ * binder_cleanup_transaction() - cleans up undelivered transaction
+ * @t:         transaction that needs to be cleaned up
+ * @reason:    reason the transaction wasn't delivered
+ * @error_code:        error to return to caller (if synchronous call)
+ */
+static void binder_cleanup_transaction(struct binder_transaction *t,
+                                      const char *reason,
+                                      uint32_t error_code)
+{
+       if (t->buffer->target_node && !(t->flags & TF_ONE_WAY)) {
+               binder_send_failed_reply(t, error_code);
+       } else {
+               binder_debug(BINDER_DEBUG_DEAD_TRANSACTION,
+                       "undelivered transaction %d, %s\n",
+                       t->debug_id, reason);
+               binder_free_transaction(t);
+       }
+}
+
 /**
  * binder_validate_object() - checks for a valid metadata object in a buffer.
  * @buffer:    binder_buffer that we're parsing.
@@ -2102,7 +2353,7 @@ static void binder_transaction_buffer_release(struct binder_proc *proc,
        int debug_id = buffer->debug_id;
 
        binder_debug(BINDER_DEBUG_TRANSACTION,
-                    "%d buffer release %d, size %zd-%zd, failed at %p\n",
+                    "%d buffer release %d, size %zd-%zd, failed at %pK\n",
                     proc->pid, buffer->debug_id,
                     buffer->data_size, buffer->offsets_size, failed_at);
 
@@ -2536,18 +2787,20 @@ static bool binder_proc_transaction(struct binder_transaction *t,
                                    struct binder_proc *proc,
                                    struct binder_thread *thread)
 {
-       struct list_head *target_list = NULL;
        struct binder_node *node = t->buffer->target_node;
+       struct binder_priority node_prio;
        bool oneway = !!(t->flags & TF_ONE_WAY);
-       bool wakeup = true;
+       bool pending_async = false;
 
        BUG_ON(!node);
        binder_node_lock(node);
+       node_prio.prio = node->min_priority;
+       node_prio.sched_policy = node->sched_policy;
+
        if (oneway) {
                BUG_ON(thread);
                if (node->has_async_transaction) {
-                       target_list = &node->async_todo;
-                       wakeup = false;
+                       pending_async = true;
                } else {
                        node->has_async_transaction = 1;
                }
@@ -2561,19 +2814,20 @@ static bool binder_proc_transaction(struct binder_transaction *t,
                return false;
        }
 
-       if (!thread && !target_list)
+       if (!thread && !pending_async)
                thread = binder_select_thread_ilocked(proc);
 
-       if (thread)
-               target_list = &thread->todo;
-       else if (!target_list)
-               target_list = &proc->todo;
-       else
-               BUG_ON(target_list != &node->async_todo);
-
-       binder_enqueue_work_ilocked(&t->work, target_list);
+       if (thread) {
+               binder_transaction_priority(thread->task, t, node_prio,
+                                           node->inherit_rt);
+               binder_enqueue_thread_work_ilocked(thread, &t->work);
+       } else if (!pending_async) {
+               binder_enqueue_work_ilocked(&t->work, &proc->todo);
+       } else {
+               binder_enqueue_work_ilocked(&t->work, &node->async_todo);
+       }
 
-       if (wakeup)
+       if (!pending_async)
                binder_wakeup_thread_ilocked(proc, thread, !oneway /* sync */);
 
        binder_inner_proc_unlock(proc);
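The routing above can be summarized in a minimal sketch (not part of the patch); pick_queue() is a hypothetical helper that only mirrors where binder_proc_transaction() queues the work once the node and inner proc locks are held.

    enum binder_queue_target { QUEUE_THREAD, QUEUE_PROC, QUEUE_NODE_ASYNC };

    static enum binder_queue_target pick_queue(bool have_thread, bool pending_async)
    {
            if (have_thread)                /* sync txn, or an idle looper was found */
                    return QUEUE_THREAD;    /* inherit priority, wake that thread */
            if (!pending_async)
                    return QUEUE_PROC;      /* wake any thread waiting for proc work */
            return QUEUE_NODE_ASYNC;        /* serialized behind an earlier async txn */
    }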
@@ -2688,7 +2942,6 @@ static void binder_transaction(struct binder_proc *proc,
                }
                thread->transaction_stack = in_reply_to->to_parent;
                binder_inner_proc_unlock(proc);
-               binder_set_nice(in_reply_to->saved_priority);
                target_thread = binder_get_txn_from_and_acq_inner(in_reply_to);
                if (target_thread == NULL) {
                        return_error = BR_DEAD_REPLY;
@@ -2853,7 +3106,15 @@ static void binder_transaction(struct binder_proc *proc,
        t->to_thread = target_thread;
        t->code = tr->code;
        t->flags = tr->flags;
-       t->priority = task_nice(current);
+       if (!(t->flags & TF_ONE_WAY) &&
+           binder_supported_policy(current->policy)) {
+               /* Inherit supported policies for synchronous transactions */
+               t->priority.sched_policy = current->policy;
+               t->priority.prio = current->normal_prio;
+       } else {
+               /* Otherwise, fall back to the default priority */
+               t->priority = target_proc->default_priority;
+       }
 
        trace_binder_transaction(reply, t, target_node);
 
@@ -3068,10 +3329,10 @@ static void binder_transaction(struct binder_proc *proc,
                }
        }
        tcomplete->type = BINDER_WORK_TRANSACTION_COMPLETE;
-       binder_enqueue_work(proc, tcomplete, &thread->todo);
        t->work.type = BINDER_WORK_TRANSACTION;
 
        if (reply) {
+               binder_enqueue_thread_work(thread, tcomplete);
                binder_inner_proc_lock(target_proc);
                if (target_thread->is_dead) {
                        binder_inner_proc_unlock(target_proc);
@@ -3079,13 +3340,22 @@ static void binder_transaction(struct binder_proc *proc,
                }
                BUG_ON(t->buffer->async_transaction != 0);
                binder_pop_transaction_ilocked(target_thread, in_reply_to);
-               binder_enqueue_work_ilocked(&t->work, &target_thread->todo);
+               binder_enqueue_thread_work_ilocked(target_thread, &t->work);
                binder_inner_proc_unlock(target_proc);
                wake_up_interruptible_sync(&target_thread->wait);
+               binder_restore_priority(current, in_reply_to->saved_priority);
                binder_free_transaction(in_reply_to);
        } else if (!(t->flags & TF_ONE_WAY)) {
                BUG_ON(t->buffer->async_transaction != 0);
                binder_inner_proc_lock(proc);
+               /*
+                * Defer the TRANSACTION_COMPLETE, so we don't return to
+                * userspace immediately; this allows the target process to
+                * immediately start processing this transaction, reducing
+                * latency. We will then return the TRANSACTION_COMPLETE when
+                * the target replies (or there is an error).
+                */
+               binder_enqueue_deferred_thread_work_ilocked(thread, tcomplete);
                t->need_reply = 1;
                t->from_parent = thread->transaction_stack;
                thread->transaction_stack = t;
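One user-visible consequence of the deferral (illustrative only, not part of the patch): a synchronous caller's BR_TRANSACTION_COMPLETE is now typically delivered in the same BINDER_WRITE_READ buffer as the BR_REPLY, so a user-space read loop must handle multiple return commands per wakeup, along these lines:

    #include <stdint.h>
    #include <string.h>
    #include <linux/android/binder.h>

    static void drain_read_buffer(const char *buf, size_t consumed)
    {
            size_t off = 0;

            while (off + sizeof(uint32_t) <= consumed) {
                    uint32_t cmd;

                    memcpy(&cmd, buf + off, sizeof(cmd));
                    off += sizeof(cmd);

                    switch (cmd) {
                    case BR_NOOP:
                    case BR_TRANSACTION_COMPLETE:   /* may arrive with the reply */
                            break;
                    case BR_REPLY: {
                            struct binder_transaction_data tr;

                            memcpy(&tr, buf + off, sizeof(tr));
                            off += sizeof(tr);
                            /* hand tr off to the caller waiting for this reply */
                            break;
                    }
                    default:
                            return; /* other commands elided in this sketch */
                    }
            }
    }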
@@ -3099,6 +3369,7 @@ static void binder_transaction(struct binder_proc *proc,
        } else {
                BUG_ON(target_node == NULL);
                BUG_ON(t->buffer->async_transaction != 1);
+               binder_enqueue_thread_work(thread, tcomplete);
                if (!binder_proc_transaction(t, target_proc, NULL))
                        goto err_dead_proc_or_thread;
        }
@@ -3176,16 +3447,13 @@ err_invalid_target_handle:
 
        BUG_ON(thread->return_error.cmd != BR_OK);
        if (in_reply_to) {
+               binder_restore_priority(current, in_reply_to->saved_priority);
                thread->return_error.cmd = BR_TRANSACTION_COMPLETE;
-               binder_enqueue_work(thread->proc,
-                                   &thread->return_error.work,
-                                   &thread->todo);
+               binder_enqueue_thread_work(thread, &thread->return_error.work);
                binder_send_failed_reply(in_reply_to, return_error);
        } else {
                thread->return_error.cmd = return_error;
-               binder_enqueue_work(thread->proc,
-                                   &thread->return_error.work,
-                                   &thread->todo);
+               binder_enqueue_thread_work(thread, &thread->return_error.work);
        }
 }
 
@@ -3489,10 +3757,9 @@ static int binder_thread_write(struct binder_proc *proc,
                                        WARN_ON(thread->return_error.cmd !=
                                                BR_OK);
                                        thread->return_error.cmd = BR_ERROR;
-                                       binder_enqueue_work(
-                                               thread->proc,
-                                               &thread->return_error.work,
-                                               &thread->todo);
+                                       binder_enqueue_thread_work(
+                                               thread,
+                                               &thread->return_error.work);
                                        binder_debug(
                                                BINDER_DEBUG_FAILED_TRANSACTION,
                                                "%d:%d BC_REQUEST_DEATH_NOTIFICATION failed\n",
@@ -3572,9 +3839,9 @@ static int binder_thread_write(struct binder_proc *proc,
                                        if (thread->looper &
                                            (BINDER_LOOPER_STATE_REGISTERED |
                                             BINDER_LOOPER_STATE_ENTERED))
-                                               binder_enqueue_work_ilocked(
-                                                               &death->work,
-                                                               &thread->todo);
+                                               binder_enqueue_thread_work_ilocked(
+                                                               thread,
+                                                               &death->work);
                                        else {
                                                binder_enqueue_work_ilocked(
                                                                &death->work,
@@ -3614,7 +3881,7 @@ static int binder_thread_write(struct binder_proc *proc,
                                }
                        }
                        binder_debug(BINDER_DEBUG_DEAD_BINDER,
-                                    "%d:%d BC_DEAD_BINDER_DONE %016llx found %p\n",
+                                    "%d:%d BC_DEAD_BINDER_DONE %016llx found %pK\n",
                                     proc->pid, thread->pid, (u64)cookie,
                                     death);
                        if (death == NULL) {
@@ -3629,8 +3896,8 @@ static int binder_thread_write(struct binder_proc *proc,
                                if (thread->looper &
                                        (BINDER_LOOPER_STATE_REGISTERED |
                                         BINDER_LOOPER_STATE_ENTERED))
-                                       binder_enqueue_work_ilocked(
-                                               &death->work, &thread->todo);
+                                       binder_enqueue_thread_work_ilocked(
+                                               thread, &death->work);
                                else {
                                        binder_enqueue_work_ilocked(
                                                        &death->work,
@@ -3761,7 +4028,7 @@ retry:
                        wait_event_interruptible(binder_user_error_wait,
                                                 binder_stop_on_user_error < 2);
                }
-               binder_set_nice(proc->default_priority);
+               binder_restore_priority(current, proc->default_priority);
        }
 
        if (non_block) {
@@ -3804,6 +4071,8 @@ retry:
                        break;
                }
                w = binder_dequeue_work_head_ilocked(list);
+               if (binder_worklist_empty_ilocked(&thread->todo))
+                       thread->process_todo = false;
 
                switch (w->type) {
                case BINDER_WORK_TRANSACTION: {
@@ -3973,16 +4242,14 @@ retry:
                BUG_ON(t->buffer == NULL);
                if (t->buffer->target_node) {
                        struct binder_node *target_node = t->buffer->target_node;
+                       struct binder_priority node_prio;
 
                        tr.target.ptr = target_node->ptr;
                        tr.cookie =  target_node->cookie;
-                       t->saved_priority = task_nice(current);
-                       if (t->priority < target_node->min_priority &&
-                           !(t->flags & TF_ONE_WAY))
-                               binder_set_nice(t->priority);
-                       else if (!(t->flags & TF_ONE_WAY) ||
-                                t->saved_priority > target_node->min_priority)
-                               binder_set_nice(target_node->min_priority);
+                       node_prio.sched_policy = target_node->sched_policy;
+                       node_prio.prio = target_node->min_priority;
+                       binder_transaction_priority(current, t, node_prio,
+                                                   target_node->inherit_rt);
                        cmd = BR_TRANSACTION;
                } else {
                        tr.target.ptr = 0;
@@ -4015,12 +4282,20 @@ retry:
                if (put_user(cmd, (uint32_t __user *)ptr)) {
                        if (t_from)
                                binder_thread_dec_tmpref(t_from);
+
+                       binder_cleanup_transaction(t, "put_user failed",
+                                                  BR_FAILED_REPLY);
+
                        return -EFAULT;
                }
                ptr += sizeof(uint32_t);
                if (copy_to_user(ptr, &tr, sizeof(tr))) {
                        if (t_from)
                                binder_thread_dec_tmpref(t_from);
+
+                       binder_cleanup_transaction(t, "copy_to_user failed",
+                                                  BR_FAILED_REPLY);
+
                        return -EFAULT;
                }
                ptr += sizeof(tr);
@@ -4090,15 +4365,9 @@ static void binder_release_work(struct binder_proc *proc,
                        struct binder_transaction *t;
 
                        t = container_of(w, struct binder_transaction, work);
-                       if (t->buffer->target_node &&
-                           !(t->flags & TF_ONE_WAY)) {
-                               binder_send_failed_reply(t, BR_DEAD_REPLY);
-                       } else {
-                               binder_debug(BINDER_DEBUG_DEAD_TRANSACTION,
-                                       "undelivered transaction %d\n",
-                                       t->debug_id);
-                               binder_free_transaction(t);
-                       }
+
+                       binder_cleanup_transaction(t, "process died.",
+                                                  BR_DEAD_REPLY);
                } break;
                case BINDER_WORK_RETURN_ERROR: {
                        struct binder_error *e = container_of(
@@ -4158,6 +4427,8 @@ static struct binder_thread *binder_get_thread_ilocked(
        binder_stats_created(BINDER_STAT_THREAD);
        thread->proc = proc;
        thread->pid = current->pid;
+       get_task_struct(current);
+       thread->task = current;
        atomic_set(&thread->tmp_ref, 0);
        init_waitqueue_head(&thread->wait);
        INIT_LIST_HEAD(&thread->todo);
@@ -4208,6 +4479,7 @@ static void binder_free_thread(struct binder_thread *thread)
        BUG_ON(!list_empty(&thread->todo));
        binder_stats_deleted(BINDER_STAT_THREAD);
        binder_proc_dec_tmpref(thread->proc);
+       put_task_struct(thread->task);
        kfree(thread);
 }
 
@@ -4267,8 +4539,29 @@ static int binder_thread_release(struct binder_proc *proc,
                if (t)
                        spin_lock(&t->lock);
        }
+
+       /*
+        * If this thread used poll, make sure we remove the waitqueue
+        * from any epoll data structures holding it with POLLFREE.
+        * waitqueue_active() is safe to use here because we're holding
+        * the inner lock.
+        */
+       if ((thread->looper & BINDER_LOOPER_STATE_POLL) &&
+           waitqueue_active(&thread->wait)) {
+               wake_up_poll(&thread->wait, POLLHUP | POLLFREE);
+       }
+
        binder_inner_proc_unlock(thread->proc);
 
+       /*
+        * This is needed to avoid races between wake_up_poll() above and
+        * ep_remove_waitqueue() called for other reasons (e.g. the epoll file
+        * descriptor being closed); ep_remove_waitqueue() holds an RCU read
+        * lock, so we can be sure it's done after calling synchronize_rcu().
+        */
+       if (thread->looper & BINDER_LOOPER_STATE_POLL)
+               synchronize_rcu();
+
        if (send_reply)
                binder_send_failed_reply(send_reply, BR_DEAD_REPLY);
        binder_release_work(proc, &thread->todo);
@@ -4284,6 +4577,8 @@ static unsigned int binder_poll(struct file *filp,
        bool wait_for_proc_work;
 
        thread = binder_get_thread(proc);
+       if (!thread)
+               return POLLERR;
 
        binder_inner_proc_lock(thread->proc);
        thread->looper |= BINDER_LOOPER_STATE_POLL;
@@ -4605,7 +4900,9 @@ static int binder_mmap(struct file *filp, struct vm_area_struct *vma)
        ret = binder_alloc_mmap_handler(&proc->alloc, vma);
        if (ret)
                return ret;
+       mutex_lock(&proc->files_lock);
        proc->files = get_files_struct(current);
+       mutex_unlock(&proc->files_lock);
        return 0;
 
 err_bad_arg:
@@ -4629,8 +4926,16 @@ static int binder_open(struct inode *nodp, struct file *filp)
        spin_lock_init(&proc->outer_lock);
        get_task_struct(current->group_leader);
        proc->tsk = current->group_leader;
+       mutex_init(&proc->files_lock);
        INIT_LIST_HEAD(&proc->todo);
-       proc->default_priority = task_nice(current);
+       if (binder_supported_policy(current->policy)) {
+               proc->default_priority.sched_policy = current->policy;
+               proc->default_priority.prio = current->normal_prio;
+       } else {
+               proc->default_priority.sched_policy = SCHED_NORMAL;
+               proc->default_priority.prio = NICE_TO_PRIO(0);
+       }
+
        binder_dev = container_of(filp->private_data, struct binder_device,
                                  miscdev);
        proc->context = &binder_dev->context;
@@ -4881,9 +5186,11 @@ static void binder_deferred_func(struct work_struct *work)
 
                files = NULL;
                if (defer & BINDER_DEFERRED_PUT_FILES) {
+                       mutex_lock(&proc->files_lock);
                        files = proc->files;
                        if (files)
                                proc->files = NULL;
+                       mutex_unlock(&proc->files_lock);
                }
 
                if (defer & BINDER_DEFERRED_FLUSH)
@@ -4922,13 +5229,14 @@ static void print_binder_transaction_ilocked(struct seq_file *m,
        spin_lock(&t->lock);
        to_proc = t->to_proc;
        seq_printf(m,
-                  "%s %d: %p from %d:%d to %d:%d code %x flags %x pri %ld r%d",
+                  "%s %d: %pK from %d:%d to %d:%d code %x flags %x pri %d:%d r%d",
                   prefix, t->debug_id, t,
                   t->from ? t->from->proc->pid : 0,
                   t->from ? t->from->pid : 0,
                   to_proc ? to_proc->pid : 0,
                   t->to_thread ? t->to_thread->pid : 0,
-                  t->code, t->flags, t->priority, t->need_reply);
+                  t->code, t->flags, t->priority.sched_policy,
+                  t->priority.prio, t->need_reply);
        spin_unlock(&t->lock);
 
        if (proc != to_proc) {
@@ -4946,7 +5254,7 @@ static void print_binder_transaction_ilocked(struct seq_file *m,
        }
        if (buffer->target_node)
                seq_printf(m, " node %d", buffer->target_node->debug_id);
-       seq_printf(m, " size %zd:%zd data %p\n",
+       seq_printf(m, " size %zd:%zd data %pK\n",
                   buffer->data_size, buffer->offsets_size,
                   buffer->data);
 }
@@ -5046,8 +5354,9 @@ static void print_binder_node_nilocked(struct seq_file *m,
        hlist_for_each_entry(ref, &node->refs, node_entry)
                count++;
 
-       seq_printf(m, "  node %d: u%016llx c%016llx hs %d hw %d ls %d lw %d is %d iw %d tr %d",
+       seq_printf(m, "  node %d: u%016llx c%016llx pri %d:%d hs %d hw %d ls %d lw %d is %d iw %d tr %d",
                   node->debug_id, (u64)node->ptr, (u64)node->cookie,
+                  node->sched_policy, node->min_priority,
                   node->has_strong_ref, node->has_weak_ref,
                   node->local_strong_refs, node->local_weak_refs,
                   node->internal_strong_refs, count, node->tmp_refs);