io_uring: get an active ref_node from files_data

[linux-2.6-microblaze.git] / fs / io_uring.c
diff --git a/fs/io_uring.c b/fs/io_uring.c

index 728f3a3..5cb194c 100644 (file)
--- a/fs/io_uring.c
+++ b/fs/io_uring.c
@@ -478,6 +478,7 @@ struct io_sr_msg {
  struct io_open {
         struct file                     *file;
         int                             dfd;
+       bool                            ignore_nonblock;
         struct filename                 *filename;
         struct open_how                 how;
         unsigned long                   nofile;
@@ -1593,14 +1594,29 @@ static void io_cqring_mark_overflow(struct io_ring_ctx *ctx)
         }
  }
  
-static inline bool io_match_files(struct io_kiocb *req,
-                                      struct files_struct *files)
+static inline bool __io_match_files(struct io_kiocb *req,
+                                   struct files_struct *files)
  {
+       return ((req->flags & REQ_F_WORK_INITIALIZED) &&
+               (req->work.flags & IO_WQ_WORK_FILES)) &&
+               req->work.identity->files == files;
+}
+
+static bool io_match_files(struct io_kiocb *req,
+                          struct files_struct *files)
+{
+       struct io_kiocb *link;
+
         if (!files)
                 return true;
-       if ((req->flags & REQ_F_WORK_INITIALIZED) &&
-           (req->work.flags & IO_WQ_WORK_FILES))
-               return req->work.identity->files == files;
+       if (__io_match_files(req, files))
+               return true;
+       if (req->flags & REQ_F_LINK_HEAD) {
+               list_for_each_entry(link, &req->link_list, link_list) {
+                       if (__io_match_files(link, files))
+                               return true;
+               }
+       }
         return false;
  }
  
@@ -2562,7 +2578,6 @@ static bool io_resubmit_prep(struct io_kiocb *req, int error)
         }
  end_req:
         req_set_fail_links(req);
-       io_req_complete(req, ret);
         return false;
  }
  #endif
@@ -3781,6 +3796,7 @@ static int __io_openat_prep(struct io_kiocb *req, const struct io_uring_sqe *sqe
                 return ret;
         }
         req->open.nofile = rlimit(RLIMIT_NOFILE);
+       req->open.ignore_nonblock = false;
         req->flags |= REQ_F_NEED_CLEANUP;
         return 0;
  }
@@ -3824,7 +3840,7 @@ static int io_openat2(struct io_kiocb *req, bool force_nonblock)
         struct file *file;
         int ret;
  
-       if (force_nonblock)
+       if (force_nonblock && !req->open.ignore_nonblock)
                 return -EAGAIN;
  
         ret = build_open_flags(&req->open.how, &op);
@@ -3839,6 +3855,21 @@ static int io_openat2(struct io_kiocb *req, bool force_nonblock)
         if (IS_ERR(file)) {
                 put_unused_fd(ret);
                 ret = PTR_ERR(file);
+               /*
+                * A work-around to ensure that /proc/self works that way
+                * that it should - if we get -EOPNOTSUPP back, then assume
+                * that proc_self_get_link() failed us because we're in async
+                * context. We should be safe to retry this from the task
+                * itself with force_nonblock == false set, as it should not
+                * block on lookup. Would be nice to know this upfront and
+                * avoid the async dance, but doesn't seem feasible.
+                */
+               if (ret == -EOPNOTSUPP && io_wq_current_is_worker()) {
+                       req->open.ignore_nonblock = true;
+                       refcount_inc(&req->refs);
+                       io_req_task_queue(req);
+                       return 0;
+               }
         } else {
                 fsnotify_open(file);
                 fd_install(ret, file);
@@ -6943,9 +6974,7 @@ static int io_sqe_files_unregister(struct io_ring_ctx *ctx)
                 return -ENXIO;
  
         spin_lock(&data->lock);
-       if (!list_empty(&data->ref_list))
-               ref_node = list_first_entry(&data->ref_list,
-                               struct fixed_file_ref_node, node);
+       ref_node = data->node;
         spin_unlock(&data->lock);
         if (ref_node)
                 percpu_ref_kill(&ref_node->refs);
@@ -8406,22 +8435,6 @@ static bool io_match_link(struct io_kiocb *preq, struct io_kiocb *req)
         return false;
  }
  
-static bool io_match_link_files(struct io_kiocb *req,
-                               struct files_struct *files)
-{
-       struct io_kiocb *link;
-
-       if (io_match_files(req, files))
-               return true;
-       if (req->flags & REQ_F_LINK_HEAD) {
-               list_for_each_entry(link, &req->link_list, link_list) {
-                       if (io_match_files(link, files))
-                               return true;
-               }
-       }
-       return false;
-}
-
  /*
   * We're looking to cancel 'req' because it's holding on to our files, but
   * 'req' could be a link to another request. See if it is, and cancel that
@@ -8471,7 +8484,21 @@ static bool io_timeout_remove_link(struct io_ring_ctx *ctx,
  
  static bool io_cancel_link_cb(struct io_wq_work *work, void *data)
  {
-       return io_match_link(container_of(work, struct io_kiocb, work), data);
+       struct io_kiocb *req = container_of(work, struct io_kiocb, work);
+       bool ret;
+
+       if (req->flags & REQ_F_LINK_TIMEOUT) {
+               unsigned long flags;
+               struct io_ring_ctx *ctx = req->ctx;
+
+               /* protect against races with linked timeouts */
+               spin_lock_irqsave(&ctx->completion_lock, flags);
+               ret = io_match_link(req, data);
+               spin_unlock_irqrestore(&ctx->completion_lock, flags);
+       } else {
+               ret = io_match_link(req, data);
+       }
+       return ret;
  }
  
  static void io_attempt_cancel(struct io_ring_ctx *ctx, struct io_kiocb *req)
@@ -8497,6 +8524,7 @@ static void io_attempt_cancel(struct io_ring_ctx *ctx, struct io_kiocb *req)
  }
  
  static void io_cancel_defer_files(struct io_ring_ctx *ctx,
+                                 struct task_struct *task,
                                   struct files_struct *files)
  {
         struct io_defer_entry *de = NULL;
@@ -8504,7 +8532,8 @@ static void io_cancel_defer_files(struct io_ring_ctx *ctx,
  
         spin_lock_irq(&ctx->completion_lock);
         list_for_each_entry_reverse(de, &ctx->defer_list, list) {
-               if (io_match_link_files(de->req, files)) {
+               if (io_task_match(de->req, task) &&
+                   io_match_files(de->req, files)) {
                         list_cut_position(&list, &ctx->defer_list, &de->list);
                         break;
                 }
@@ -8530,7 +8559,6 @@ static bool io_uring_cancel_files(struct io_ring_ctx *ctx,
         if (list_empty_careful(&ctx->inflight_list))
                 return false;
  
-       io_cancel_defer_files(ctx, files);
         /* cancel all at once, should be faster than doing it one by one*/
         io_wq_cancel_cb(ctx->io_wq, io_wq_files_match, files, true);
  
@@ -8622,6 +8650,11 @@ static void io_uring_cancel_task_requests(struct io_ring_ctx *ctx,
                 io_sq_thread_park(ctx->sq_data);
         }
  
+       if (files)
+               io_cancel_defer_files(ctx, NULL, files);
+       else
+               io_cancel_defer_files(ctx, task, NULL);
+
         io_cqring_overflow_flush(ctx, true, task, files);
  
         while (__io_uring_cancel_task_requests(ctx, task, files)) {
@@ -8969,7 +9002,8 @@ out_fput:
  #ifdef CONFIG_PROC_FS
  static int io_uring_show_cred(int id, void *p, void *data)
  {
-       const struct cred *cred = p;
+       struct io_identity *iod = p;
+       const struct cred *cred = iod->creds;
         struct seq_file *m = data;
         struct user_namespace *uns = seq_user_ns(m);
         struct group_info *gi;
@@ -9206,6 +9240,7 @@ static int io_uring_create(unsigned entries, struct io_uring_params *p,
                  * to a power-of-two, if it isn't already. We do NOT impose
                  * any cq vs sq ring sizing.
                  */
+               p->cq_entries = roundup_pow_of_two(p->cq_entries);
                 if (p->cq_entries < p->sq_entries)
                         return -EINVAL;
                 if (p->cq_entries > IORING_MAX_CQ_ENTRIES) {
@@ -9213,7 +9248,6 @@ static int io_uring_create(unsigned entries, struct io_uring_params *p,
                                 return -EINVAL;
                         p->cq_entries = IORING_MAX_CQ_ENTRIES;
                 }
-               p->cq_entries = roundup_pow_of_two(p->cq_entries);
         } else {
                 p->cq_entries = 2 * p->sq_entries;
         }