gpu: host1x: Add no-recovery mode
author     Mikko Perttunen <mperttunen@nvidia.com>
           Thu, 10 Jun 2021 11:04:43 +0000 (14:04 +0300)
committer  Thierry Reding <treding@nvidia.com>
           Tue, 10 Aug 2021 12:40:23 +0000 (14:40 +0200)
Add a new property for jobs to enable or disable recovery, i.e.
CPU increments of syncpoints to the maximum value on job timeout.
Disabling recovery gives a more solid model for hung jobs, where
userspace no longer needs to guess whether a syncpoint increment
happened because the job completed or because the job timeout was
triggered.
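
From the client driver's side, opting out of recovery amounts to
clearing job->syncpt_recovery and treating -EPERM from submission as
"the syncpoint was locked by an earlier timeout". A minimal sketch,
where struct my_client and my_client_realloc_syncpt() are hypothetical;
host1x_job_submit() and the -EPERM return come from this patch:

/*
 * Hypothetical client-side use of the no-recovery mode.
 */
static int my_client_submit(struct my_client *client, struct host1x_job *job)
{
	int err;

	/* Opt out of recovery: on timeout this job's syncpoint is locked
	 * instead of being fast-forwarded by the CPU. */
	job->syncpt_recovery = false;

	err = host1x_job_submit(job);
	if (err == -EPERM) {
		/*
		 * The syncpoint was locked by a previous job timeout; it
		 * must be dropped and a fresh one allocated before new
		 * submissions can be made.
		 */
		return my_client_realloc_syncpt(client);
	}

	return err;
}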

On job timeout, we stop the channel, NOP out all future jobs on
the channel that use the same syncpoint, mark the syncpoint as
locked, and resume the channel from the next job, if any.

The future jobs are NOPed: since the CPU increments are not done,
the value of the syncpoint is no longer synchronized, and any
waiters would become confused if a future job incremented the
syncpoint. The syncpoint is marked locked to ensure that future
jobs cannot increment it either, until the application has
recognized the situation and reallocated the syncpoint.

Signed-off-by: Mikko Perttunen <mperttunen@nvidia.com>
Signed-off-by: Thierry Reding <treding@nvidia.com>
drivers/gpu/drm/tegra/drm.c
drivers/gpu/host1x/cdma.c
drivers/gpu/host1x/hw/channel_hw.c
drivers/gpu/host1x/job.c
drivers/gpu/host1x/syncpt.c
drivers/gpu/host1x/syncpt.h
include/linux/host1x.h

index f96c237..739250a 100644 (file)
@@ -201,6 +201,7 @@ int tegra_drm_submit(struct tegra_drm_context *context,
        job->client = client;
        job->class = client->class;
        job->serialize = true;
+       job->syncpt_recovery = true;
 
        /*
         * Track referenced BOs so that they can be unreferenced after the
index 6e6ca77..765e5aa 100644 (file)
@@ -312,10 +312,6 @@ static void update_cdma_locked(struct host1x_cdma *cdma)
        bool signal = false;
        struct host1x_job *job, *n;
 
-       /* If CDMA is stopped, queue is cleared and we can return */
-       if (!cdma->running)
-               return;
-
        /*
         * Walk the sync queue, reading the sync point registers as necessary,
         * to consume as many sync queue entries as possible without blocking
@@ -324,7 +320,8 @@ static void update_cdma_locked(struct host1x_cdma *cdma)
                struct host1x_syncpt *sp = job->syncpt;
 
                /* Check whether this syncpt has completed, and bail if not */
-               if (!host1x_syncpt_is_expired(sp, job->syncpt_end)) {
+               if (!host1x_syncpt_is_expired(sp, job->syncpt_end) &&
+                   !job->cancelled) {
                        /* Start timer on next pending syncpt */
                        if (job->timeout)
                                cdma_start_timer_locked(cdma, job);
@@ -413,8 +410,11 @@ syncpt_incr:
        else
                restart_addr = cdma->last_pos;
 
+       if (!job)
+               goto resume;
+
        /* do CPU increments for the remaining syncpts */
-       if (job) {
+       if (job->syncpt_recovery) {
                dev_dbg(dev, "%s: perform CPU incr on pending buffers\n",
                        __func__);
 
@@ -433,8 +433,44 @@ syncpt_incr:
 
                dev_dbg(dev, "%s: finished sync_queue modification\n",
                        __func__);
+       } else {
+               struct host1x_job *failed_job = job;
+
+               host1x_job_dump(dev, job);
+
+               host1x_syncpt_set_locked(job->syncpt);
+               failed_job->cancelled = true;
+
+               list_for_each_entry_continue(job, &cdma->sync_queue, list) {
+                       unsigned int i;
+
+                       if (job->syncpt != failed_job->syncpt)
+                               continue;
+
+                       for (i = 0; i < job->num_slots; i++) {
+                               unsigned int slot = (job->first_get/8 + i) %
+                                                   HOST1X_PUSHBUFFER_SLOTS;
+                               u32 *mapped = cdma->push_buffer.mapped;
+
+                               /*
+                                * Overwrite opcodes with 0 word writes
+                                * to offset 0xbad. This does nothing but
+                                * has an easily detected signature in debug
+                                * traces.
+                                */
+                               mapped[2*slot+0] = 0x1bad0000;
+                               mapped[2*slot+1] = 0x1bad0000;
+                       }
+
+                       job->cancelled = true;
+               }
+
+               wmb();
+
+               update_cdma_locked(cdma);
        }
 
+resume:
        /* roll back DMAGET and start up channel again */
        host1x_hw_cdma_resume(host1x, cdma, restart_addr);
 }
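
The 0x1bad0000 word written into the push buffer above is the "NOP"
pattern described in the commit message. A rough sketch of how it is
composed, assuming the usual host1x opcode encoding (opcode in bits
31:28, register offset in bits 27:16, word count in bits 15:0, as used
by host1x_opcode_incr() in the hw headers); the names here are
illustrative only:

#define MY_HOST1X_OPCODE_INCR	1

static u32 nop_signature_word(void)
{
	/* INCR at offset 0xbad with a count of 0: writes no data, but is
	 * easy to spot in command traces. */
	return (MY_HOST1X_OPCODE_INCR << 28) | (0xbad << 16) | 0; /* = 0x1bad0000 */
}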
@@ -490,6 +526,16 @@ int host1x_cdma_begin(struct host1x_cdma *cdma, struct host1x_job *job)
 
        mutex_lock(&cdma->lock);
 
+       /*
+        * Check if syncpoint was locked due to previous job timeout.
+        * This needs to be done within the cdma lock to avoid a race
+        * with the timeout handler.
+        */
+       if (job->syncpt->locked) {
+               mutex_unlock(&cdma->lock);
+               return -EPERM;
+       }
+
        if (job->timeout) {
                /* init state on first submit with timeout value */
                if (!cdma->timeout.initialized) {
index d4c28fa..bf21512 100644 (file)
@@ -191,7 +191,7 @@ static int channel_submit(struct host1x_job *job)
        /* schedule a submit complete interrupt */
        err = host1x_intr_add_action(host, sp, syncval,
                                     HOST1X_INTR_ACTION_SUBMIT_COMPLETE, ch,
-                                    completed_waiter, NULL);
+                                    completed_waiter, &job->waiter);
        completed_waiter = NULL;
        WARN(err, "Failed to set submit complete interrupt");
 
index adbdc22..8f59b34 100644 (file)
@@ -79,6 +79,10 @@ static void job_free(struct kref *ref)
 {
        struct host1x_job *job = container_of(ref, struct host1x_job, ref);
 
+       if (job->waiter)
+               host1x_intr_put_ref(job->syncpt->host, job->syncpt->id,
+                                   job->waiter, false);
+
        if (job->syncpt)
                host1x_syncpt_put(job->syncpt);
 
index e648ebb..d198a10 100644 (file)
@@ -407,6 +407,8 @@ static void syncpt_release(struct kref *ref)
 
        atomic_set(&sp->max_val, host1x_syncpt_read(sp));
 
+       sp->locked = false;
+
        mutex_lock(&sp->host->syncpt_mutex);
 
        host1x_syncpt_base_free(sp->base);
index a6766f8..95cd29b 100644 (file)
@@ -40,6 +40,13 @@ struct host1x_syncpt {
 
        /* interrupt data */
        struct host1x_syncpt_intr intr;
+
+       /*
+        * If a submission incrementing this syncpoint fails, lock it so that
+        * further submissions cannot be made until the application has handled the
+        * failure.
+        */
+       bool locked;
 };
 
 /* Initialize sync point array  */
@@ -115,4 +122,9 @@ static inline int host1x_syncpt_is_valid(struct host1x_syncpt *sp)
        return sp->id < host1x_syncpt_nb_pts(sp->host);
 }
 
+static inline void host1x_syncpt_set_locked(struct host1x_syncpt *sp)
+{
+       sp->locked = true;
+}
+
 #endif
index eb4cc8c..8da088a 100644 (file)
@@ -236,9 +236,15 @@ struct host1x_job {
        u32 syncpt_incrs;
        u32 syncpt_end;
 
+       /* Completion waiter ref */
+       void *waiter;
+
        /* Maximum time to wait for this job */
        unsigned int timeout;
 
+       /* Job has timed out and should be released */
+       bool cancelled;
+
        /* Index and number of slots used in the push buffer */
        unsigned int first_get;
        unsigned int num_slots;
@@ -259,6 +265,9 @@ struct host1x_job {
 
        /* Add a channel wait for previous ops to complete */
        bool serialize;
+
+       /* Fast-forward syncpoint increments on job timeout */
+       bool syncpt_recovery;
 };
 
 struct host1x_job *host1x_job_alloc(struct host1x_channel *ch,