From: Dave Airlie <airlied at redhat.com>

I'm pretty sure this optimisation is actually not a great idea,
and is racy with other things waiting for fences.

Just nuke it, there should be no need to do fence waits in a
busy CPU loop.

Signed-off-by: Dave Airlie <airlied at redhat.com>
---
 drivers/gpu/drm/nouveau/nouveau_bo.c    |  2 +-
 drivers/gpu/drm/nouveau/nouveau_chan.c  |  2 +-
 drivers/gpu/drm/nouveau/nouveau_dmem.c  |  2 +-
 drivers/gpu/drm/nouveau/nouveau_fence.c | 30 +------------------------
 drivers/gpu/drm/nouveau/nouveau_fence.h |  2 +-
 drivers/gpu/drm/nouveau/nouveau_gem.c   |  2 +-
 6 files changed, 6 insertions(+), 34 deletions(-)
diff --git a/drivers/gpu/drm/nouveau/nouveau_bo.c b/drivers/gpu/drm/nouveau/nouveau_bo.c
index 8a30f5a0525b..a4e8f625fce6 100644
--- a/drivers/gpu/drm/nouveau/nouveau_bo.c
+++ b/drivers/gpu/drm/nouveau/nouveau_bo.c
@@ -902,7 +902,7 @@ nouveau_bo_move_m2mf(struct ttm_buffer_object *bo, int evict,
 	 * Without this the operation can timeout and we'll fallback to a
 	 * software copy, which might take several minutes to finish.
 	 */
-	nouveau_fence_wait(fence, false, false);
+	nouveau_fence_wait(fence, false);
 	ret = ttm_bo_move_accel_cleanup(bo, &fence->base, evict, false,
 					new_reg);
 	nouveau_fence_unref(&fence);
diff --git a/drivers/gpu/drm/nouveau/nouveau_chan.c b/drivers/gpu/drm/nouveau/nouveau_chan.c
index 7c97b2886807..66fca95c10c7 100644
--- a/drivers/gpu/drm/nouveau/nouveau_chan.c
+++ b/drivers/gpu/drm/nouveau/nouveau_chan.c
@@ -72,7 +72,7 @@ nouveau_channel_idle(struct nouveau_channel *chan)
 
 		ret = nouveau_fence_new(&fence, chan);
 		if (!ret) {
-			ret = nouveau_fence_wait(fence, false, false);
+			ret = nouveau_fence_wait(fence, false);
 			nouveau_fence_unref(&fence);
 		}
 
diff --git a/drivers/gpu/drm/nouveau/nouveau_dmem.c b/drivers/gpu/drm/nouveau/nouveau_dmem.c
index 12feecf71e75..033a09cd3c8f 100644
--- a/drivers/gpu/drm/nouveau/nouveau_dmem.c
+++ b/drivers/gpu/drm/nouveau/nouveau_dmem.c
@@ -128,7 +128,7 @@ static void nouveau_dmem_page_free(struct page *page)
 static void nouveau_dmem_fence_done(struct nouveau_fence **fence)
 {
 	if (fence) {
-		nouveau_fence_wait(*fence, true, false);
+		nouveau_fence_wait(*fence, false);
 		nouveau_fence_unref(fence);
 	} else {
 		/*
diff --git a/drivers/gpu/drm/nouveau/nouveau_fence.c b/drivers/gpu/drm/nouveau/nouveau_fence.c
index c3ea3cd933cd..8de941379324 100644
--- a/drivers/gpu/drm/nouveau/nouveau_fence.c
+++ b/drivers/gpu/drm/nouveau/nouveau_fence.c
@@ -312,39 +312,11 @@ nouveau_fence_wait_legacy(struct dma_fence *f, bool intr, long wait)
 	return timeout - t;
 }
 
-static int
-nouveau_fence_wait_busy(struct nouveau_fence *fence, bool intr)
-{
-	int ret = 0;
-
-	while (!nouveau_fence_done(fence)) {
-		if (time_after_eq(jiffies, fence->timeout)) {
-			ret = -EBUSY;
-			break;
-		}
-
-		__set_current_state(intr ?
-				    TASK_INTERRUPTIBLE :
-				    TASK_UNINTERRUPTIBLE);
-
-		if (intr && signal_pending(current)) {
-			ret = -ERESTARTSYS;
-			break;
-		}
-	}
-
-	__set_current_state(TASK_RUNNING);
-	return ret;
-}
-
 int
-nouveau_fence_wait(struct nouveau_fence *fence, bool lazy, bool intr)
+nouveau_fence_wait(struct nouveau_fence *fence, bool intr)
 {
 	long ret;
 
-	if (!lazy)
-		return nouveau_fence_wait_busy(fence, intr);
-
 	ret = dma_fence_wait_timeout(&fence->base, intr, 15 * HZ);
 	if (ret < 0)
 		return ret;
diff --git a/drivers/gpu/drm/nouveau/nouveau_fence.h b/drivers/gpu/drm/nouveau/nouveau_fence.h
index bc13110bdfa4..88213014b675 100644
--- a/drivers/gpu/drm/nouveau/nouveau_fence.h
+++ b/drivers/gpu/drm/nouveau/nouveau_fence.h
@@ -23,7 +23,7 @@ void nouveau_fence_unref(struct nouveau_fence **);
 
 int  nouveau_fence_emit(struct nouveau_fence *);
 bool nouveau_fence_done(struct nouveau_fence *);
-int  nouveau_fence_wait(struct nouveau_fence *, bool lazy, bool intr);
+int  nouveau_fence_wait(struct nouveau_fence *, bool intr);
 int  nouveau_fence_sync(struct nouveau_bo *, struct nouveau_channel *, bool exclusive, bool intr);
 
 struct nouveau_fence_chan {
diff --git a/drivers/gpu/drm/nouveau/nouveau_gem.c b/drivers/gpu/drm/nouveau/nouveau_gem.c
index 49c2bcbef129..f715e381da69 100644
--- a/drivers/gpu/drm/nouveau/nouveau_gem.c
+++ b/drivers/gpu/drm/nouveau/nouveau_gem.c
@@ -928,7 +928,7 @@ nouveau_gem_ioctl_pushbuf(struct drm_device *dev, void *data,
 	}
 
 	if (sync) {
-		if (!(ret = nouveau_fence_wait(fence, false, false))) {
+		if (!(ret = nouveau_fence_wait(fence, false))) {
 			if ((ret = dma_fence_get_status(&fence->base)) == 1)
 				ret = 0;
 		}
-- 
2.43.2
On 17/4/24 15:40, Dave Airlie wrote:
> External email: Use caution opening links or attachments
>
>
> From: Dave Airlie <airlied at redhat.com>
>
> I'm pretty sure this optimisation is actually not a great idea,
> and is racy with other things waiting for fences.
>
> Just nuke it, there should be no need to do fence waits in a
> busy CPU loop.
>
> Signed-off-by: Dave Airlie <airlied at redhat.com>

Reviewed-by: Ben Skeggs <bskeggs at nvidia.com>

> ---
>  drivers/gpu/drm/nouveau/nouveau_bo.c    |  2 +-
>  drivers/gpu/drm/nouveau/nouveau_chan.c  |  2 +-
>  drivers/gpu/drm/nouveau/nouveau_dmem.c  |  2 +-
>  drivers/gpu/drm/nouveau/nouveau_fence.c | 30 +------------------------
>  drivers/gpu/drm/nouveau/nouveau_fence.h |  2 +-
>  drivers/gpu/drm/nouveau/nouveau_gem.c   |  2 +-
>  6 files changed, 6 insertions(+), 34 deletions(-)
>
> diff --git a/drivers/gpu/drm/nouveau/nouveau_bo.c b/drivers/gpu/drm/nouveau/nouveau_bo.c
> index 8a30f5a0525b..a4e8f625fce6 100644
> --- a/drivers/gpu/drm/nouveau/nouveau_bo.c
> +++ b/drivers/gpu/drm/nouveau/nouveau_bo.c
> @@ -902,7 +902,7 @@ nouveau_bo_move_m2mf(struct ttm_buffer_object *bo, int evict,
>  	 * Without this the operation can timeout and we'll fallback to a
>  	 * software copy, which might take several minutes to finish.
>  	 */
> -	nouveau_fence_wait(fence, false, false);
> +	nouveau_fence_wait(fence, false);
>  	ret = ttm_bo_move_accel_cleanup(bo, &fence->base, evict, false,
>  					new_reg);
>  	nouveau_fence_unref(&fence);
> diff --git a/drivers/gpu/drm/nouveau/nouveau_chan.c b/drivers/gpu/drm/nouveau/nouveau_chan.c
> index 7c97b2886807..66fca95c10c7 100644
> --- a/drivers/gpu/drm/nouveau/nouveau_chan.c
> +++ b/drivers/gpu/drm/nouveau/nouveau_chan.c
> @@ -72,7 +72,7 @@ nouveau_channel_idle(struct nouveau_channel *chan)
>
>  		ret = nouveau_fence_new(&fence, chan);
>  		if (!ret) {
> -			ret = nouveau_fence_wait(fence, false, false);
> +			ret = nouveau_fence_wait(fence, false);
>  			nouveau_fence_unref(&fence);
>  		}
>
> diff --git a/drivers/gpu/drm/nouveau/nouveau_dmem.c b/drivers/gpu/drm/nouveau/nouveau_dmem.c
> index 12feecf71e75..033a09cd3c8f 100644
> --- a/drivers/gpu/drm/nouveau/nouveau_dmem.c
> +++ b/drivers/gpu/drm/nouveau/nouveau_dmem.c
> @@ -128,7 +128,7 @@ static void nouveau_dmem_page_free(struct page *page)
>  static void nouveau_dmem_fence_done(struct nouveau_fence **fence)
>  {
>  	if (fence) {
> -		nouveau_fence_wait(*fence, true, false);
> +		nouveau_fence_wait(*fence, false);
>  		nouveau_fence_unref(fence);
>  	} else {
>  		/*
> diff --git a/drivers/gpu/drm/nouveau/nouveau_fence.c b/drivers/gpu/drm/nouveau/nouveau_fence.c
> index c3ea3cd933cd..8de941379324 100644
> --- a/drivers/gpu/drm/nouveau/nouveau_fence.c
> +++ b/drivers/gpu/drm/nouveau/nouveau_fence.c
> @@ -312,39 +312,11 @@ nouveau_fence_wait_legacy(struct dma_fence *f, bool intr, long wait)
>  	return timeout - t;
>  }
>
> -static int
> -nouveau_fence_wait_busy(struct nouveau_fence *fence, bool intr)
> -{
> -	int ret = 0;
> -
> -	while (!nouveau_fence_done(fence)) {
> -		if (time_after_eq(jiffies, fence->timeout)) {
> -			ret = -EBUSY;
> -			break;
> -		}
> -
> -		__set_current_state(intr ?
> -				    TASK_INTERRUPTIBLE :
> -				    TASK_UNINTERRUPTIBLE);
> -
> -		if (intr && signal_pending(current)) {
> -			ret = -ERESTARTSYS;
> -			break;
> -		}
> -	}
> -
> -	__set_current_state(TASK_RUNNING);
> -	return ret;
> -}
> -
>  int
> -nouveau_fence_wait(struct nouveau_fence *fence, bool lazy, bool intr)
> +nouveau_fence_wait(struct nouveau_fence *fence, bool intr)
>  {
>  	long ret;
>
> -	if (!lazy)
> -		return nouveau_fence_wait_busy(fence, intr);
> -
>  	ret = dma_fence_wait_timeout(&fence->base, intr, 15 * HZ);
>  	if (ret < 0)
>  		return ret;
> diff --git a/drivers/gpu/drm/nouveau/nouveau_fence.h b/drivers/gpu/drm/nouveau/nouveau_fence.h
> index bc13110bdfa4..88213014b675 100644
> --- a/drivers/gpu/drm/nouveau/nouveau_fence.h
> +++ b/drivers/gpu/drm/nouveau/nouveau_fence.h
> @@ -23,7 +23,7 @@ void nouveau_fence_unref(struct nouveau_fence **);
>
>  int  nouveau_fence_emit(struct nouveau_fence *);
>  bool nouveau_fence_done(struct nouveau_fence *);
> -int  nouveau_fence_wait(struct nouveau_fence *, bool lazy, bool intr);
> +int  nouveau_fence_wait(struct nouveau_fence *, bool intr);
>  int  nouveau_fence_sync(struct nouveau_bo *, struct nouveau_channel *, bool exclusive, bool intr);
>
>  struct nouveau_fence_chan {
> diff --git a/drivers/gpu/drm/nouveau/nouveau_gem.c b/drivers/gpu/drm/nouveau/nouveau_gem.c
> index 49c2bcbef129..f715e381da69 100644
> --- a/drivers/gpu/drm/nouveau/nouveau_gem.c
> +++ b/drivers/gpu/drm/nouveau/nouveau_gem.c
> @@ -928,7 +928,7 @@ nouveau_gem_ioctl_pushbuf(struct drm_device *dev, void *data,
>  	}
>
>  	if (sync) {
> -		if (!(ret = nouveau_fence_wait(fence, false, false))) {
> +		if (!(ret = nouveau_fence_wait(fence, false))) {
>  			if ((ret = dma_fence_get_status(&fence->base)) == 1)
>  				ret = 0;
>  		}
> -- 
> 2.43.2
>
On 4/17/24 07:40, Dave Airlie wrote:
> From: Dave Airlie <airlied at redhat.com>
>
> I'm pretty sure this optimisation is actually not a great idea,
> and is racy with other things waiting for fences.

Yes, I tried to use it in the past on scheduler tear down, to have an
indicator whether all jobs had the chance to finish. However, it happened
that using a CPU busy loop saw the fence as signaled, while an (event
based) dma_fence was still seen as unsignaled.

>
> Just nuke it, there should be no need to do fence waits in a
> busy CPU loop.
>
> Signed-off-by: Dave Airlie <airlied at redhat.com>

Applied to drm-misc-next.

> ---
>  drivers/gpu/drm/nouveau/nouveau_bo.c    |  2 +-
>  drivers/gpu/drm/nouveau/nouveau_chan.c  |  2 +-
>  drivers/gpu/drm/nouveau/nouveau_dmem.c  |  2 +-
>  drivers/gpu/drm/nouveau/nouveau_fence.c | 30 +------------------------
>  drivers/gpu/drm/nouveau/nouveau_fence.h |  2 +-
>  drivers/gpu/drm/nouveau/nouveau_gem.c   |  2 +-
>  6 files changed, 6 insertions(+), 34 deletions(-)
>
> diff --git a/drivers/gpu/drm/nouveau/nouveau_bo.c b/drivers/gpu/drm/nouveau/nouveau_bo.c
> index 8a30f5a0525b..a4e8f625fce6 100644
> --- a/drivers/gpu/drm/nouveau/nouveau_bo.c
> +++ b/drivers/gpu/drm/nouveau/nouveau_bo.c
> @@ -902,7 +902,7 @@ nouveau_bo_move_m2mf(struct ttm_buffer_object *bo, int evict,
>  	 * Without this the operation can timeout and we'll fallback to a
>  	 * software copy, which might take several minutes to finish.
>  	 */
> -	nouveau_fence_wait(fence, false, false);
> +	nouveau_fence_wait(fence, false);
>  	ret = ttm_bo_move_accel_cleanup(bo, &fence->base, evict, false,
>  					new_reg);
>  	nouveau_fence_unref(&fence);
> diff --git a/drivers/gpu/drm/nouveau/nouveau_chan.c b/drivers/gpu/drm/nouveau/nouveau_chan.c
> index 7c97b2886807..66fca95c10c7 100644
> --- a/drivers/gpu/drm/nouveau/nouveau_chan.c
> +++ b/drivers/gpu/drm/nouveau/nouveau_chan.c
> @@ -72,7 +72,7 @@ nouveau_channel_idle(struct nouveau_channel *chan)
>
>  		ret = nouveau_fence_new(&fence, chan);
>  		if (!ret) {
> -			ret = nouveau_fence_wait(fence, false, false);
> +			ret = nouveau_fence_wait(fence, false);
>  			nouveau_fence_unref(&fence);
>  		}
>
> diff --git a/drivers/gpu/drm/nouveau/nouveau_dmem.c b/drivers/gpu/drm/nouveau/nouveau_dmem.c
> index 12feecf71e75..033a09cd3c8f 100644
> --- a/drivers/gpu/drm/nouveau/nouveau_dmem.c
> +++ b/drivers/gpu/drm/nouveau/nouveau_dmem.c
> @@ -128,7 +128,7 @@ static void nouveau_dmem_page_free(struct page *page)
>  static void nouveau_dmem_fence_done(struct nouveau_fence **fence)
>  {
>  	if (fence) {
> -		nouveau_fence_wait(*fence, true, false);
> +		nouveau_fence_wait(*fence, false);
>  		nouveau_fence_unref(fence);
>  	} else {
>  		/*
> diff --git a/drivers/gpu/drm/nouveau/nouveau_fence.c b/drivers/gpu/drm/nouveau/nouveau_fence.c
> index c3ea3cd933cd..8de941379324 100644
> --- a/drivers/gpu/drm/nouveau/nouveau_fence.c
> +++ b/drivers/gpu/drm/nouveau/nouveau_fence.c
> @@ -312,39 +312,11 @@ nouveau_fence_wait_legacy(struct dma_fence *f, bool intr, long wait)
>  	return timeout - t;
>  }
>
> -static int
> -nouveau_fence_wait_busy(struct nouveau_fence *fence, bool intr)
> -{
> -	int ret = 0;
> -
> -	while (!nouveau_fence_done(fence)) {
> -		if (time_after_eq(jiffies, fence->timeout)) {
> -			ret = -EBUSY;
> -			break;
> -		}
> -
> -		__set_current_state(intr ?
> -				    TASK_INTERRUPTIBLE :
> -				    TASK_UNINTERRUPTIBLE);
> -
> -		if (intr && signal_pending(current)) {
> -			ret = -ERESTARTSYS;
> -			break;
> -		}
> -	}
> -
> -	__set_current_state(TASK_RUNNING);
> -	return ret;
> -}
> -
>  int
> -nouveau_fence_wait(struct nouveau_fence *fence, bool lazy, bool intr)
> +nouveau_fence_wait(struct nouveau_fence *fence, bool intr)
>  {
>  	long ret;
>
> -	if (!lazy)
> -		return nouveau_fence_wait_busy(fence, intr);
> -
>  	ret = dma_fence_wait_timeout(&fence->base, intr, 15 * HZ);
>  	if (ret < 0)
>  		return ret;
> diff --git a/drivers/gpu/drm/nouveau/nouveau_fence.h b/drivers/gpu/drm/nouveau/nouveau_fence.h
> index bc13110bdfa4..88213014b675 100644
> --- a/drivers/gpu/drm/nouveau/nouveau_fence.h
> +++ b/drivers/gpu/drm/nouveau/nouveau_fence.h
> @@ -23,7 +23,7 @@ void nouveau_fence_unref(struct nouveau_fence **);
>
>  int  nouveau_fence_emit(struct nouveau_fence *);
>  bool nouveau_fence_done(struct nouveau_fence *);
> -int  nouveau_fence_wait(struct nouveau_fence *, bool lazy, bool intr);
> +int  nouveau_fence_wait(struct nouveau_fence *, bool intr);
>  int  nouveau_fence_sync(struct nouveau_bo *, struct nouveau_channel *, bool exclusive, bool intr);
>
>  struct nouveau_fence_chan {
> diff --git a/drivers/gpu/drm/nouveau/nouveau_gem.c b/drivers/gpu/drm/nouveau/nouveau_gem.c
> index 49c2bcbef129..f715e381da69 100644
> --- a/drivers/gpu/drm/nouveau/nouveau_gem.c
> +++ b/drivers/gpu/drm/nouveau/nouveau_gem.c
> @@ -928,7 +928,7 @@ nouveau_gem_ioctl_pushbuf(struct drm_device *dev, void *data,
>  	}
>
>  	if (sync) {
> -		if (!(ret = nouveau_fence_wait(fence, false, false))) {
> +		if (!(ret = nouveau_fence_wait(fence, false))) {
>  			if ((ret = dma_fence_get_status(&fence->base)) == 1)
>  				ret = 0;
>  		}