Message ID | 5423F0EA.4030708@canonical.com (mailing list archive) |
---|---|
State | New, archived |
Headers | show |
Op 25-09-14 om 12:39 schreef Maarten Lankhorst: > Not the whole world is a radeon! :-) > > Signed-off-by: Maarten Lankhorst <maarten.lankhorst@canonical.com> > --- > Changes: > - Removed interruptible parameter, only 1 place has a use for it, > and it's the only place that can hit it. > - Fail faster in radeon_semaphore_sync_resv. > - Make the break on error in radeon_cs.c more explicit. > - Upgrade the unlikely() to a WARN_ON_ONCE() in radeon_fence_wait, with a comment explaining why. Ping, can you review? > diff --git a/drivers/gpu/drm/radeon/cik.c b/drivers/gpu/drm/radeon/cik.c > index 0d761f73a7fa..7bdf80c2603d 100644 > --- a/drivers/gpu/drm/radeon/cik.c > +++ b/drivers/gpu/drm/radeon/cik.c > @@ -3993,7 +3993,7 @@ struct radeon_fence *cik_copy_cpdma(struct radeon_device *rdev, > return ERR_PTR(r); > } > > - radeon_semaphore_sync_resv(sem, resv, false); > + radeon_semaphore_sync_resv(rdev, sem, resv, false); > radeon_semaphore_sync_rings(rdev, sem, ring->idx); > > for (i = 0; i < num_loops; i++) { > diff --git a/drivers/gpu/drm/radeon/cik_sdma.c b/drivers/gpu/drm/radeon/cik_sdma.c > index c01a6100c318..c473c9125295 100644 > --- a/drivers/gpu/drm/radeon/cik_sdma.c > +++ b/drivers/gpu/drm/radeon/cik_sdma.c > @@ -571,7 +571,7 @@ struct radeon_fence *cik_copy_dma(struct radeon_device *rdev, > return ERR_PTR(r); > } > > - radeon_semaphore_sync_resv(sem, resv, false); > + radeon_semaphore_sync_resv(rdev, sem, resv, false); > radeon_semaphore_sync_rings(rdev, sem, ring->idx); > > for (i = 0; i < num_loops; i++) { > diff --git a/drivers/gpu/drm/radeon/evergreen_dma.c b/drivers/gpu/drm/radeon/evergreen_dma.c > index 946f37d0b469..66bcfadeedd1 100644 > --- a/drivers/gpu/drm/radeon/evergreen_dma.c > +++ b/drivers/gpu/drm/radeon/evergreen_dma.c > @@ -133,7 +133,7 @@ struct radeon_fence *evergreen_copy_dma(struct radeon_device *rdev, > return ERR_PTR(r); > } > > - radeon_semaphore_sync_resv(sem, resv, false); > + radeon_semaphore_sync_resv(rdev, sem, resv, false); > radeon_semaphore_sync_rings(rdev, sem, ring->idx); > > for (i = 0; i < num_loops; i++) { > diff --git a/drivers/gpu/drm/radeon/r600.c b/drivers/gpu/drm/radeon/r600.c > index 25f367ac4637..f8eb519c3286 100644 > --- a/drivers/gpu/drm/radeon/r600.c > +++ b/drivers/gpu/drm/radeon/r600.c > @@ -2912,7 +2912,7 @@ struct radeon_fence *r600_copy_cpdma(struct radeon_device *rdev, > return ERR_PTR(r); > } > > - radeon_semaphore_sync_resv(sem, resv, false); > + radeon_semaphore_sync_resv(rdev, sem, resv, false); > radeon_semaphore_sync_rings(rdev, sem, ring->idx); > > radeon_ring_write(ring, PACKET3(PACKET3_SET_CONFIG_REG, 1)); > diff --git a/drivers/gpu/drm/radeon/r600_dma.c b/drivers/gpu/drm/radeon/r600_dma.c > index fc54224ce87b..a49db830a47f 100644 > --- a/drivers/gpu/drm/radeon/r600_dma.c > +++ b/drivers/gpu/drm/radeon/r600_dma.c > @@ -470,7 +470,7 @@ struct radeon_fence *r600_copy_dma(struct radeon_device *rdev, > return ERR_PTR(r); > } > > - radeon_semaphore_sync_resv(sem, resv, false); > + radeon_semaphore_sync_resv(rdev, sem, resv, false); > radeon_semaphore_sync_rings(rdev, sem, ring->idx); > > for (i = 0; i < num_loops; i++) { > diff --git a/drivers/gpu/drm/radeon/radeon.h b/drivers/gpu/drm/radeon/radeon.h > index 864457cd7c98..07aa961bf5ca 100644 > --- a/drivers/gpu/drm/radeon/radeon.h > +++ b/drivers/gpu/drm/radeon/radeon.h > @@ -589,9 +589,10 @@ bool radeon_semaphore_emit_wait(struct radeon_device *rdev, int ring, > struct radeon_semaphore *semaphore); > void radeon_semaphore_sync_fence(struct radeon_semaphore *semaphore, > struct radeon_fence *fence); > -void radeon_semaphore_sync_resv(struct radeon_semaphore *semaphore, > - struct reservation_object *resv, > - bool shared); > +int radeon_semaphore_sync_resv(struct radeon_device *rdev, > + struct radeon_semaphore *semaphore, > + struct reservation_object *resv, > + bool shared); > int radeon_semaphore_sync_rings(struct radeon_device *rdev, > struct radeon_semaphore *semaphore, > int waiting_ring); > diff --git a/drivers/gpu/drm/radeon/radeon_cs.c b/drivers/gpu/drm/radeon/radeon_cs.c > index f662de41ba49..1c893447d7cd 100644 > --- a/drivers/gpu/drm/radeon/radeon_cs.c > +++ b/drivers/gpu/drm/radeon/radeon_cs.c > @@ -249,9 +249,9 @@ static int radeon_cs_get_ring(struct radeon_cs_parser *p, u32 ring, s32 priority > return 0; > } > > -static void radeon_cs_sync_rings(struct radeon_cs_parser *p) > +static int radeon_cs_sync_rings(struct radeon_cs_parser *p) > { > - int i; > + int i, r = 0; > > for (i = 0; i < p->nrelocs; i++) { > struct reservation_object *resv; > @@ -260,9 +260,13 @@ static void radeon_cs_sync_rings(struct radeon_cs_parser *p) > continue; > > resv = p->relocs[i].robj->tbo.resv; > - radeon_semaphore_sync_resv(p->ib.semaphore, resv, > - p->relocs[i].tv.shared); > + r = radeon_semaphore_sync_resv(p->rdev, p->ib.semaphore, resv, > + p->relocs[i].tv.shared); > + > + if (r) > + break; > } > + return r; > } > > /* XXX: note that this is called from the legacy UMS CS ioctl as well */ > @@ -472,13 +476,19 @@ static int radeon_cs_ib_chunk(struct radeon_device *rdev, > return r; > } > > + r = radeon_cs_sync_rings(parser); > + if (r) { > + if (r != -ERESTARTSYS) > + DRM_ERROR("Failed to sync rings: %i\n", r); > + return r; > + } > + > if (parser->ring == R600_RING_TYPE_UVD_INDEX) > radeon_uvd_note_usage(rdev); > else if ((parser->ring == TN_RING_TYPE_VCE1_INDEX) || > (parser->ring == TN_RING_TYPE_VCE2_INDEX)) > radeon_vce_note_usage(rdev); > > - radeon_cs_sync_rings(parser); > r = radeon_ib_schedule(rdev, &parser->ib, NULL, true); > if (r) { > DRM_ERROR("Failed to schedule IB !\n"); > @@ -565,7 +575,13 @@ static int radeon_cs_ib_vm_chunk(struct radeon_device *rdev, > if (r) { > goto out; > } > - radeon_cs_sync_rings(parser); > + > + r = radeon_cs_sync_rings(parser); > + if (r) { > + if (r != -ERESTARTSYS) > + DRM_ERROR("Failed to sync rings: %i\n", r); > + goto out; > + } > radeon_semaphore_sync_fence(parser->ib.semaphore, vm->fence); > > if ((rdev->family >= CHIP_TAHITI) && > diff --git a/drivers/gpu/drm/radeon/radeon_fence.c b/drivers/gpu/drm/radeon/radeon_fence.c > index af9f2d6bd7d0..995167025282 100644 > --- a/drivers/gpu/drm/radeon/radeon_fence.c > +++ b/drivers/gpu/drm/radeon/radeon_fence.c > @@ -541,6 +541,15 @@ int radeon_fence_wait(struct radeon_fence *fence, bool intr) > uint64_t seq[RADEON_NUM_RINGS] = {}; > long r; > > + /* > + * This function should not be called on !radeon fences. > + * If this is the case, it would mean this function can > + * also be called on radeon fences belonging to another card. > + * exclusive_lock is not held in that case. > + */ > + if (WARN_ON_ONCE(!to_radeon_fence(&fence->base))) > + return fence_wait(&fence->base, intr); > + > seq[fence->ring] = fence->seq; > r = radeon_fence_wait_seq_timeout(fence->rdev, seq, intr, MAX_SCHEDULE_TIMEOUT); > if (r < 0) { > diff --git a/drivers/gpu/drm/radeon/radeon_semaphore.c b/drivers/gpu/drm/radeon/radeon_semaphore.c > index 4d4b0773638a..6deb08f045b7 100644 > --- a/drivers/gpu/drm/radeon/radeon_semaphore.c > +++ b/drivers/gpu/drm/radeon/radeon_semaphore.c > @@ -124,27 +124,42 @@ void radeon_semaphore_sync_fence(struct radeon_semaphore *semaphore, > * > * Sync to the fence using this semaphore object > */ > -void radeon_semaphore_sync_resv(struct radeon_semaphore *sema, > - struct reservation_object *resv, > - bool shared) > +int radeon_semaphore_sync_resv(struct radeon_device *rdev, > + struct radeon_semaphore *sema, > + struct reservation_object *resv, > + bool shared) > { > struct reservation_object_list *flist; > struct fence *f; > + struct radeon_fence *fence; > unsigned i; > + int r = 0; > > /* always sync to the exclusive fence */ > f = reservation_object_get_excl(resv); > - radeon_semaphore_sync_fence(sema, (struct radeon_fence*)f); > + fence = f ? to_radeon_fence(f) : NULL; > + if (fence && fence->rdev == rdev) > + radeon_semaphore_sync_fence(sema, fence); > + else if (f) > + r = fence_wait(f, true); > > flist = reservation_object_get_list(resv); > - if (shared || !flist) > - return; > + if (shared || !flist || r) > + return r; > > for (i = 0; i < flist->shared_count; ++i) { > f = rcu_dereference_protected(flist->shared[i], > reservation_object_held(resv)); > - radeon_semaphore_sync_fence(sema, (struct radeon_fence*)f); > + fence = to_radeon_fence(f); > + if (fence && fence->rdev == rdev) > + radeon_semaphore_sync_fence(sema, fence); > + else > + r = fence_wait(f, true); > + > + if (r) > + break; > } > + return r; > } > > /** > diff --git a/drivers/gpu/drm/radeon/radeon_vm.c b/drivers/gpu/drm/radeon/radeon_vm.c > index ce870959dff8..8af1a94e7448 100644 > --- a/drivers/gpu/drm/radeon/radeon_vm.c > +++ b/drivers/gpu/drm/radeon/radeon_vm.c > @@ -698,7 +698,7 @@ int radeon_vm_update_page_directory(struct radeon_device *rdev, > if (ib.length_dw != 0) { > radeon_asic_vm_pad_ib(rdev, &ib); > > - radeon_semaphore_sync_resv(ib.semaphore, pd->tbo.resv, false); > + radeon_semaphore_sync_resv(rdev, ib.semaphore, pd->tbo.resv, false); > radeon_semaphore_sync_fence(ib.semaphore, vm->last_id_use); > WARN_ON(ib.length_dw > ndw); > r = radeon_ib_schedule(rdev, &ib, NULL, false); > @@ -825,7 +825,7 @@ static void radeon_vm_update_ptes(struct radeon_device *rdev, > unsigned nptes; > uint64_t pte; > > - radeon_semaphore_sync_resv(ib->semaphore, pt->tbo.resv, false); > + radeon_semaphore_sync_resv(rdev, ib->semaphore, pt->tbo.resv, false); > > if ((addr & ~mask) == (end & ~mask)) > nptes = end - addr; > diff --git a/drivers/gpu/drm/radeon/rv770_dma.c b/drivers/gpu/drm/radeon/rv770_dma.c > index c112764adfdf..7f34bad2e724 100644 > --- a/drivers/gpu/drm/radeon/rv770_dma.c > +++ b/drivers/gpu/drm/radeon/rv770_dma.c > @@ -67,7 +67,7 @@ struct radeon_fence *rv770_copy_dma(struct radeon_device *rdev, > return ERR_PTR(r); > } > > - radeon_semaphore_sync_resv(sem, resv, false); > + radeon_semaphore_sync_resv(rdev, sem, resv, false); > radeon_semaphore_sync_rings(rdev, sem, ring->idx); > > for (i = 0; i < num_loops; i++) { > diff --git a/drivers/gpu/drm/radeon/si_dma.c b/drivers/gpu/drm/radeon/si_dma.c > index 9b0dfbc913f3..b58f12b762d7 100644 > --- a/drivers/gpu/drm/radeon/si_dma.c > +++ b/drivers/gpu/drm/radeon/si_dma.c > @@ -252,7 +252,7 @@ struct radeon_fence *si_copy_dma(struct radeon_device *rdev, > return ERR_PTR(r); > } > > - radeon_semaphore_sync_resv(sem, resv, false); > + radeon_semaphore_sync_resv(rdev, sem, resv, false); > radeon_semaphore_sync_rings(rdev, sem, ring->idx); > > for (i = 0; i < num_loops; i++) { >
Am 01.10.2014 um 10:57 schrieb Maarten Lankhorst: > Op 25-09-14 om 12:39 schreef Maarten Lankhorst: >> Not the whole world is a radeon! :-) >> >> Signed-off-by: Maarten Lankhorst <maarten.lankhorst@canonical.com> >> --- >> Changes: >> - Removed interruptible parameter, only 1 place has a use for it, >> and it's the only place that can hit it. >> - Fail faster in radeon_semaphore_sync_resv. >> - Make the break on error in radeon_cs.c more explicit. >> - Upgrade the unlikely() to a WARN_ON_ONCE() in radeon_fence_wait, with a comment explaining why. > Ping, can you review? LGTM, patch is Reviewed-by: Christian König <christian.koenig@amd.com> But we might want to pull it in through Alex drm-next-3.18 (or -3.19) branch to avoid merge conflicts. Regards, Christian. >> diff --git a/drivers/gpu/drm/radeon/cik.c b/drivers/gpu/drm/radeon/cik.c >> index 0d761f73a7fa..7bdf80c2603d 100644 >> --- a/drivers/gpu/drm/radeon/cik.c >> +++ b/drivers/gpu/drm/radeon/cik.c >> @@ -3993,7 +3993,7 @@ struct radeon_fence *cik_copy_cpdma(struct radeon_device *rdev, >> return ERR_PTR(r); >> } >> >> - radeon_semaphore_sync_resv(sem, resv, false); >> + radeon_semaphore_sync_resv(rdev, sem, resv, false); >> radeon_semaphore_sync_rings(rdev, sem, ring->idx); >> >> for (i = 0; i < num_loops; i++) { >> diff --git a/drivers/gpu/drm/radeon/cik_sdma.c b/drivers/gpu/drm/radeon/cik_sdma.c >> index c01a6100c318..c473c9125295 100644 >> --- a/drivers/gpu/drm/radeon/cik_sdma.c >> +++ b/drivers/gpu/drm/radeon/cik_sdma.c >> @@ -571,7 +571,7 @@ struct radeon_fence *cik_copy_dma(struct radeon_device *rdev, >> return ERR_PTR(r); >> } >> >> - radeon_semaphore_sync_resv(sem, resv, false); >> + radeon_semaphore_sync_resv(rdev, sem, resv, false); >> radeon_semaphore_sync_rings(rdev, sem, ring->idx); >> >> for (i = 0; i < num_loops; i++) { >> diff --git a/drivers/gpu/drm/radeon/evergreen_dma.c b/drivers/gpu/drm/radeon/evergreen_dma.c >> index 946f37d0b469..66bcfadeedd1 100644 >> --- a/drivers/gpu/drm/radeon/evergreen_dma.c >> +++ b/drivers/gpu/drm/radeon/evergreen_dma.c >> @@ -133,7 +133,7 @@ struct radeon_fence *evergreen_copy_dma(struct radeon_device *rdev, >> return ERR_PTR(r); >> } >> >> - radeon_semaphore_sync_resv(sem, resv, false); >> + radeon_semaphore_sync_resv(rdev, sem, resv, false); >> radeon_semaphore_sync_rings(rdev, sem, ring->idx); >> >> for (i = 0; i < num_loops; i++) { >> diff --git a/drivers/gpu/drm/radeon/r600.c b/drivers/gpu/drm/radeon/r600.c >> index 25f367ac4637..f8eb519c3286 100644 >> --- a/drivers/gpu/drm/radeon/r600.c >> +++ b/drivers/gpu/drm/radeon/r600.c >> @@ -2912,7 +2912,7 @@ struct radeon_fence *r600_copy_cpdma(struct radeon_device *rdev, >> return ERR_PTR(r); >> } >> >> - radeon_semaphore_sync_resv(sem, resv, false); >> + radeon_semaphore_sync_resv(rdev, sem, resv, false); >> radeon_semaphore_sync_rings(rdev, sem, ring->idx); >> >> radeon_ring_write(ring, PACKET3(PACKET3_SET_CONFIG_REG, 1)); >> diff --git a/drivers/gpu/drm/radeon/r600_dma.c b/drivers/gpu/drm/radeon/r600_dma.c >> index fc54224ce87b..a49db830a47f 100644 >> --- a/drivers/gpu/drm/radeon/r600_dma.c >> +++ b/drivers/gpu/drm/radeon/r600_dma.c >> @@ -470,7 +470,7 @@ struct radeon_fence *r600_copy_dma(struct radeon_device *rdev, >> return ERR_PTR(r); >> } >> >> - radeon_semaphore_sync_resv(sem, resv, false); >> + radeon_semaphore_sync_resv(rdev, sem, resv, false); >> radeon_semaphore_sync_rings(rdev, sem, ring->idx); >> >> for (i = 0; i < num_loops; i++) { >> diff --git a/drivers/gpu/drm/radeon/radeon.h b/drivers/gpu/drm/radeon/radeon.h >> index 864457cd7c98..07aa961bf5ca 100644 >> --- a/drivers/gpu/drm/radeon/radeon.h >> +++ b/drivers/gpu/drm/radeon/radeon.h >> @@ -589,9 +589,10 @@ bool radeon_semaphore_emit_wait(struct radeon_device *rdev, int ring, >> struct radeon_semaphore *semaphore); >> void radeon_semaphore_sync_fence(struct radeon_semaphore *semaphore, >> struct radeon_fence *fence); >> -void radeon_semaphore_sync_resv(struct radeon_semaphore *semaphore, >> - struct reservation_object *resv, >> - bool shared); >> +int radeon_semaphore_sync_resv(struct radeon_device *rdev, >> + struct radeon_semaphore *semaphore, >> + struct reservation_object *resv, >> + bool shared); >> int radeon_semaphore_sync_rings(struct radeon_device *rdev, >> struct radeon_semaphore *semaphore, >> int waiting_ring); >> diff --git a/drivers/gpu/drm/radeon/radeon_cs.c b/drivers/gpu/drm/radeon/radeon_cs.c >> index f662de41ba49..1c893447d7cd 100644 >> --- a/drivers/gpu/drm/radeon/radeon_cs.c >> +++ b/drivers/gpu/drm/radeon/radeon_cs.c >> @@ -249,9 +249,9 @@ static int radeon_cs_get_ring(struct radeon_cs_parser *p, u32 ring, s32 priority >> return 0; >> } >> >> -static void radeon_cs_sync_rings(struct radeon_cs_parser *p) >> +static int radeon_cs_sync_rings(struct radeon_cs_parser *p) >> { >> - int i; >> + int i, r = 0; >> >> for (i = 0; i < p->nrelocs; i++) { >> struct reservation_object *resv; >> @@ -260,9 +260,13 @@ static void radeon_cs_sync_rings(struct radeon_cs_parser *p) >> continue; >> >> resv = p->relocs[i].robj->tbo.resv; >> - radeon_semaphore_sync_resv(p->ib.semaphore, resv, >> - p->relocs[i].tv.shared); >> + r = radeon_semaphore_sync_resv(p->rdev, p->ib.semaphore, resv, >> + p->relocs[i].tv.shared); >> + >> + if (r) >> + break; >> } >> + return r; >> } >> >> /* XXX: note that this is called from the legacy UMS CS ioctl as well */ >> @@ -472,13 +476,19 @@ static int radeon_cs_ib_chunk(struct radeon_device *rdev, >> return r; >> } >> >> + r = radeon_cs_sync_rings(parser); >> + if (r) { >> + if (r != -ERESTARTSYS) >> + DRM_ERROR("Failed to sync rings: %i\n", r); >> + return r; >> + } >> + >> if (parser->ring == R600_RING_TYPE_UVD_INDEX) >> radeon_uvd_note_usage(rdev); >> else if ((parser->ring == TN_RING_TYPE_VCE1_INDEX) || >> (parser->ring == TN_RING_TYPE_VCE2_INDEX)) >> radeon_vce_note_usage(rdev); >> >> - radeon_cs_sync_rings(parser); >> r = radeon_ib_schedule(rdev, &parser->ib, NULL, true); >> if (r) { >> DRM_ERROR("Failed to schedule IB !\n"); >> @@ -565,7 +575,13 @@ static int radeon_cs_ib_vm_chunk(struct radeon_device *rdev, >> if (r) { >> goto out; >> } >> - radeon_cs_sync_rings(parser); >> + >> + r = radeon_cs_sync_rings(parser); >> + if (r) { >> + if (r != -ERESTARTSYS) >> + DRM_ERROR("Failed to sync rings: %i\n", r); >> + goto out; >> + } >> radeon_semaphore_sync_fence(parser->ib.semaphore, vm->fence); >> >> if ((rdev->family >= CHIP_TAHITI) && >> diff --git a/drivers/gpu/drm/radeon/radeon_fence.c b/drivers/gpu/drm/radeon/radeon_fence.c >> index af9f2d6bd7d0..995167025282 100644 >> --- a/drivers/gpu/drm/radeon/radeon_fence.c >> +++ b/drivers/gpu/drm/radeon/radeon_fence.c >> @@ -541,6 +541,15 @@ int radeon_fence_wait(struct radeon_fence *fence, bool intr) >> uint64_t seq[RADEON_NUM_RINGS] = {}; >> long r; >> >> + /* >> + * This function should not be called on !radeon fences. >> + * If this is the case, it would mean this function can >> + * also be called on radeon fences belonging to another card. >> + * exclusive_lock is not held in that case. >> + */ >> + if (WARN_ON_ONCE(!to_radeon_fence(&fence->base))) >> + return fence_wait(&fence->base, intr); >> + >> seq[fence->ring] = fence->seq; >> r = radeon_fence_wait_seq_timeout(fence->rdev, seq, intr, MAX_SCHEDULE_TIMEOUT); >> if (r < 0) { >> diff --git a/drivers/gpu/drm/radeon/radeon_semaphore.c b/drivers/gpu/drm/radeon/radeon_semaphore.c >> index 4d4b0773638a..6deb08f045b7 100644 >> --- a/drivers/gpu/drm/radeon/radeon_semaphore.c >> +++ b/drivers/gpu/drm/radeon/radeon_semaphore.c >> @@ -124,27 +124,42 @@ void radeon_semaphore_sync_fence(struct radeon_semaphore *semaphore, >> * >> * Sync to the fence using this semaphore object >> */ >> -void radeon_semaphore_sync_resv(struct radeon_semaphore *sema, >> - struct reservation_object *resv, >> - bool shared) >> +int radeon_semaphore_sync_resv(struct radeon_device *rdev, >> + struct radeon_semaphore *sema, >> + struct reservation_object *resv, >> + bool shared) >> { >> struct reservation_object_list *flist; >> struct fence *f; >> + struct radeon_fence *fence; >> unsigned i; >> + int r = 0; >> >> /* always sync to the exclusive fence */ >> f = reservation_object_get_excl(resv); >> - radeon_semaphore_sync_fence(sema, (struct radeon_fence*)f); >> + fence = f ? to_radeon_fence(f) : NULL; >> + if (fence && fence->rdev == rdev) >> + radeon_semaphore_sync_fence(sema, fence); >> + else if (f) >> + r = fence_wait(f, true); >> >> flist = reservation_object_get_list(resv); >> - if (shared || !flist) >> - return; >> + if (shared || !flist || r) >> + return r; >> >> for (i = 0; i < flist->shared_count; ++i) { >> f = rcu_dereference_protected(flist->shared[i], >> reservation_object_held(resv)); >> - radeon_semaphore_sync_fence(sema, (struct radeon_fence*)f); >> + fence = to_radeon_fence(f); >> + if (fence && fence->rdev == rdev) >> + radeon_semaphore_sync_fence(sema, fence); >> + else >> + r = fence_wait(f, true); >> + >> + if (r) >> + break; >> } >> + return r; >> } >> >> /** >> diff --git a/drivers/gpu/drm/radeon/radeon_vm.c b/drivers/gpu/drm/radeon/radeon_vm.c >> index ce870959dff8..8af1a94e7448 100644 >> --- a/drivers/gpu/drm/radeon/radeon_vm.c >> +++ b/drivers/gpu/drm/radeon/radeon_vm.c >> @@ -698,7 +698,7 @@ int radeon_vm_update_page_directory(struct radeon_device *rdev, >> if (ib.length_dw != 0) { >> radeon_asic_vm_pad_ib(rdev, &ib); >> >> - radeon_semaphore_sync_resv(ib.semaphore, pd->tbo.resv, false); >> + radeon_semaphore_sync_resv(rdev, ib.semaphore, pd->tbo.resv, false); >> radeon_semaphore_sync_fence(ib.semaphore, vm->last_id_use); >> WARN_ON(ib.length_dw > ndw); >> r = radeon_ib_schedule(rdev, &ib, NULL, false); >> @@ -825,7 +825,7 @@ static void radeon_vm_update_ptes(struct radeon_device *rdev, >> unsigned nptes; >> uint64_t pte; >> >> - radeon_semaphore_sync_resv(ib->semaphore, pt->tbo.resv, false); >> + radeon_semaphore_sync_resv(rdev, ib->semaphore, pt->tbo.resv, false); >> >> if ((addr & ~mask) == (end & ~mask)) >> nptes = end - addr; >> diff --git a/drivers/gpu/drm/radeon/rv770_dma.c b/drivers/gpu/drm/radeon/rv770_dma.c >> index c112764adfdf..7f34bad2e724 100644 >> --- a/drivers/gpu/drm/radeon/rv770_dma.c >> +++ b/drivers/gpu/drm/radeon/rv770_dma.c >> @@ -67,7 +67,7 @@ struct radeon_fence *rv770_copy_dma(struct radeon_device *rdev, >> return ERR_PTR(r); >> } >> >> - radeon_semaphore_sync_resv(sem, resv, false); >> + radeon_semaphore_sync_resv(rdev, sem, resv, false); >> radeon_semaphore_sync_rings(rdev, sem, ring->idx); >> >> for (i = 0; i < num_loops; i++) { >> diff --git a/drivers/gpu/drm/radeon/si_dma.c b/drivers/gpu/drm/radeon/si_dma.c >> index 9b0dfbc913f3..b58f12b762d7 100644 >> --- a/drivers/gpu/drm/radeon/si_dma.c >> +++ b/drivers/gpu/drm/radeon/si_dma.c >> @@ -252,7 +252,7 @@ struct radeon_fence *si_copy_dma(struct radeon_device *rdev, >> return ERR_PTR(r); >> } >> >> - radeon_semaphore_sync_resv(sem, resv, false); >> + radeon_semaphore_sync_resv(rdev, sem, resv, false); >> radeon_semaphore_sync_rings(rdev, sem, ring->idx); >> >> for (i = 0; i < num_loops; i++) { >>
Hey, Op 01-10-14 om 11:04 schreef Christian König: > Am 01.10.2014 um 10:57 schrieb Maarten Lankhorst: >> Op 25-09-14 om 12:39 schreef Maarten Lankhorst: >>> Not the whole world is a radeon! :-) >>> Signed-off-by: Maarten Lankhorst <maarten.lankhorst@canonical.com> >>> --- >>> Changes: >>> - Removed interruptible parameter, only 1 place has a use for it, >>> and it's the only place that can hit it. >>> - Fail faster in radeon_semaphore_sync_resv. >>> - Make the break on error in radeon_cs.c more explicit. >>> - Upgrade the unlikely() to a WARN_ON_ONCE() in radeon_fence_wait, with a comment explaining why. >> Ping, can you review? > > LGTM, patch is Reviewed-by: Christian König <christian.koenig@amd.com> > > But we might want to pull it in through Alex drm-next-3.18 (or -3.19) branch to avoid merge conflicts. I can push nouveau through my own tree and once the patches are merged get the radeon changes through agd5f's tree? ~Maarten
On Wed, Oct 1, 2014 at 5:22 AM, Maarten Lankhorst <maarten.lankhorst@canonical.com> wrote: > Hey, > > Op 01-10-14 om 11:04 schreef Christian König: >> Am 01.10.2014 um 10:57 schrieb Maarten Lankhorst: >>> Op 25-09-14 om 12:39 schreef Maarten Lankhorst: >>>> Not the whole world is a radeon! :-) >>>> Signed-off-by: Maarten Lankhorst <maarten.lankhorst@canonical.com> >>>> --- >>>> Changes: >>>> - Removed interruptible parameter, only 1 place has a use for it, >>>> and it's the only place that can hit it. >>>> - Fail faster in radeon_semaphore_sync_resv. >>>> - Make the break on error in radeon_cs.c more explicit. >>>> - Upgrade the unlikely() to a WARN_ON_ONCE() in radeon_fence_wait, with a comment explaining why. >>> Ping, can you review? >> >> LGTM, patch is Reviewed-by: Christian König <christian.koenig@amd.com> >> >> But we might want to pull it in through Alex drm-next-3.18 (or -3.19) branch to avoid merge conflicts. > I can push nouveau through my own tree and once the patches are merged get the radeon changes through agd5f's tree? Either way works for me. Are we trying to get this in for 3.18 or 3.19? Alex
diff --git a/drivers/gpu/drm/radeon/cik.c b/drivers/gpu/drm/radeon/cik.c index 0d761f73a7fa..7bdf80c2603d 100644 --- a/drivers/gpu/drm/radeon/cik.c +++ b/drivers/gpu/drm/radeon/cik.c @@ -3993,7 +3993,7 @@ struct radeon_fence *cik_copy_cpdma(struct radeon_device *rdev, return ERR_PTR(r); } - radeon_semaphore_sync_resv(sem, resv, false); + radeon_semaphore_sync_resv(rdev, sem, resv, false); radeon_semaphore_sync_rings(rdev, sem, ring->idx); for (i = 0; i < num_loops; i++) { diff --git a/drivers/gpu/drm/radeon/cik_sdma.c b/drivers/gpu/drm/radeon/cik_sdma.c index c01a6100c318..c473c9125295 100644 --- a/drivers/gpu/drm/radeon/cik_sdma.c +++ b/drivers/gpu/drm/radeon/cik_sdma.c @@ -571,7 +571,7 @@ struct radeon_fence *cik_copy_dma(struct radeon_device *rdev, return ERR_PTR(r); } - radeon_semaphore_sync_resv(sem, resv, false); + radeon_semaphore_sync_resv(rdev, sem, resv, false); radeon_semaphore_sync_rings(rdev, sem, ring->idx); for (i = 0; i < num_loops; i++) { diff --git a/drivers/gpu/drm/radeon/evergreen_dma.c b/drivers/gpu/drm/radeon/evergreen_dma.c index 946f37d0b469..66bcfadeedd1 100644 --- a/drivers/gpu/drm/radeon/evergreen_dma.c +++ b/drivers/gpu/drm/radeon/evergreen_dma.c @@ -133,7 +133,7 @@ struct radeon_fence *evergreen_copy_dma(struct radeon_device *rdev, return ERR_PTR(r); } - radeon_semaphore_sync_resv(sem, resv, false); + radeon_semaphore_sync_resv(rdev, sem, resv, false); radeon_semaphore_sync_rings(rdev, sem, ring->idx); for (i = 0; i < num_loops; i++) { diff --git a/drivers/gpu/drm/radeon/r600.c b/drivers/gpu/drm/radeon/r600.c index 25f367ac4637..f8eb519c3286 100644 --- a/drivers/gpu/drm/radeon/r600.c +++ b/drivers/gpu/drm/radeon/r600.c @@ -2912,7 +2912,7 @@ struct radeon_fence *r600_copy_cpdma(struct radeon_device *rdev, return ERR_PTR(r); } - radeon_semaphore_sync_resv(sem, resv, false); + radeon_semaphore_sync_resv(rdev, sem, resv, false); radeon_semaphore_sync_rings(rdev, sem, ring->idx); radeon_ring_write(ring, PACKET3(PACKET3_SET_CONFIG_REG, 1)); diff --git a/drivers/gpu/drm/radeon/r600_dma.c b/drivers/gpu/drm/radeon/r600_dma.c index fc54224ce87b..a49db830a47f 100644 --- a/drivers/gpu/drm/radeon/r600_dma.c +++ b/drivers/gpu/drm/radeon/r600_dma.c @@ -470,7 +470,7 @@ struct radeon_fence *r600_copy_dma(struct radeon_device *rdev, return ERR_PTR(r); } - radeon_semaphore_sync_resv(sem, resv, false); + radeon_semaphore_sync_resv(rdev, sem, resv, false); radeon_semaphore_sync_rings(rdev, sem, ring->idx); for (i = 0; i < num_loops; i++) { diff --git a/drivers/gpu/drm/radeon/radeon.h b/drivers/gpu/drm/radeon/radeon.h index 864457cd7c98..07aa961bf5ca 100644 --- a/drivers/gpu/drm/radeon/radeon.h +++ b/drivers/gpu/drm/radeon/radeon.h @@ -589,9 +589,10 @@ bool radeon_semaphore_emit_wait(struct radeon_device *rdev, int ring, struct radeon_semaphore *semaphore); void radeon_semaphore_sync_fence(struct radeon_semaphore *semaphore, struct radeon_fence *fence); -void radeon_semaphore_sync_resv(struct radeon_semaphore *semaphore, - struct reservation_object *resv, - bool shared); +int radeon_semaphore_sync_resv(struct radeon_device *rdev, + struct radeon_semaphore *semaphore, + struct reservation_object *resv, + bool shared); int radeon_semaphore_sync_rings(struct radeon_device *rdev, struct radeon_semaphore *semaphore, int waiting_ring); diff --git a/drivers/gpu/drm/radeon/radeon_cs.c b/drivers/gpu/drm/radeon/radeon_cs.c index f662de41ba49..1c893447d7cd 100644 --- a/drivers/gpu/drm/radeon/radeon_cs.c +++ b/drivers/gpu/drm/radeon/radeon_cs.c @@ -249,9 +249,9 @@ static int radeon_cs_get_ring(struct radeon_cs_parser *p, u32 ring, s32 priority return 0; } -static void radeon_cs_sync_rings(struct radeon_cs_parser *p) +static int radeon_cs_sync_rings(struct radeon_cs_parser *p) { - int i; + int i, r = 0; for (i = 0; i < p->nrelocs; i++) { struct reservation_object *resv; @@ -260,9 +260,13 @@ static void radeon_cs_sync_rings(struct radeon_cs_parser *p) continue; resv = p->relocs[i].robj->tbo.resv; - radeon_semaphore_sync_resv(p->ib.semaphore, resv, - p->relocs[i].tv.shared); + r = radeon_semaphore_sync_resv(p->rdev, p->ib.semaphore, resv, + p->relocs[i].tv.shared); + + if (r) + break; } + return r; } /* XXX: note that this is called from the legacy UMS CS ioctl as well */ @@ -472,13 +476,19 @@ static int radeon_cs_ib_chunk(struct radeon_device *rdev, return r; } + r = radeon_cs_sync_rings(parser); + if (r) { + if (r != -ERESTARTSYS) + DRM_ERROR("Failed to sync rings: %i\n", r); + return r; + } + if (parser->ring == R600_RING_TYPE_UVD_INDEX) radeon_uvd_note_usage(rdev); else if ((parser->ring == TN_RING_TYPE_VCE1_INDEX) || (parser->ring == TN_RING_TYPE_VCE2_INDEX)) radeon_vce_note_usage(rdev); - radeon_cs_sync_rings(parser); r = radeon_ib_schedule(rdev, &parser->ib, NULL, true); if (r) { DRM_ERROR("Failed to schedule IB !\n"); @@ -565,7 +575,13 @@ static int radeon_cs_ib_vm_chunk(struct radeon_device *rdev, if (r) { goto out; } - radeon_cs_sync_rings(parser); + + r = radeon_cs_sync_rings(parser); + if (r) { + if (r != -ERESTARTSYS) + DRM_ERROR("Failed to sync rings: %i\n", r); + goto out; + } radeon_semaphore_sync_fence(parser->ib.semaphore, vm->fence); if ((rdev->family >= CHIP_TAHITI) && diff --git a/drivers/gpu/drm/radeon/radeon_fence.c b/drivers/gpu/drm/radeon/radeon_fence.c index af9f2d6bd7d0..995167025282 100644 --- a/drivers/gpu/drm/radeon/radeon_fence.c +++ b/drivers/gpu/drm/radeon/radeon_fence.c @@ -541,6 +541,15 @@ int radeon_fence_wait(struct radeon_fence *fence, bool intr) uint64_t seq[RADEON_NUM_RINGS] = {}; long r; + /* + * This function should not be called on !radeon fences. + * If this is the case, it would mean this function can + * also be called on radeon fences belonging to another card. + * exclusive_lock is not held in that case. + */ + if (WARN_ON_ONCE(!to_radeon_fence(&fence->base))) + return fence_wait(&fence->base, intr); + seq[fence->ring] = fence->seq; r = radeon_fence_wait_seq_timeout(fence->rdev, seq, intr, MAX_SCHEDULE_TIMEOUT); if (r < 0) { diff --git a/drivers/gpu/drm/radeon/radeon_semaphore.c b/drivers/gpu/drm/radeon/radeon_semaphore.c index 4d4b0773638a..6deb08f045b7 100644 --- a/drivers/gpu/drm/radeon/radeon_semaphore.c +++ b/drivers/gpu/drm/radeon/radeon_semaphore.c @@ -124,27 +124,42 @@ void radeon_semaphore_sync_fence(struct radeon_semaphore *semaphore, * * Sync to the fence using this semaphore object */ -void radeon_semaphore_sync_resv(struct radeon_semaphore *sema, - struct reservation_object *resv, - bool shared) +int radeon_semaphore_sync_resv(struct radeon_device *rdev, + struct radeon_semaphore *sema, + struct reservation_object *resv, + bool shared) { struct reservation_object_list *flist; struct fence *f; + struct radeon_fence *fence; unsigned i; + int r = 0; /* always sync to the exclusive fence */ f = reservation_object_get_excl(resv); - radeon_semaphore_sync_fence(sema, (struct radeon_fence*)f); + fence = f ? to_radeon_fence(f) : NULL; + if (fence && fence->rdev == rdev) + radeon_semaphore_sync_fence(sema, fence); + else if (f) + r = fence_wait(f, true); flist = reservation_object_get_list(resv); - if (shared || !flist) - return; + if (shared || !flist || r) + return r; for (i = 0; i < flist->shared_count; ++i) { f = rcu_dereference_protected(flist->shared[i], reservation_object_held(resv)); - radeon_semaphore_sync_fence(sema, (struct radeon_fence*)f); + fence = to_radeon_fence(f); + if (fence && fence->rdev == rdev) + radeon_semaphore_sync_fence(sema, fence); + else + r = fence_wait(f, true); + + if (r) + break; } + return r; } /** diff --git a/drivers/gpu/drm/radeon/radeon_vm.c b/drivers/gpu/drm/radeon/radeon_vm.c index ce870959dff8..8af1a94e7448 100644 --- a/drivers/gpu/drm/radeon/radeon_vm.c +++ b/drivers/gpu/drm/radeon/radeon_vm.c @@ -698,7 +698,7 @@ int radeon_vm_update_page_directory(struct radeon_device *rdev, if (ib.length_dw != 0) { radeon_asic_vm_pad_ib(rdev, &ib); - radeon_semaphore_sync_resv(ib.semaphore, pd->tbo.resv, false); + radeon_semaphore_sync_resv(rdev, ib.semaphore, pd->tbo.resv, false); radeon_semaphore_sync_fence(ib.semaphore, vm->last_id_use); WARN_ON(ib.length_dw > ndw); r = radeon_ib_schedule(rdev, &ib, NULL, false); @@ -825,7 +825,7 @@ static void radeon_vm_update_ptes(struct radeon_device *rdev, unsigned nptes; uint64_t pte; - radeon_semaphore_sync_resv(ib->semaphore, pt->tbo.resv, false); + radeon_semaphore_sync_resv(rdev, ib->semaphore, pt->tbo.resv, false); if ((addr & ~mask) == (end & ~mask)) nptes = end - addr; diff --git a/drivers/gpu/drm/radeon/rv770_dma.c b/drivers/gpu/drm/radeon/rv770_dma.c index c112764adfdf..7f34bad2e724 100644 --- a/drivers/gpu/drm/radeon/rv770_dma.c +++ b/drivers/gpu/drm/radeon/rv770_dma.c @@ -67,7 +67,7 @@ struct radeon_fence *rv770_copy_dma(struct radeon_device *rdev, return ERR_PTR(r); } - radeon_semaphore_sync_resv(sem, resv, false); + radeon_semaphore_sync_resv(rdev, sem, resv, false); radeon_semaphore_sync_rings(rdev, sem, ring->idx); for (i = 0; i < num_loops; i++) { diff --git a/drivers/gpu/drm/radeon/si_dma.c b/drivers/gpu/drm/radeon/si_dma.c index 9b0dfbc913f3..b58f12b762d7 100644 --- a/drivers/gpu/drm/radeon/si_dma.c +++ b/drivers/gpu/drm/radeon/si_dma.c @@ -252,7 +252,7 @@ struct radeon_fence *si_copy_dma(struct radeon_device *rdev, return ERR_PTR(r); } - radeon_semaphore_sync_resv(sem, resv, false); + radeon_semaphore_sync_resv(rdev, sem, resv, false); radeon_semaphore_sync_rings(rdev, sem, ring->idx); for (i = 0; i < num_loops; i++) {
Not the whole world is a radeon! :-) Signed-off-by: Maarten Lankhorst <maarten.lankhorst@canonical.com> --- Changes: - Removed interruptible parameter, only 1 place has a use for it, and it's the only place that can hit it. - Fail faster in radeon_semaphore_sync_resv. - Make the break on error in radeon_cs.c more explicit. - Upgrade the unlikely() to a WARN_ON_ONCE() in radeon_fence_wait, with a comment explaining why.