diff mbox series

[3/6] drm: add support of syncobj timeline point wait v2

Message ID 20180920110353.16114-3-david1.zhou@amd.com (mailing list archive)
State New, archived
Headers show
Series [1/6] drm: add flags to drm_syncobj_find_fence | expand

Commit Message

Chunming Zhou Sept. 20, 2018, 11:03 a.m. UTC
points array is one-to-one match with syncobjs array.
v2:
add a separate ioctl for timeline point wait, otherwise we break the uapi.

Signed-off-by: Chunming Zhou <david1.zhou@amd.com>
---
 drivers/gpu/drm/drm_internal.h |  2 +
 drivers/gpu/drm/drm_ioctl.c    |  2 +
 drivers/gpu/drm/drm_syncobj.c  | 99 +++++++++++++++++++++++++++++-----
 include/uapi/drm/drm.h         | 14 +++++
 4 files changed, 103 insertions(+), 14 deletions(-)

Comments

Christian König Sept. 20, 2018, 11:11 a.m. UTC | #1
Am 20.09.2018 um 13:03 schrieb Chunming Zhou:
> points array is one-to-one match with syncobjs array.
> v2:
> add seperate ioctl for timeline point wait, otherwise break uapi.
>
> Signed-off-by: Chunming Zhou <david1.zhou@amd.com>
> ---
>   drivers/gpu/drm/drm_internal.h |  2 +
>   drivers/gpu/drm/drm_ioctl.c    |  2 +
>   drivers/gpu/drm/drm_syncobj.c  | 99 +++++++++++++++++++++++++++++-----
>   include/uapi/drm/drm.h         | 14 +++++
>   4 files changed, 103 insertions(+), 14 deletions(-)
>
> diff --git a/drivers/gpu/drm/drm_internal.h b/drivers/gpu/drm/drm_internal.h
> index 0c4eb4a9ab31..566d44e3c782 100644
> --- a/drivers/gpu/drm/drm_internal.h
> +++ b/drivers/gpu/drm/drm_internal.h
> @@ -183,6 +183,8 @@ int drm_syncobj_fd_to_handle_ioctl(struct drm_device *dev, void *data,
>   				   struct drm_file *file_private);
>   int drm_syncobj_wait_ioctl(struct drm_device *dev, void *data,
>   			   struct drm_file *file_private);
> +int drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,
> +				    struct drm_file *file_private);
>   int drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,
>   			    struct drm_file *file_private);
>   int drm_syncobj_signal_ioctl(struct drm_device *dev, void *data,
> diff --git a/drivers/gpu/drm/drm_ioctl.c b/drivers/gpu/drm/drm_ioctl.c
> index 6b4a633b4240..c0891614f516 100644
> --- a/drivers/gpu/drm/drm_ioctl.c
> +++ b/drivers/gpu/drm/drm_ioctl.c
> @@ -669,6 +669,8 @@ static const struct drm_ioctl_desc drm_ioctls[] = {
>   		      DRM_UNLOCKED|DRM_RENDER_ALLOW),
>   	DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_WAIT, drm_syncobj_wait_ioctl,
>   		      DRM_UNLOCKED|DRM_RENDER_ALLOW),
> +	DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT, drm_syncobj_timeline_wait_ioctl,
> +		      DRM_UNLOCKED|DRM_RENDER_ALLOW),
>   	DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_RESET, drm_syncobj_reset_ioctl,
>   		      DRM_UNLOCKED|DRM_RENDER_ALLOW),
>   	DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_SIGNAL, drm_syncobj_signal_ioctl,
> diff --git a/drivers/gpu/drm/drm_syncobj.c b/drivers/gpu/drm/drm_syncobj.c
> index 67472bd77c83..a43de0e4616c 100644
> --- a/drivers/gpu/drm/drm_syncobj.c
> +++ b/drivers/gpu/drm/drm_syncobj.c
> @@ -126,13 +126,14 @@ static void drm_syncobj_add_callback_locked(struct drm_syncobj *syncobj,
>   }
>   
>   static int drm_syncobj_fence_get_or_add_callback(struct drm_syncobj *syncobj,
> +						 u64 point,
>   						 struct dma_fence **fence,
>   						 struct drm_syncobj_cb *cb,
>   						 drm_syncobj_func_t func)
>   {
>   	int ret;
>   
> -	ret = drm_syncobj_search_fence(syncobj, 0, 0, fence);
> +	ret = drm_syncobj_search_fence(syncobj, point, 0, fence);
>   	if (!ret)
>   		return 1;
>   
> @@ -143,7 +144,7 @@ static int drm_syncobj_fence_get_or_add_callback(struct drm_syncobj *syncobj,
>   	 */
>   	if (!list_empty(&syncobj->signal_pt_list)) {
>   		spin_unlock(&syncobj->lock);
> -		drm_syncobj_search_fence(syncobj, 0, 0, fence);
> +		drm_syncobj_search_fence(syncobj, point, 0, fence);
>   		if (*fence)
>   			return 1;
>   		spin_lock(&syncobj->lock);
> @@ -358,7 +359,9 @@ void drm_syncobj_replace_fence(struct drm_syncobj *syncobj,
>   		spin_lock(&syncobj->lock);
>   		list_for_each_entry_safe(cur, tmp, &syncobj->cb_list, node) {
>   			list_del_init(&cur->node);
> +			spin_unlock(&syncobj->lock);
>   			cur->func(syncobj, cur);
> +			spin_lock(&syncobj->lock);

That looks fishy to me. Why do we need to unlock and who guarantees that 
tmp is still valid when we grab the lock again?

Apart from that I can't see anything obviously wrong, but I certainly need
to take a closer look.

Christian.

>   		}
>   		spin_unlock(&syncobj->lock);
>   	}
> @@ -856,6 +859,7 @@ struct syncobj_wait_entry {
>   	struct dma_fence *fence;
>   	struct dma_fence_cb fence_cb;
>   	struct drm_syncobj_cb syncobj_cb;
> +	u64    point;
>   };
>   
>   static void syncobj_wait_fence_func(struct dma_fence *fence,
> @@ -873,12 +877,13 @@ static void syncobj_wait_syncobj_func(struct drm_syncobj *syncobj,
>   	struct syncobj_wait_entry *wait =
>   		container_of(cb, struct syncobj_wait_entry, syncobj_cb);
>   
> -	drm_syncobj_search_fence(syncobj, 0, 0, &wait->fence);
> +	drm_syncobj_search_fence(syncobj, wait->point, 0, &wait->fence);
>   
>   	wake_up_process(wait->task);
>   }
>   
>   static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
> +						  void __user *user_points,
>   						  uint32_t count,
>   						  uint32_t flags,
>   						  signed long timeout,
> @@ -886,13 +891,27 @@ static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>   {
>   	struct syncobj_wait_entry *entries;
>   	struct dma_fence *fence;
> +	uint64_t *points;
>   	signed long ret;
>   	uint32_t signaled_count, i;
>   
> -	entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);
> -	if (!entries)
> +	points = kmalloc_array(count, sizeof(*points), GFP_KERNEL);
> +	if (points == NULL)
>   		return -ENOMEM;
>   
> +	if (!user_points) {
> +		memset(points, 0, count * sizeof(uint64_t));
> +	} else if (copy_from_user(points, user_points, sizeof(uint64_t) * count)) {
> +		ret = -EFAULT;
> +		goto err_free_points;
> +	}
> +
> +
> +	entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);
> +	if (!entries) {
> +		ret = -ENOMEM;
> +		goto err_free_points;
> +	}
>   	/* Walk the list of sync objects and initialize entries.  We do
>   	 * this up-front so that we can properly return -EINVAL if there is
>   	 * a syncobj with a missing fence and then never have the chance of
> @@ -901,7 +920,8 @@ static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>   	signaled_count = 0;
>   	for (i = 0; i < count; ++i) {
>   		entries[i].task = current;
> -		ret = drm_syncobj_search_fence(syncobjs[i], 0, 0,
> +		entries[i].point = points[i];
> +		ret = drm_syncobj_search_fence(syncobjs[i], points[i], 0,
>   					       &entries[i].fence);
>   		if (!entries[i].fence) {
>   			if (flags & DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {
> @@ -940,6 +960,7 @@ static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>   	if (flags & DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {
>   		for (i = 0; i < count; ++i) {
>   			drm_syncobj_fence_get_or_add_callback(syncobjs[i],
> +							      entries[i].point,
>   							      &entries[i].fence,
>   							      &entries[i].syncobj_cb,
>   							      syncobj_wait_syncobj_func);
> @@ -1003,6 +1024,9 @@ static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>   	}
>   	kfree(entries);
>   
> +err_free_points:
> +	kfree(points);
> +
>   	return ret;
>   }
>   
> @@ -1041,20 +1065,33 @@ static signed long drm_timeout_abs_to_jiffies(int64_t timeout_nsec)
>   static int drm_syncobj_array_wait(struct drm_device *dev,
>   				  struct drm_file *file_private,
>   				  struct drm_syncobj_wait *wait,
> -				  struct drm_syncobj **syncobjs)
> +				  struct drm_syncobj_timeline_wait *timeline_wait,
> +				  struct drm_syncobj **syncobjs, bool timeline)
>   {
> -	signed long timeout = drm_timeout_abs_to_jiffies(wait->timeout_nsec);
> +	signed long timeout = 0;
>   	signed long ret = 0;
>   	uint32_t first = ~0;
>   
> -	ret = drm_syncobj_array_wait_timeout(syncobjs,
> -					     wait->count_handles,
> -					     wait->flags,
> -					     timeout, &first);
> +	if (!timeline) {
> +		timeout = drm_timeout_abs_to_jiffies(wait->timeout_nsec);
> +		ret = drm_syncobj_array_wait_timeout(syncobjs,
> +						     NULL,
> +						     wait->count_handles,
> +						     wait->flags,
> +						     timeout, &first);
> +		wait->first_signaled = first;
> +	} else {
> +		timeout = drm_timeout_abs_to_jiffies(timeline_wait->timeout_nsec);
> +		ret = drm_syncobj_array_wait_timeout(syncobjs,
> +						     u64_to_user_ptr(timeline_wait->points),
> +						     timeline_wait->count_handles,
> +						     timeline_wait->flags,
> +						     timeout, &first);
> +		timeline_wait->first_signaled = first;
> +	}
>   	if (ret < 0)
>   		return ret;
>   
> -	wait->first_signaled = first;
>   	if (ret == 0)
>   		return -ETIME;
>   	return 0;
> @@ -1142,13 +1179,47 @@ drm_syncobj_wait_ioctl(struct drm_device *dev, void *data,
>   		return ret;
>   
>   	ret = drm_syncobj_array_wait(dev, file_private,
> -				     args, syncobjs);
> +				     args, NULL, syncobjs, false);
>   
>   	drm_syncobj_array_free(syncobjs, args->count_handles);
>   
>   	return ret;
>   }
>   
> +int
> +drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,
> +				struct drm_file *file_private)
> +{
> +	struct drm_syncobj_timeline_wait *args = data;
> +	struct drm_syncobj **syncobjs;
> +	int ret = 0;
> +
> +	if (!drm_core_check_feature(dev, DRIVER_SYNCOBJ))
> +		return -ENODEV;
> +
> +	if (args->flags & ~(DRM_SYNCOBJ_WAIT_FLAGS_WAIT_ALL |
> +			    DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT))
> +		return -EINVAL;
> +
> +	if (args->count_handles == 0)
> +		return -EINVAL;
> +
> +	ret = drm_syncobj_array_find(file_private,
> +				     u64_to_user_ptr(args->handles),
> +				     args->count_handles,
> +				     &syncobjs);
> +	if (ret < 0)
> +		return ret;
> +
> +	ret = drm_syncobj_array_wait(dev, file_private,
> +				     NULL, args, syncobjs, true);
> +
> +	drm_syncobj_array_free(syncobjs, args->count_handles);
> +
> +	return ret;
> +}
> +
> +
>   int
>   drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,
>   			struct drm_file *file_private)
> diff --git a/include/uapi/drm/drm.h b/include/uapi/drm/drm.h
> index cebdb2541eb7..501e86d81f47 100644
> --- a/include/uapi/drm/drm.h
> +++ b/include/uapi/drm/drm.h
> @@ -748,6 +748,19 @@ struct drm_syncobj_wait {
>   	__u32 pad;
>   };
>   
> +struct drm_syncobj_timeline_wait {
> +	__u64 handles;
> +	/* wait on specific timeline point for every handles*/
> +	__u64 points;
> +	/* absolute timeout */
> +	__s64 timeout_nsec;
> +	__u32 count_handles;
> +	__u32 flags;
> +	__u32 first_signaled; /* only valid when not waiting all */
> +	__u32 pad;
> +};
> +
> +
>   struct drm_syncobj_array {
>   	__u64 handles;
>   	__u32 count_handles;
> @@ -910,6 +923,7 @@ extern "C" {
>   #define DRM_IOCTL_MODE_GET_LEASE	DRM_IOWR(0xC8, struct drm_mode_get_lease)
>   #define DRM_IOCTL_MODE_REVOKE_LEASE	DRM_IOWR(0xC9, struct drm_mode_revoke_lease)
>   
> +#define DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT	DRM_IOWR(0xCA, struct drm_syncobj_timeline_wait)
>   /**
>    * Device specific ioctls should only be in their respective headers
>    * The device specific ioctl range is from 0x40 to 0x9f.
Chunming Zhou Sept. 21, 2018, 7:15 a.m. UTC | #2
> -----Original Message-----
> From: amd-gfx <amd-gfx-bounces@lists.freedesktop.org> On Behalf Of
> Christian König
> Sent: Thursday, September 20, 2018 7:11 PM
> To: Zhou, David(ChunMing) <David1.Zhou@amd.com>; dri-
> devel@lists.freedesktop.org
> Cc: amd-gfx@lists.freedesktop.org
> Subject: Re: [PATCH 3/6] drm: add support of syncobj timeline point wait v2
> 
> Am 20.09.2018 um 13:03 schrieb Chunming Zhou:
> > points array is one-to-one match with syncobjs array.
> > v2:
> > add seperate ioctl for timeline point wait, otherwise break uapi.
> >
> > Signed-off-by: Chunming Zhou <david1.zhou@amd.com>
> > ---
> >   drivers/gpu/drm/drm_internal.h |  2 +
> >   drivers/gpu/drm/drm_ioctl.c    |  2 +
> >   drivers/gpu/drm/drm_syncobj.c  | 99
> +++++++++++++++++++++++++++++-----
> >   include/uapi/drm/drm.h         | 14 +++++
> >   4 files changed, 103 insertions(+), 14 deletions(-)
> >
> > diff --git a/drivers/gpu/drm/drm_internal.h
> > b/drivers/gpu/drm/drm_internal.h index 0c4eb4a9ab31..566d44e3c782
> > 100644
> > --- a/drivers/gpu/drm/drm_internal.h
> > +++ b/drivers/gpu/drm/drm_internal.h
> > @@ -183,6 +183,8 @@ int drm_syncobj_fd_to_handle_ioctl(struct
> drm_device *dev, void *data,
> >   				   struct drm_file *file_private);
> >   int drm_syncobj_wait_ioctl(struct drm_device *dev, void *data,
> >   			   struct drm_file *file_private);
> > +int drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,
> > +				    struct drm_file *file_private);
> >   int drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,
> >   			    struct drm_file *file_private);
> >   int drm_syncobj_signal_ioctl(struct drm_device *dev, void *data,
> > diff --git a/drivers/gpu/drm/drm_ioctl.c b/drivers/gpu/drm/drm_ioctl.c
> > index 6b4a633b4240..c0891614f516 100644
> > --- a/drivers/gpu/drm/drm_ioctl.c
> > +++ b/drivers/gpu/drm/drm_ioctl.c
> > @@ -669,6 +669,8 @@ static const struct drm_ioctl_desc drm_ioctls[] = {
> >   		      DRM_UNLOCKED|DRM_RENDER_ALLOW),
> >   	DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_WAIT,
> drm_syncobj_wait_ioctl,
> >   		      DRM_UNLOCKED|DRM_RENDER_ALLOW),
> > +	DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT,
> drm_syncobj_timeline_wait_ioctl,
> > +		      DRM_UNLOCKED|DRM_RENDER_ALLOW),
> >   	DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_RESET,
> drm_syncobj_reset_ioctl,
> >   		      DRM_UNLOCKED|DRM_RENDER_ALLOW),
> >   	DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_SIGNAL,
> drm_syncobj_signal_ioctl,
> > diff --git a/drivers/gpu/drm/drm_syncobj.c
> > b/drivers/gpu/drm/drm_syncobj.c index 67472bd77c83..a43de0e4616c
> > 100644
> > --- a/drivers/gpu/drm/drm_syncobj.c
> > +++ b/drivers/gpu/drm/drm_syncobj.c
> > @@ -126,13 +126,14 @@ static void
> drm_syncobj_add_callback_locked(struct drm_syncobj *syncobj,
> >   }
> >
> >   static int drm_syncobj_fence_get_or_add_callback(struct drm_syncobj
> > *syncobj,
> > +						 u64 point,
> >   						 struct dma_fence **fence,
> >   						 struct drm_syncobj_cb *cb,
> >   						 drm_syncobj_func_t func)
> >   {
> >   	int ret;
> >
> > -	ret = drm_syncobj_search_fence(syncobj, 0, 0, fence);
> > +	ret = drm_syncobj_search_fence(syncobj, point, 0, fence);
> >   	if (!ret)
> >   		return 1;
> >
> > @@ -143,7 +144,7 @@ static int
> drm_syncobj_fence_get_or_add_callback(struct drm_syncobj *syncobj,
> >   	 */
> >   	if (!list_empty(&syncobj->signal_pt_list)) {
> >   		spin_unlock(&syncobj->lock);
> > -		drm_syncobj_search_fence(syncobj, 0, 0, fence);
> > +		drm_syncobj_search_fence(syncobj, point, 0, fence);
> >   		if (*fence)
> >   			return 1;
> >   		spin_lock(&syncobj->lock);
> > @@ -358,7 +359,9 @@ void drm_syncobj_replace_fence(struct
> drm_syncobj *syncobj,
> >   		spin_lock(&syncobj->lock);
> >   		list_for_each_entry_safe(cur, tmp, &syncobj->cb_list, node)
> {
> >   			list_del_init(&cur->node);
> > +			spin_unlock(&syncobj->lock);
> >   			cur->func(syncobj, cur);
> > +			spin_lock(&syncobj->lock);
> 
> That looks fishy to me. Why do we need to unlock 

The callback function will call _search_fence, which needs to grab the lock; if we don't unlock here, we deadlock.


>and who guarantees that
> tmp is still valid when we grab the lock again?

Sorry about that; I quickly fixed the deadlock while debugging and forgot to take care of that.
How about splicing the callbacks onto a tmp list and then iterating over it with list_for_xxx without the lock?

Any other comments on the patch series and the libdrm patches?   Bumping the patch set version for just that one comment seems to be overkill.

Thanks,
David Zhou

> 
> Apart from that can't see anything obvious wrong, but I certainly need to
> take a closer look.
> 
> Christian.
> 
> >   		}
> >   		spin_unlock(&syncobj->lock);
> >   	}
> > @@ -856,6 +859,7 @@ struct syncobj_wait_entry {
> >   	struct dma_fence *fence;
> >   	struct dma_fence_cb fence_cb;
> >   	struct drm_syncobj_cb syncobj_cb;
> > +	u64    point;
> >   };
> >
> >   static void syncobj_wait_fence_func(struct dma_fence *fence, @@
> > -873,12 +877,13 @@ static void syncobj_wait_syncobj_func(struct
> drm_syncobj *syncobj,
> >   	struct syncobj_wait_entry *wait =
> >   		container_of(cb, struct syncobj_wait_entry, syncobj_cb);
> >
> > -	drm_syncobj_search_fence(syncobj, 0, 0, &wait->fence);
> > +	drm_syncobj_search_fence(syncobj, wait->point, 0, &wait->fence);
> >
> >   	wake_up_process(wait->task);
> >   }
> >
> >   static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj
> > **syncobjs,
> > +						  void __user *user_points,
> >   						  uint32_t count,
> >   						  uint32_t flags,
> >   						  signed long timeout,
> > @@ -886,13 +891,27 @@ static signed long
> drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
> >   {
> >   	struct syncobj_wait_entry *entries;
> >   	struct dma_fence *fence;
> > +	uint64_t *points;
> >   	signed long ret;
> >   	uint32_t signaled_count, i;
> >
> > -	entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);
> > -	if (!entries)
> > +	points = kmalloc_array(count, sizeof(*points), GFP_KERNEL);
> > +	if (points == NULL)
> >   		return -ENOMEM;
> >
> > +	if (!user_points) {
> > +		memset(points, 0, count * sizeof(uint64_t));
> > +	} else if (copy_from_user(points, user_points, sizeof(uint64_t) *
> count)) {
> > +		ret = -EFAULT;
> > +		goto err_free_points;
> > +	}
> > +
> > +
> > +	entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);
> > +	if (!entries) {
> > +		ret = -ENOMEM;
> > +		goto err_free_points;
> > +	}
> >   	/* Walk the list of sync objects and initialize entries.  We do
> >   	 * this up-front so that we can properly return -EINVAL if there is
> >   	 * a syncobj with a missing fence and then never have the chance of
> > @@ -901,7 +920,8 @@ static signed long
> drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
> >   	signaled_count = 0;
> >   	for (i = 0; i < count; ++i) {
> >   		entries[i].task = current;
> > -		ret = drm_syncobj_search_fence(syncobjs[i], 0, 0,
> > +		entries[i].point = points[i];
> > +		ret = drm_syncobj_search_fence(syncobjs[i], points[i], 0,
> >   					       &entries[i].fence);
> >   		if (!entries[i].fence) {
> >   			if (flags &
> DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) { @@ -940,6
> > +960,7 @@ static signed long drm_syncobj_array_wait_timeout(struct
> drm_syncobj **syncobjs,
> >   	if (flags & DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {
> >   		for (i = 0; i < count; ++i) {
> >
> 	drm_syncobj_fence_get_or_add_callback(syncobjs[i],
> > +							      entries[i].point,
> >   							      &entries[i].fence,
> >
> &entries[i].syncobj_cb,
> >
> syncobj_wait_syncobj_func); @@ -1003,6 +1024,9 @@
> > static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj
> **syncobjs,
> >   	}
> >   	kfree(entries);
> >
> > +err_free_points:
> > +	kfree(points);
> > +
> >   	return ret;
> >   }
> >
> > @@ -1041,20 +1065,33 @@ static signed long
> drm_timeout_abs_to_jiffies(int64_t timeout_nsec)
> >   static int drm_syncobj_array_wait(struct drm_device *dev,
> >   				  struct drm_file *file_private,
> >   				  struct drm_syncobj_wait *wait,
> > -				  struct drm_syncobj **syncobjs)
> > +				  struct drm_syncobj_timeline_wait
> *timeline_wait,
> > +				  struct drm_syncobj **syncobjs, bool
> timeline)
> >   {
> > -	signed long timeout = drm_timeout_abs_to_jiffies(wait-
> >timeout_nsec);
> > +	signed long timeout = 0;
> >   	signed long ret = 0;
> >   	uint32_t first = ~0;
> >
> > -	ret = drm_syncobj_array_wait_timeout(syncobjs,
> > -					     wait->count_handles,
> > -					     wait->flags,
> > -					     timeout, &first);
> > +	if (!timeline) {
> > +		timeout = drm_timeout_abs_to_jiffies(wait->timeout_nsec);
> > +		ret = drm_syncobj_array_wait_timeout(syncobjs,
> > +						     NULL,
> > +						     wait->count_handles,
> > +						     wait->flags,
> > +						     timeout, &first);
> > +		wait->first_signaled = first;
> > +	} else {
> > +		timeout = drm_timeout_abs_to_jiffies(timeline_wait-
> >timeout_nsec);
> > +		ret = drm_syncobj_array_wait_timeout(syncobjs,
> > +
> u64_to_user_ptr(timeline_wait->points),
> > +						     timeline_wait-
> >count_handles,
> > +						     timeline_wait->flags,
> > +						     timeout, &first);
> > +		timeline_wait->first_signaled = first;
> > +	}
> >   	if (ret < 0)
> >   		return ret;
> >
> > -	wait->first_signaled = first;
> >   	if (ret == 0)
> >   		return -ETIME;
> >   	return 0;
> > @@ -1142,13 +1179,47 @@ drm_syncobj_wait_ioctl(struct drm_device
> *dev, void *data,
> >   		return ret;
> >
> >   	ret = drm_syncobj_array_wait(dev, file_private,
> > -				     args, syncobjs);
> > +				     args, NULL, syncobjs, false);
> >
> >   	drm_syncobj_array_free(syncobjs, args->count_handles);
> >
> >   	return ret;
> >   }
> >
> > +int
> > +drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,
> > +				struct drm_file *file_private)
> > +{
> > +	struct drm_syncobj_timeline_wait *args = data;
> > +	struct drm_syncobj **syncobjs;
> > +	int ret = 0;
> > +
> > +	if (!drm_core_check_feature(dev, DRIVER_SYNCOBJ))
> > +		return -ENODEV;
> > +
> > +	if (args->flags & ~(DRM_SYNCOBJ_WAIT_FLAGS_WAIT_ALL |
> > +
> DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT))
> > +		return -EINVAL;
> > +
> > +	if (args->count_handles == 0)
> > +		return -EINVAL;
> > +
> > +	ret = drm_syncobj_array_find(file_private,
> > +				     u64_to_user_ptr(args->handles),
> > +				     args->count_handles,
> > +				     &syncobjs);
> > +	if (ret < 0)
> > +		return ret;
> > +
> > +	ret = drm_syncobj_array_wait(dev, file_private,
> > +				     NULL, args, syncobjs, true);
> > +
> > +	drm_syncobj_array_free(syncobjs, args->count_handles);
> > +
> > +	return ret;
> > +}
> > +
> > +
> >   int
> >   drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,
> >   			struct drm_file *file_private)
> > diff --git a/include/uapi/drm/drm.h b/include/uapi/drm/drm.h index
> > cebdb2541eb7..501e86d81f47 100644
> > --- a/include/uapi/drm/drm.h
> > +++ b/include/uapi/drm/drm.h
> > @@ -748,6 +748,19 @@ struct drm_syncobj_wait {
> >   	__u32 pad;
> >   };
> >
> > +struct drm_syncobj_timeline_wait {
> > +	__u64 handles;
> > +	/* wait on specific timeline point for every handles*/
> > +	__u64 points;
> > +	/* absolute timeout */
> > +	__s64 timeout_nsec;
> > +	__u32 count_handles;
> > +	__u32 flags;
> > +	__u32 first_signaled; /* only valid when not waiting all */
> > +	__u32 pad;
> > +};
> > +
> > +
> >   struct drm_syncobj_array {
> >   	__u64 handles;
> >   	__u32 count_handles;
> > @@ -910,6 +923,7 @@ extern "C" {
> >   #define DRM_IOCTL_MODE_GET_LEASE	DRM_IOWR(0xC8, struct
> drm_mode_get_lease)
> >   #define DRM_IOCTL_MODE_REVOKE_LEASE	DRM_IOWR(0xC9,
> struct drm_mode_revoke_lease)
> >
> > +#define DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT	DRM_IOWR(0xCA,
> struct drm_syncobj_timeline_wait)
> >   /**
> >    * Device specific ioctls should only be in their respective headers
> >    * The device specific ioctl range is from 0x40 to 0x9f.
> 
> _______________________________________________
> amd-gfx mailing list
> amd-gfx@lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/amd-gfx
Christian König Sept. 21, 2018, 7:21 a.m. UTC | #3
Am 21.09.2018 um 09:15 schrieb Zhou, David(ChunMing):
>
>> -----Original Message-----
>> From: amd-gfx <amd-gfx-bounces@lists.freedesktop.org> On Behalf Of
>> Christian König
>> Sent: Thursday, September 20, 2018 7:11 PM
>> To: Zhou, David(ChunMing) <David1.Zhou@amd.com>; dri-
>> devel@lists.freedesktop.org
>> Cc: amd-gfx@lists.freedesktop.org
>> Subject: Re: [PATCH 3/6] drm: add support of syncobj timeline point wait v2
>>
>> Am 20.09.2018 um 13:03 schrieb Chunming Zhou:
>>> points array is one-to-one match with syncobjs array.
>>> v2:
>>> add seperate ioctl for timeline point wait, otherwise break uapi.
>>>
>>> Signed-off-by: Chunming Zhou <david1.zhou@amd.com>
>>> ---
>>>    drivers/gpu/drm/drm_internal.h |  2 +
>>>    drivers/gpu/drm/drm_ioctl.c    |  2 +
>>>    drivers/gpu/drm/drm_syncobj.c  | 99
>> +++++++++++++++++++++++++++++-----
>>>    include/uapi/drm/drm.h         | 14 +++++
>>>    4 files changed, 103 insertions(+), 14 deletions(-)
>>>
>>> diff --git a/drivers/gpu/drm/drm_internal.h
>>> b/drivers/gpu/drm/drm_internal.h index 0c4eb4a9ab31..566d44e3c782
>>> 100644
>>> --- a/drivers/gpu/drm/drm_internal.h
>>> +++ b/drivers/gpu/drm/drm_internal.h
>>> @@ -183,6 +183,8 @@ int drm_syncobj_fd_to_handle_ioctl(struct
>> drm_device *dev, void *data,
>>>    				   struct drm_file *file_private);
>>>    int drm_syncobj_wait_ioctl(struct drm_device *dev, void *data,
>>>    			   struct drm_file *file_private);
>>> +int drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,
>>> +				    struct drm_file *file_private);
>>>    int drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,
>>>    			    struct drm_file *file_private);
>>>    int drm_syncobj_signal_ioctl(struct drm_device *dev, void *data,
>>> diff --git a/drivers/gpu/drm/drm_ioctl.c b/drivers/gpu/drm/drm_ioctl.c
>>> index 6b4a633b4240..c0891614f516 100644
>>> --- a/drivers/gpu/drm/drm_ioctl.c
>>> +++ b/drivers/gpu/drm/drm_ioctl.c
>>> @@ -669,6 +669,8 @@ static const struct drm_ioctl_desc drm_ioctls[] = {
>>>    		      DRM_UNLOCKED|DRM_RENDER_ALLOW),
>>>    	DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_WAIT,
>> drm_syncobj_wait_ioctl,
>>>    		      DRM_UNLOCKED|DRM_RENDER_ALLOW),
>>> +	DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT,
>> drm_syncobj_timeline_wait_ioctl,
>>> +		      DRM_UNLOCKED|DRM_RENDER_ALLOW),
>>>    	DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_RESET,
>> drm_syncobj_reset_ioctl,
>>>    		      DRM_UNLOCKED|DRM_RENDER_ALLOW),
>>>    	DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_SIGNAL,
>> drm_syncobj_signal_ioctl,
>>> diff --git a/drivers/gpu/drm/drm_syncobj.c
>>> b/drivers/gpu/drm/drm_syncobj.c index 67472bd77c83..a43de0e4616c
>>> 100644
>>> --- a/drivers/gpu/drm/drm_syncobj.c
>>> +++ b/drivers/gpu/drm/drm_syncobj.c
>>> @@ -126,13 +126,14 @@ static void
>> drm_syncobj_add_callback_locked(struct drm_syncobj *syncobj,
>>>    }
>>>
>>>    static int drm_syncobj_fence_get_or_add_callback(struct drm_syncobj
>>> *syncobj,
>>> +						 u64 point,
>>>    						 struct dma_fence **fence,
>>>    						 struct drm_syncobj_cb *cb,
>>>    						 drm_syncobj_func_t func)
>>>    {
>>>    	int ret;
>>>
>>> -	ret = drm_syncobj_search_fence(syncobj, 0, 0, fence);
>>> +	ret = drm_syncobj_search_fence(syncobj, point, 0, fence);
>>>    	if (!ret)
>>>    		return 1;
>>>
>>> @@ -143,7 +144,7 @@ static int
>> drm_syncobj_fence_get_or_add_callback(struct drm_syncobj *syncobj,
>>>    	 */
>>>    	if (!list_empty(&syncobj->signal_pt_list)) {
>>>    		spin_unlock(&syncobj->lock);
>>> -		drm_syncobj_search_fence(syncobj, 0, 0, fence);
>>> +		drm_syncobj_search_fence(syncobj, point, 0, fence);
>>>    		if (*fence)
>>>    			return 1;
>>>    		spin_lock(&syncobj->lock);
>>> @@ -358,7 +359,9 @@ void drm_syncobj_replace_fence(struct
>> drm_syncobj *syncobj,
>>>    		spin_lock(&syncobj->lock);
>>>    		list_for_each_entry_safe(cur, tmp, &syncobj->cb_list, node)
>> {
>>>    			list_del_init(&cur->node);
>>> +			spin_unlock(&syncobj->lock);
>>>    			cur->func(syncobj, cur);
>>> +			spin_lock(&syncobj->lock);
>> That looks fishy to me. Why do we need to unlock
> Cb func will call _search_fence, which will need to grab the lock, otherwise deadlock.
>
>
>> and who guarantees that
>> tmp is still valid when we grab the lock again?
> Sorry for that, quickly  fix deadlock and forget to care that when debug.
> How about splice to a tmp list, and then list_for _xxx without lock?

Yeah, that should work. Alternative is to use something like "while 
(!list_empty()) { e = list_first_entry(); list_del(e)....". But either 
way should work.

> Any other comment on patch series and libdrm patches?   That one comment increases a patch set version seems be overcommit.

At first glance that stuff looked good, but give me till Monday for
that. I'm currently in the middle of debugging issues.

Thanks,
Christian.

>
> Thanks,
> David Zhou
>
>> Apart from that can't see anything obvious wrong, but I certainly need to
>> take a closer look.
>>
>> Christian.
>>
>>>    		}
>>>    		spin_unlock(&syncobj->lock);
>>>    	}
>>> @@ -856,6 +859,7 @@ struct syncobj_wait_entry {
>>>    	struct dma_fence *fence;
>>>    	struct dma_fence_cb fence_cb;
>>>    	struct drm_syncobj_cb syncobj_cb;
>>> +	u64    point;
>>>    };
>>>
>>>    static void syncobj_wait_fence_func(struct dma_fence *fence, @@
>>> -873,12 +877,13 @@ static void syncobj_wait_syncobj_func(struct
>> drm_syncobj *syncobj,
>>>    	struct syncobj_wait_entry *wait =
>>>    		container_of(cb, struct syncobj_wait_entry, syncobj_cb);
>>>
>>> -	drm_syncobj_search_fence(syncobj, 0, 0, &wait->fence);
>>> +	drm_syncobj_search_fence(syncobj, wait->point, 0, &wait->fence);
>>>
>>>    	wake_up_process(wait->task);
>>>    }
>>>
>>>    static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj
>>> **syncobjs,
>>> +						  void __user *user_points,
>>>    						  uint32_t count,
>>>    						  uint32_t flags,
>>>    						  signed long timeout,
>>> @@ -886,13 +891,27 @@ static signed long
>> drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>>>    {
>>>    	struct syncobj_wait_entry *entries;
>>>    	struct dma_fence *fence;
>>> +	uint64_t *points;
>>>    	signed long ret;
>>>    	uint32_t signaled_count, i;
>>>
>>> -	entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);
>>> -	if (!entries)
>>> +	points = kmalloc_array(count, sizeof(*points), GFP_KERNEL);
>>> +	if (points == NULL)
>>>    		return -ENOMEM;
>>>
>>> +	if (!user_points) {
>>> +		memset(points, 0, count * sizeof(uint64_t));
>>> +	} else if (copy_from_user(points, user_points, sizeof(uint64_t) *
>> count)) {
>>> +		ret = -EFAULT;
>>> +		goto err_free_points;
>>> +	}
>>> +
>>> +
>>> +	entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);
>>> +	if (!entries) {
>>> +		ret = -ENOMEM;
>>> +		goto err_free_points;
>>> +	}
>>>    	/* Walk the list of sync objects and initialize entries.  We do
>>>    	 * this up-front so that we can properly return -EINVAL if there is
>>>    	 * a syncobj with a missing fence and then never have the chance of
>>> @@ -901,7 +920,8 @@ static signed long
>> drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>>>    	signaled_count = 0;
>>>    	for (i = 0; i < count; ++i) {
>>>    		entries[i].task = current;
>>> -		ret = drm_syncobj_search_fence(syncobjs[i], 0, 0,
>>> +		entries[i].point = points[i];
>>> +		ret = drm_syncobj_search_fence(syncobjs[i], points[i], 0,
>>>    					       &entries[i].fence);
>>>    		if (!entries[i].fence) {
>>>    			if (flags &
>> DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) { @@ -940,6
>>> +960,7 @@ static signed long drm_syncobj_array_wait_timeout(struct
>> drm_syncobj **syncobjs,
>>>    	if (flags & DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {
>>>    		for (i = 0; i < count; ++i) {
>>>
>> 	drm_syncobj_fence_get_or_add_callback(syncobjs[i],
>>> +							      entries[i].point,
>>>    							      &entries[i].fence,
>>>
>> &entries[i].syncobj_cb,
>> syncobj_wait_syncobj_func); @@ -1003,6 +1024,9 @@
>>> static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj
>> **syncobjs,
>>>    	}
>>>    	kfree(entries);
>>>
>>> +err_free_points:
>>> +	kfree(points);
>>> +
>>>    	return ret;
>>>    }
>>>
>>> @@ -1041,20 +1065,33 @@ static signed long
>> drm_timeout_abs_to_jiffies(int64_t timeout_nsec)
>>>    static int drm_syncobj_array_wait(struct drm_device *dev,
>>>    				  struct drm_file *file_private,
>>>    				  struct drm_syncobj_wait *wait,
>>> -				  struct drm_syncobj **syncobjs)
>>> +				  struct drm_syncobj_timeline_wait
>> *timeline_wait,
>>> +				  struct drm_syncobj **syncobjs, bool
>> timeline)
>>>    {
>>> -	signed long timeout = drm_timeout_abs_to_jiffies(wait-
>>> timeout_nsec);
>>> +	signed long timeout = 0;
>>>    	signed long ret = 0;
>>>    	uint32_t first = ~0;
>>>
>>> -	ret = drm_syncobj_array_wait_timeout(syncobjs,
>>> -					     wait->count_handles,
>>> -					     wait->flags,
>>> -					     timeout, &first);
>>> +	if (!timeline) {
>>> +		timeout = drm_timeout_abs_to_jiffies(wait->timeout_nsec);
>>> +		ret = drm_syncobj_array_wait_timeout(syncobjs,
>>> +						     NULL,
>>> +						     wait->count_handles,
>>> +						     wait->flags,
>>> +						     timeout, &first);
>>> +		wait->first_signaled = first;
>>> +	} else {
>>> +		timeout = drm_timeout_abs_to_jiffies(timeline_wait-
>>> timeout_nsec);
>>> +		ret = drm_syncobj_array_wait_timeout(syncobjs,
>>> +
>> u64_to_user_ptr(timeline_wait->points),
>>> +						     timeline_wait-
>>> count_handles,
>>> +						     timeline_wait->flags,
>>> +						     timeout, &first);
>>> +		timeline_wait->first_signaled = first;
>>> +	}
>>>    	if (ret < 0)
>>>    		return ret;
>>>
>>> -	wait->first_signaled = first;
>>>    	if (ret == 0)
>>>    		return -ETIME;
>>>    	return 0;
>>> @@ -1142,13 +1179,47 @@ drm_syncobj_wait_ioctl(struct drm_device
>> *dev, void *data,
>>>    		return ret;
>>>
>>>    	ret = drm_syncobj_array_wait(dev, file_private,
>>> -				     args, syncobjs);
>>> +				     args, NULL, syncobjs, false);
>>>
>>>    	drm_syncobj_array_free(syncobjs, args->count_handles);
>>>
>>>    	return ret;
>>>    }
>>>
>>> +int
>>> +drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,
>>> +				struct drm_file *file_private)
>>> +{
>>> +	struct drm_syncobj_timeline_wait *args = data;
>>> +	struct drm_syncobj **syncobjs;
>>> +	int ret = 0;
>>> +
>>> +	if (!drm_core_check_feature(dev, DRIVER_SYNCOBJ))
>>> +		return -ENODEV;
>>> +
>>> +	if (args->flags & ~(DRM_SYNCOBJ_WAIT_FLAGS_WAIT_ALL |
>>> +
>> DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT))
>>> +		return -EINVAL;
>>> +
>>> +	if (args->count_handles == 0)
>>> +		return -EINVAL;
>>> +
>>> +	ret = drm_syncobj_array_find(file_private,
>>> +				     u64_to_user_ptr(args->handles),
>>> +				     args->count_handles,
>>> +				     &syncobjs);
>>> +	if (ret < 0)
>>> +		return ret;
>>> +
>>> +	ret = drm_syncobj_array_wait(dev, file_private,
>>> +				     NULL, args, syncobjs, true);
>>> +
>>> +	drm_syncobj_array_free(syncobjs, args->count_handles);
>>> +
>>> +	return ret;
>>> +}
>>> +
>>> +
>>>    int
>>>    drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,
>>>    			struct drm_file *file_private)
>>> diff --git a/include/uapi/drm/drm.h b/include/uapi/drm/drm.h index
>>> cebdb2541eb7..501e86d81f47 100644
>>> --- a/include/uapi/drm/drm.h
>>> +++ b/include/uapi/drm/drm.h
>>> @@ -748,6 +748,19 @@ struct drm_syncobj_wait {
>>>    	__u32 pad;
>>>    };
>>>
>>> +struct drm_syncobj_timeline_wait {
>>> +	__u64 handles;
>>> +	/* wait on specific timeline point for every handles*/
>>> +	__u64 points;
>>> +	/* absolute timeout */
>>> +	__s64 timeout_nsec;
>>> +	__u32 count_handles;
>>> +	__u32 flags;
>>> +	__u32 first_signaled; /* only valid when not waiting all */
>>> +	__u32 pad;
>>> +};
>>> +
>>> +
>>>    struct drm_syncobj_array {
>>>    	__u64 handles;
>>>    	__u32 count_handles;
>>> @@ -910,6 +923,7 @@ extern "C" {
>>>    #define DRM_IOCTL_MODE_GET_LEASE	DRM_IOWR(0xC8, struct
>> drm_mode_get_lease)
>>>    #define DRM_IOCTL_MODE_REVOKE_LEASE	DRM_IOWR(0xC9,
>> struct drm_mode_revoke_lease)
>>> +#define DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT	DRM_IOWR(0xCA,
>> struct drm_syncobj_timeline_wait)
>>>    /**
>>>     * Device specific ioctls should only be in their respective headers
>>>     * The device specific ioctl range is from 0x40 to 0x9f.
>> _______________________________________________
>> amd-gfx mailing list
>> amd-gfx@lists.freedesktop.org
>> https://lists.freedesktop.org/mailman/listinfo/amd-gfx
Jason Ekstrand Sept. 25, 2018, 9:22 a.m. UTC | #4
On Thu, Sep 20, 2018 at 6:04 AM Chunming Zhou <david1.zhou@amd.com> wrote:

> points array is one-to-one match with syncobjs array.
> v2:
> add separate ioctl for timeline point wait, otherwise break uapi.
>

I think ioctl structs can be extended as long as fields aren't re-ordered.
I'm not sure on the details of this though as I'm not a particularly
experienced kernel developer.

Another general comment (no good place to put it) is that I think we want
two kinds of waits:  Wait for time point to be completed and wait for time
point to become available.  The first is the usual CPU wait for completion
while the second is for use by userspace drivers to wait until the first
moment where they can submit work which depends on a given time point.


> Signed-off-by: Chunming Zhou <david1.zhou@amd.com>
> ---
>  drivers/gpu/drm/drm_internal.h |  2 +
>  drivers/gpu/drm/drm_ioctl.c    |  2 +
>  drivers/gpu/drm/drm_syncobj.c  | 99 +++++++++++++++++++++++++++++-----
>  include/uapi/drm/drm.h         | 14 +++++
>  4 files changed, 103 insertions(+), 14 deletions(-)
>
> diff --git a/drivers/gpu/drm/drm_internal.h
> b/drivers/gpu/drm/drm_internal.h
> index 0c4eb4a9ab31..566d44e3c782 100644
> --- a/drivers/gpu/drm/drm_internal.h
> +++ b/drivers/gpu/drm/drm_internal.h
> @@ -183,6 +183,8 @@ int drm_syncobj_fd_to_handle_ioctl(struct drm_device
> *dev, void *data,
>                                    struct drm_file *file_private);
>  int drm_syncobj_wait_ioctl(struct drm_device *dev, void *data,
>                            struct drm_file *file_private);
> +int drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,
> +                                   struct drm_file *file_private);
>  int drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,
>                             struct drm_file *file_private);
>  int drm_syncobj_signal_ioctl(struct drm_device *dev, void *data,
> diff --git a/drivers/gpu/drm/drm_ioctl.c b/drivers/gpu/drm/drm_ioctl.c
> index 6b4a633b4240..c0891614f516 100644
> --- a/drivers/gpu/drm/drm_ioctl.c
> +++ b/drivers/gpu/drm/drm_ioctl.c
> @@ -669,6 +669,8 @@ static const struct drm_ioctl_desc drm_ioctls[] = {
>                       DRM_UNLOCKED|DRM_RENDER_ALLOW),
>         DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_WAIT, drm_syncobj_wait_ioctl,
>                       DRM_UNLOCKED|DRM_RENDER_ALLOW),
> +       DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT,
> drm_syncobj_timeline_wait_ioctl,
> +                     DRM_UNLOCKED|DRM_RENDER_ALLOW),
>         DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_RESET, drm_syncobj_reset_ioctl,
>                       DRM_UNLOCKED|DRM_RENDER_ALLOW),
>         DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_SIGNAL, drm_syncobj_signal_ioctl,
> diff --git a/drivers/gpu/drm/drm_syncobj.c b/drivers/gpu/drm/drm_syncobj.c
> index 67472bd77c83..a43de0e4616c 100644
> --- a/drivers/gpu/drm/drm_syncobj.c
> +++ b/drivers/gpu/drm/drm_syncobj.c
> @@ -126,13 +126,14 @@ static void drm_syncobj_add_callback_locked(struct
> drm_syncobj *syncobj,
>  }
>
>  static int drm_syncobj_fence_get_or_add_callback(struct drm_syncobj
> *syncobj,
> +                                                u64 point,
>                                                  struct dma_fence **fence,
>                                                  struct drm_syncobj_cb *cb,
>                                                  drm_syncobj_func_t func)
>  {
>         int ret;
>
> -       ret = drm_syncobj_search_fence(syncobj, 0, 0, fence);
> +       ret = drm_syncobj_search_fence(syncobj, point, 0, fence);
>         if (!ret)
>                 return 1;
>
> @@ -143,7 +144,7 @@ static int
> drm_syncobj_fence_get_or_add_callback(struct drm_syncobj *syncobj,
>          */
>         if (!list_empty(&syncobj->signal_pt_list)) {
>                 spin_unlock(&syncobj->lock);
> -               drm_syncobj_search_fence(syncobj, 0, 0, fence);
> +               drm_syncobj_search_fence(syncobj, point, 0, fence);
>                 if (*fence)
>                         return 1;
>                 spin_lock(&syncobj->lock);
> @@ -358,7 +359,9 @@ void drm_syncobj_replace_fence(struct drm_syncobj
> *syncobj,
>                 spin_lock(&syncobj->lock);
>                 list_for_each_entry_safe(cur, tmp, &syncobj->cb_list,
> node) {
>                         list_del_init(&cur->node);
> +                       spin_unlock(&syncobj->lock);
>                         cur->func(syncobj, cur);
> +                       spin_lock(&syncobj->lock);
>                 }
>                 spin_unlock(&syncobj->lock);
>         }
> @@ -856,6 +859,7 @@ struct syncobj_wait_entry {
>         struct dma_fence *fence;
>         struct dma_fence_cb fence_cb;
>         struct drm_syncobj_cb syncobj_cb;
> +       u64    point;
>  };
>
>  static void syncobj_wait_fence_func(struct dma_fence *fence,
> @@ -873,12 +877,13 @@ static void syncobj_wait_syncobj_func(struct
> drm_syncobj *syncobj,
>         struct syncobj_wait_entry *wait =
>                 container_of(cb, struct syncobj_wait_entry, syncobj_cb);
>
> -       drm_syncobj_search_fence(syncobj, 0, 0, &wait->fence);
> +       drm_syncobj_search_fence(syncobj, wait->point, 0, &wait->fence);
>
>         wake_up_process(wait->task);
>  }
>
>  static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj
> **syncobjs,
> +                                                 void __user *user_points,
>                                                   uint32_t count,
>                                                   uint32_t flags,
>                                                   signed long timeout,
> @@ -886,13 +891,27 @@ static signed long
> drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>  {
>         struct syncobj_wait_entry *entries;
>         struct dma_fence *fence;
> +       uint64_t *points;
>         signed long ret;
>         uint32_t signaled_count, i;
>
> -       entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);
> -       if (!entries)
> +       points = kmalloc_array(count, sizeof(*points), GFP_KERNEL);
> +       if (points == NULL)
>                 return -ENOMEM;
>
> +       if (!user_points) {
> +               memset(points, 0, count * sizeof(uint64_t));
> +       } else if (copy_from_user(points, user_points, sizeof(uint64_t) *
> count)) {
> +               ret = -EFAULT;
> +               goto err_free_points;
> +       }
> +
> +
> +       entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);
> +       if (!entries) {
> +               ret = -ENOMEM;
> +               goto err_free_points;
> +       }
>         /* Walk the list of sync objects and initialize entries.  We do
>          * this up-front so that we can properly return -EINVAL if there is
>          * a syncobj with a missing fence and then never have the chance of
> @@ -901,7 +920,8 @@ static signed long
> drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>         signaled_count = 0;
>         for (i = 0; i < count; ++i) {
>                 entries[i].task = current;
> -               ret = drm_syncobj_search_fence(syncobjs[i], 0, 0,
> +               entries[i].point = points[i];
> +               ret = drm_syncobj_search_fence(syncobjs[i], points[i], 0,
>                                                &entries[i].fence);
>                 if (!entries[i].fence) {
>                         if (flags &
> DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {
> @@ -940,6 +960,7 @@ static signed long
> drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>         if (flags & DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {
>                 for (i = 0; i < count; ++i) {
>                         drm_syncobj_fence_get_or_add_callback(syncobjs[i],
> +
>  entries[i].point,
>
> &entries[i].fence,
>
> &entries[i].syncobj_cb,
>
> syncobj_wait_syncobj_func);
> @@ -1003,6 +1024,9 @@ static signed long
> drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>         }
>         kfree(entries);
>
> +err_free_points:
> +       kfree(points);
> +
>         return ret;
>  }
>
> @@ -1041,20 +1065,33 @@ static signed long
> drm_timeout_abs_to_jiffies(int64_t timeout_nsec)
>  static int drm_syncobj_array_wait(struct drm_device *dev,
>                                   struct drm_file *file_private,
>                                   struct drm_syncobj_wait *wait,
> -                                 struct drm_syncobj **syncobjs)
> +                                 struct drm_syncobj_timeline_wait
> *timeline_wait,
> +                                 struct drm_syncobj **syncobjs, bool
> timeline)
>  {
> -       signed long timeout =
> drm_timeout_abs_to_jiffies(wait->timeout_nsec);
> +       signed long timeout = 0;
>         signed long ret = 0;
>         uint32_t first = ~0;
>
> -       ret = drm_syncobj_array_wait_timeout(syncobjs,
> -                                            wait->count_handles,
> -                                            wait->flags,
> -                                            timeout, &first);
> +       if (!timeline) {
> +               timeout = drm_timeout_abs_to_jiffies(wait->timeout_nsec);
> +               ret = drm_syncobj_array_wait_timeout(syncobjs,
> +                                                    NULL,
> +                                                    wait->count_handles,
> +                                                    wait->flags,
> +                                                    timeout, &first);
> +               wait->first_signaled = first;
> +       } else {
> +               timeout =
> drm_timeout_abs_to_jiffies(timeline_wait->timeout_nsec);
> +               ret = drm_syncobj_array_wait_timeout(syncobjs,
> +
> u64_to_user_ptr(timeline_wait->points),
> +
> timeline_wait->count_handles,
> +                                                    timeline_wait->flags,
> +                                                    timeout, &first);
> +               timeline_wait->first_signaled = first;
> +       }
>         if (ret < 0)
>                 return ret;
>
> -       wait->first_signaled = first;
>         if (ret == 0)
>                 return -ETIME;
>         return 0;
> @@ -1142,13 +1179,47 @@ drm_syncobj_wait_ioctl(struct drm_device *dev,
> void *data,
>                 return ret;
>
>         ret = drm_syncobj_array_wait(dev, file_private,
> -                                    args, syncobjs);
> +                                    args, NULL, syncobjs, false);
>
>         drm_syncobj_array_free(syncobjs, args->count_handles);
>
>         return ret;
>  }
>
> +int
> +drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,
> +                               struct drm_file *file_private)
> +{
> +       struct drm_syncobj_timeline_wait *args = data;
> +       struct drm_syncobj **syncobjs;
> +       int ret = 0;
> +
> +       if (!drm_core_check_feature(dev, DRIVER_SYNCOBJ))
> +               return -ENODEV;
> +
> +       if (args->flags & ~(DRM_SYNCOBJ_WAIT_FLAGS_WAIT_ALL |
> +                           DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT))
> +               return -EINVAL;
> +
> +       if (args->count_handles == 0)
> +               return -EINVAL;
> +
> +       ret = drm_syncobj_array_find(file_private,
> +                                    u64_to_user_ptr(args->handles),
> +                                    args->count_handles,
> +                                    &syncobjs);
> +       if (ret < 0)
> +               return ret;
> +
> +       ret = drm_syncobj_array_wait(dev, file_private,
> +                                    NULL, args, syncobjs, true);
> +
> +       drm_syncobj_array_free(syncobjs, args->count_handles);
> +
> +       return ret;
> +}
> +
> +
>  int
>  drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,
>                         struct drm_file *file_private)
> diff --git a/include/uapi/drm/drm.h b/include/uapi/drm/drm.h
> index cebdb2541eb7..501e86d81f47 100644
> --- a/include/uapi/drm/drm.h
> +++ b/include/uapi/drm/drm.h
> @@ -748,6 +748,19 @@ struct drm_syncobj_wait {
>         __u32 pad;
>  };
>
> +struct drm_syncobj_timeline_wait {
> +       __u64 handles;
> +       /* wait on specific timeline point for every handles*/
> +       __u64 points;
> +       /* absolute timeout */
> +       __s64 timeout_nsec;
> +       __u32 count_handles;
> +       __u32 flags;
> +       __u32 first_signaled; /* only valid when not waiting all */
> +       __u32 pad;
> +};
> +
> +
>  struct drm_syncobj_array {
>         __u64 handles;
>         __u32 count_handles;
> @@ -910,6 +923,7 @@ extern "C" {
>  #define DRM_IOCTL_MODE_GET_LEASE       DRM_IOWR(0xC8, struct
> drm_mode_get_lease)
>  #define DRM_IOCTL_MODE_REVOKE_LEASE    DRM_IOWR(0xC9, struct
> drm_mode_revoke_lease)
>
> +#define DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT        DRM_IOWR(0xCA, struct
> drm_syncobj_timeline_wait)
>  /**
>   * Device specific ioctls should only be in their respective headers
>   * The device specific ioctl range is from 0x40 to 0x9f.
> --
> 2.17.1
>
> _______________________________________________
> dri-devel mailing list
> dri-devel@lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/dri-devel
>
<div dir="ltr"><div class="gmail_quote"><div dir="ltr">On Thu, Sep 20, 2018 at 6:04 AM Chunming Zhou &lt;<a href="mailto:david1.zhou@amd.com">david1.zhou@amd.com</a>&gt; wrote:<br></div><blockquote class="gmail_quote" style="margin:0 0 0 .8ex;border-left:1px #ccc solid;padding-left:1ex">points array is one-to-one match with syncobjs array.<br>
v2:<br>
add seperate ioctl for timeline point wait, otherwise break uapi.<br></blockquote><div><br></div><div>I think ioctl structs can be extended as long as fields aren&#39;t re-ordered.  I&#39;m not sure on the details of this though as I&#39;m not a particularly experienced kernel developer.</div><div><br></div><div>Another general comment (no good place to put it) is that I think we want two kinds of waits:  Wait for time point to be completed and wait for time point to become available.  The first is the usual CPU wait for completion while the second is for use by userspace drivers to wait until the first moment where they can submit work which depends on a given time point.<br></div><div> </div><blockquote class="gmail_quote" style="margin:0 0 0 .8ex;border-left:1px #ccc solid;padding-left:1ex">
Signed-off-by: Chunming Zhou &lt;<a href="mailto:david1.zhou@amd.com" target="_blank">david1.zhou@amd.com</a>&gt;<br>
---<br>
 drivers/gpu/drm/drm_internal.h |  2 +<br>
 drivers/gpu/drm/drm_ioctl.c    |  2 +<br>
 drivers/gpu/drm/drm_syncobj.c  | 99 +++++++++++++++++++++++++++++-----<br>
 include/uapi/drm/drm.h         | 14 +++++<br>
 4 files changed, 103 insertions(+), 14 deletions(-)<br>
<br>
diff --git a/drivers/gpu/drm/drm_internal.h b/drivers/gpu/drm/drm_internal.h<br>
index 0c4eb4a9ab31..566d44e3c782 100644<br>
--- a/drivers/gpu/drm/drm_internal.h<br>
+++ b/drivers/gpu/drm/drm_internal.h<br>
@@ -183,6 +183,8 @@ int drm_syncobj_fd_to_handle_ioctl(struct drm_device *dev, void *data,<br>
                                   struct drm_file *file_private);<br>
 int drm_syncobj_wait_ioctl(struct drm_device *dev, void *data,<br>
                           struct drm_file *file_private);<br>
+int drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,<br>
+                                   struct drm_file *file_private);<br>
 int drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,<br>
                            struct drm_file *file_private);<br>
 int drm_syncobj_signal_ioctl(struct drm_device *dev, void *data,<br>
diff --git a/drivers/gpu/drm/drm_ioctl.c b/drivers/gpu/drm/drm_ioctl.c<br>
index 6b4a633b4240..c0891614f516 100644<br>
--- a/drivers/gpu/drm/drm_ioctl.c<br>
+++ b/drivers/gpu/drm/drm_ioctl.c<br>
@@ -669,6 +669,8 @@ static const struct drm_ioctl_desc drm_ioctls[] = {<br>
                      DRM_UNLOCKED|DRM_RENDER_ALLOW),<br>
        DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_WAIT, drm_syncobj_wait_ioctl,<br>
                      DRM_UNLOCKED|DRM_RENDER_ALLOW),<br>
+       DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT, drm_syncobj_timeline_wait_ioctl,<br>
+                     DRM_UNLOCKED|DRM_RENDER_ALLOW),<br>
        DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_RESET, drm_syncobj_reset_ioctl,<br>
                      DRM_UNLOCKED|DRM_RENDER_ALLOW),<br>
        DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_SIGNAL, drm_syncobj_signal_ioctl,<br>
diff --git a/drivers/gpu/drm/drm_syncobj.c b/drivers/gpu/drm/drm_syncobj.c<br>
index 67472bd77c83..a43de0e4616c 100644<br>
--- a/drivers/gpu/drm/drm_syncobj.c<br>
+++ b/drivers/gpu/drm/drm_syncobj.c<br>
@@ -126,13 +126,14 @@ static void drm_syncobj_add_callback_locked(struct drm_syncobj *syncobj,<br>
 }<br>
<br>
 static int drm_syncobj_fence_get_or_add_callback(struct drm_syncobj *syncobj,<br>
+                                                u64 point,<br>
                                                 struct dma_fence **fence,<br>
                                                 struct drm_syncobj_cb *cb,<br>
                                                 drm_syncobj_func_t func)<br>
 {<br>
        int ret;<br>
<br>
-       ret = drm_syncobj_search_fence(syncobj, 0, 0, fence);<br>
+       ret = drm_syncobj_search_fence(syncobj, point, 0, fence);<br>
        if (!ret)<br>
                return 1;<br>
<br>
@@ -143,7 +144,7 @@ static int drm_syncobj_fence_get_or_add_callback(struct drm_syncobj *syncobj,<br>
         */<br>
        if (!list_empty(&amp;syncobj-&gt;signal_pt_list)) {<br>
                spin_unlock(&amp;syncobj-&gt;lock);<br>
-               drm_syncobj_search_fence(syncobj, 0, 0, fence);<br>
+               drm_syncobj_search_fence(syncobj, point, 0, fence);<br>
                if (*fence)<br>
                        return 1;<br>
                spin_lock(&amp;syncobj-&gt;lock);<br>
@@ -358,7 +359,9 @@ void drm_syncobj_replace_fence(struct drm_syncobj *syncobj,<br>
                spin_lock(&amp;syncobj-&gt;lock);<br>
                list_for_each_entry_safe(cur, tmp, &amp;syncobj-&gt;cb_list, node) {<br>
                        list_del_init(&amp;cur-&gt;node);<br>
+                       spin_unlock(&amp;syncobj-&gt;lock);<br>
                        cur-&gt;func(syncobj, cur);<br>
+                       spin_lock(&amp;syncobj-&gt;lock);<br>
                }<br>
                spin_unlock(&amp;syncobj-&gt;lock);<br>
        }<br>
@@ -856,6 +859,7 @@ struct syncobj_wait_entry {<br>
        struct dma_fence *fence;<br>
        struct dma_fence_cb fence_cb;<br>
        struct drm_syncobj_cb syncobj_cb;<br>
+       u64    point;<br>
 };<br>
<br>
 static void syncobj_wait_fence_func(struct dma_fence *fence,<br>
@@ -873,12 +877,13 @@ static void syncobj_wait_syncobj_func(struct drm_syncobj *syncobj,<br>
        struct syncobj_wait_entry *wait =<br>
                container_of(cb, struct syncobj_wait_entry, syncobj_cb);<br>
<br>
-       drm_syncobj_search_fence(syncobj, 0, 0, &amp;wait-&gt;fence);<br>
+       drm_syncobj_search_fence(syncobj, wait-&gt;point, 0, &amp;wait-&gt;fence);<br>
<br>
        wake_up_process(wait-&gt;task);<br>
 }<br>
<br>
 static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,<br>
+                                                 void __user *user_points,<br>
                                                  uint32_t count,<br>
                                                  uint32_t flags,<br>
                                                  signed long timeout,<br>
@@ -886,13 +891,27 @@ static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,<br>
 {<br>
        struct syncobj_wait_entry *entries;<br>
        struct dma_fence *fence;<br>
+       uint64_t *points;<br>
        signed long ret;<br>
        uint32_t signaled_count, i;<br>
<br>
-       entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);<br>
-       if (!entries)<br>
+       points = kmalloc_array(count, sizeof(*points), GFP_KERNEL);<br>
+       if (points == NULL)<br>
                return -ENOMEM;<br>
<br>
+       if (!user_points) {<br>
+               memset(points, 0, count * sizeof(uint64_t));<br>
+       } else if (copy_from_user(points, user_points, sizeof(uint64_t) * count)) {<br>
+               ret = -EFAULT;<br>
+               goto err_free_points;<br>
+       }<br>
+<br>
+<br>
+       entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);<br>
+       if (!entries) {<br>
+               ret = -ENOMEM;<br>
+               goto err_free_points;<br>
+       }<br>
        /* Walk the list of sync objects and initialize entries.  We do<br>
         * this up-front so that we can properly return -EINVAL if there is<br>
         * a syncobj with a missing fence and then never have the chance of<br>
@@ -901,7 +920,8 @@ static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,<br>
        signaled_count = 0;<br>
        for (i = 0; i &lt; count; ++i) {<br>
                entries[i].task = current;<br>
-               ret = drm_syncobj_search_fence(syncobjs[i], 0, 0,<br>
+               entries[i].point = points[i];<br>
+               ret = drm_syncobj_search_fence(syncobjs[i], points[i], 0,<br>
                                               &amp;entries[i].fence);<br>
                if (!entries[i].fence) {<br>
                        if (flags &amp; DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {<br>
@@ -940,6 +960,7 @@ static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,<br>
        if (flags &amp; DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {<br>
                for (i = 0; i &lt; count; ++i) {<br>
                        drm_syncobj_fence_get_or_add_callback(syncobjs[i],<br>
+                                                             entries[i].point,<br>
                                                              &amp;entries[i].fence,<br>
                                                              &amp;entries[i].syncobj_cb,<br>
                                                              syncobj_wait_syncobj_func);<br>
@@ -1003,6 +1024,9 @@ static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,<br>
        }<br>
        kfree(entries);<br>
<br>
+err_free_points:<br>
+       kfree(points);<br>
+<br>
        return ret;<br>
 }<br>
<br>
@@ -1041,20 +1065,33 @@ static signed long drm_timeout_abs_to_jiffies(int64_t timeout_nsec)<br>
 static int drm_syncobj_array_wait(struct drm_device *dev,<br>
                                  struct drm_file *file_private,<br>
                                  struct drm_syncobj_wait *wait,<br>
-                                 struct drm_syncobj **syncobjs)<br>
+                                 struct drm_syncobj_timeline_wait *timeline_wait,<br>
+                                 struct drm_syncobj **syncobjs, bool timeline)<br>
 {<br>
-       signed long timeout = drm_timeout_abs_to_jiffies(wait-&gt;timeout_nsec);<br>
+       signed long timeout = 0;<br>
        signed long ret = 0;<br>
        uint32_t first = ~0;<br>
<br>
-       ret = drm_syncobj_array_wait_timeout(syncobjs,<br>
-                                            wait-&gt;count_handles,<br>
-                                            wait-&gt;flags,<br>
-                                            timeout, &amp;first);<br>
+       if (!timeline) {<br>
+               timeout = drm_timeout_abs_to_jiffies(wait-&gt;timeout_nsec);<br>
+               ret = drm_syncobj_array_wait_timeout(syncobjs,<br>
+                                                    NULL,<br>
+                                                    wait-&gt;count_handles,<br>
+                                                    wait-&gt;flags,<br>
+                                                    timeout, &amp;first);<br>
+               wait-&gt;first_signaled = first;<br>
+       } else {<br>
+               timeout = drm_timeout_abs_to_jiffies(timeline_wait-&gt;timeout_nsec);<br>
+               ret = drm_syncobj_array_wait_timeout(syncobjs,<br>
+                                                    u64_to_user_ptr(timeline_wait-&gt;points),<br>
+                                                    timeline_wait-&gt;count_handles,<br>
+                                                    timeline_wait-&gt;flags,<br>
+                                                    timeout, &amp;first);<br>
+               timeline_wait-&gt;first_signaled = first;<br>
+       }<br>
        if (ret &lt; 0)<br>
                return ret;<br>
<br>
-       wait-&gt;first_signaled = first;<br>
        if (ret == 0)<br>
                return -ETIME;<br>
        return 0;<br>
@@ -1142,13 +1179,47 @@ drm_syncobj_wait_ioctl(struct drm_device *dev, void *data,<br>
                return ret;<br>
<br>
        ret = drm_syncobj_array_wait(dev, file_private,<br>
-                                    args, syncobjs);<br>
+                                    args, NULL, syncobjs, false);<br>
<br>
        drm_syncobj_array_free(syncobjs, args-&gt;count_handles);<br>
<br>
        return ret;<br>
 }<br>
<br>
+int<br>
+drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,<br>
+                               struct drm_file *file_private)<br>
+{<br>
+       struct drm_syncobj_timeline_wait *args = data;<br>
+       struct drm_syncobj **syncobjs;<br>
+       int ret = 0;<br>
+<br>
+       if (!drm_core_check_feature(dev, DRIVER_SYNCOBJ))<br>
+               return -ENODEV;<br>
+<br>
+       if (args-&gt;flags &amp; ~(DRM_SYNCOBJ_WAIT_FLAGS_WAIT_ALL |<br>
+                           DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT))<br>
+               return -EINVAL;<br>
+<br>
+       if (args-&gt;count_handles == 0)<br>
+               return -EINVAL;<br>
+<br>
+       ret = drm_syncobj_array_find(file_private,<br>
+                                    u64_to_user_ptr(args-&gt;handles),<br>
+                                    args-&gt;count_handles,<br>
+                                    &amp;syncobjs);<br>
+       if (ret &lt; 0)<br>
+               return ret;<br>
+<br>
+       ret = drm_syncobj_array_wait(dev, file_private,<br>
+                                    NULL, args, syncobjs, true);<br>
+<br>
+       drm_syncobj_array_free(syncobjs, args-&gt;count_handles);<br>
+<br>
+       return ret;<br>
+}<br>
+<br>
+<br>
 int<br>
 drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,<br>
                        struct drm_file *file_private)<br>
diff --git a/include/uapi/drm/drm.h b/include/uapi/drm/drm.h<br>
index cebdb2541eb7..501e86d81f47 100644<br>
--- a/include/uapi/drm/drm.h<br>
+++ b/include/uapi/drm/drm.h<br>
@@ -748,6 +748,19 @@ struct drm_syncobj_wait {<br>
        __u32 pad;<br>
 };<br>
<br>
+struct drm_syncobj_timeline_wait {<br>
+       __u64 handles;<br>
+       /* wait on specific timeline point for every handles*/<br>
+       __u64 points;<br>
+       /* absolute timeout */<br>
+       __s64 timeout_nsec;<br>
+       __u32 count_handles;<br>
+       __u32 flags;<br>
+       __u32 first_signaled; /* only valid when not waiting all */<br>
+       __u32 pad;<br>
+};<br>
+<br>
+<br>
 struct drm_syncobj_array {<br>
        __u64 handles;<br>
        __u32 count_handles;<br>
@@ -910,6 +923,7 @@ extern &quot;C&quot; {<br>
 #define DRM_IOCTL_MODE_GET_LEASE       DRM_IOWR(0xC8, struct drm_mode_get_lease)<br>
 #define DRM_IOCTL_MODE_REVOKE_LEASE    DRM_IOWR(0xC9, struct drm_mode_revoke_lease)<br>
<br>
+#define DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT        DRM_IOWR(0xCA, struct drm_syncobj_timeline_wait)<br>
 /**<br>
  * Device specific ioctls should only be in their respective headers<br>
  * The device specific ioctl range is from 0x40 to 0x9f.<br>
-- <br>
2.17.1<br>
<br>
_______________________________________________<br>
dri-devel mailing list<br>
<a href="mailto:dri-devel@lists.freedesktop.org" target="_blank">dri-devel@lists.freedesktop.org</a><br>
<a href="https://lists.freedesktop.org/mailman/listinfo/dri-devel" rel="noreferrer" target="_blank">https://lists.freedesktop.org/mailman/listinfo/dri-devel</a><br>
</blockquote></div></div>
Christian König Sept. 25, 2018, 9:49 a.m. UTC | #5
Am 25.09.2018 um 11:22 schrieb Jason Ekstrand:
> On Thu, Sep 20, 2018 at 6:04 AM Chunming Zhou <david1.zhou@amd.com 
> <mailto:david1.zhou@amd.com>> wrote:
>
>     points array is one-to-one match with syncobjs array.
>     v2:
>     add separate ioctl for timeline point wait, otherwise break uapi.
>
>
> I think ioctl structs can be extended as long as fields aren't 
> re-ordered.  I'm not sure on the details of this though as I'm not a 
> particularly experienced kernel developer.

Yeah, that is correct. The problem in this particular case is that we 
don't change the direct IOCTL parameter, but rather the array it points to.

We could do something like keep the existing handles array and add a 
separate optional one for the timeline points. That would also drop the 
need for the padding of the structure.

> Another general comment (no good place to put it) is that I think we 
> want two kinds of waits:  Wait for time point to be completed and wait 
> for time point to become available. The first is the usual CPU wait 
> for completion while the second is for use by userspace drivers to 
> wait until the first moment where they can submit work which depends 
> on a given time point.

Oh, yeah that is a really good point as well.

Christian.

>     Signed-off-by: Chunming Zhou <david1.zhou@amd.com
>     <mailto:david1.zhou@amd.com>>
>     ---
>      drivers/gpu/drm/drm_internal.h |  2 +
>      drivers/gpu/drm/drm_ioctl.c    |  2 +
>      drivers/gpu/drm/drm_syncobj.c  | 99
>     +++++++++++++++++++++++++++++-----
>      include/uapi/drm/drm.h         | 14 +++++
>      4 files changed, 103 insertions(+), 14 deletions(-)
>
>     diff --git a/drivers/gpu/drm/drm_internal.h
>     b/drivers/gpu/drm/drm_internal.h
>     index 0c4eb4a9ab31..566d44e3c782 100644
>     --- a/drivers/gpu/drm/drm_internal.h
>     +++ b/drivers/gpu/drm/drm_internal.h
>     @@ -183,6 +183,8 @@ int drm_syncobj_fd_to_handle_ioctl(struct
>     drm_device *dev, void *data,
>                                        struct drm_file *file_private);
>      int drm_syncobj_wait_ioctl(struct drm_device *dev, void *data,
>                                struct drm_file *file_private);
>     +int drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void
>     *data,
>     +                                   struct drm_file *file_private);
>      int drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,
>                                 struct drm_file *file_private);
>      int drm_syncobj_signal_ioctl(struct drm_device *dev, void *data,
>     diff --git a/drivers/gpu/drm/drm_ioctl.c b/drivers/gpu/drm/drm_ioctl.c
>     index 6b4a633b4240..c0891614f516 100644
>     --- a/drivers/gpu/drm/drm_ioctl.c
>     +++ b/drivers/gpu/drm/drm_ioctl.c
>     @@ -669,6 +669,8 @@ static const struct drm_ioctl_desc
>     drm_ioctls[] = {
>                           DRM_UNLOCKED|DRM_RENDER_ALLOW),
>             DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_WAIT, drm_syncobj_wait_ioctl,
>                           DRM_UNLOCKED|DRM_RENDER_ALLOW),
>     +       DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT,
>     drm_syncobj_timeline_wait_ioctl,
>     +                     DRM_UNLOCKED|DRM_RENDER_ALLOW),
>             DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_RESET,
>     drm_syncobj_reset_ioctl,
>                           DRM_UNLOCKED|DRM_RENDER_ALLOW),
>             DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_SIGNAL,
>     drm_syncobj_signal_ioctl,
>     diff --git a/drivers/gpu/drm/drm_syncobj.c
>     b/drivers/gpu/drm/drm_syncobj.c
>     index 67472bd77c83..a43de0e4616c 100644
>     --- a/drivers/gpu/drm/drm_syncobj.c
>     +++ b/drivers/gpu/drm/drm_syncobj.c
>     @@ -126,13 +126,14 @@ static void
>     drm_syncobj_add_callback_locked(struct drm_syncobj *syncobj,
>      }
>
>      static int drm_syncobj_fence_get_or_add_callback(struct
>     drm_syncobj *syncobj,
>     +                                                u64 point,
>                                                      struct dma_fence
>     **fence,
>                                                      struct
>     drm_syncobj_cb *cb,
>      drm_syncobj_func_t func)
>      {
>             int ret;
>
>     -       ret = drm_syncobj_search_fence(syncobj, 0, 0, fence);
>     +       ret = drm_syncobj_search_fence(syncobj, point, 0, fence);
>             if (!ret)
>                     return 1;
>
>     @@ -143,7 +144,7 @@ static int
>     drm_syncobj_fence_get_or_add_callback(struct drm_syncobj *syncobj,
>              */
>             if (!list_empty(&syncobj->signal_pt_list)) {
>                     spin_unlock(&syncobj->lock);
>     -               drm_syncobj_search_fence(syncobj, 0, 0, fence);
>     +               drm_syncobj_search_fence(syncobj, point, 0, fence);
>                     if (*fence)
>                             return 1;
>                     spin_lock(&syncobj->lock);
>     @@ -358,7 +359,9 @@ void drm_syncobj_replace_fence(struct
>     drm_syncobj *syncobj,
>                     spin_lock(&syncobj->lock);
>                     list_for_each_entry_safe(cur, tmp,
>     &syncobj->cb_list, node) {
>                             list_del_init(&cur->node);
>     +                       spin_unlock(&syncobj->lock);
>                             cur->func(syncobj, cur);
>     +                       spin_lock(&syncobj->lock);
>                     }
>                     spin_unlock(&syncobj->lock);
>             }
>     @@ -856,6 +859,7 @@ struct syncobj_wait_entry {
>             struct dma_fence *fence;
>             struct dma_fence_cb fence_cb;
>             struct drm_syncobj_cb syncobj_cb;
>     +       u64    point;
>      };
>
>      static void syncobj_wait_fence_func(struct dma_fence *fence,
>     @@ -873,12 +877,13 @@ static void syncobj_wait_syncobj_func(struct
>     drm_syncobj *syncobj,
>             struct syncobj_wait_entry *wait =
>                     container_of(cb, struct syncobj_wait_entry,
>     syncobj_cb);
>
>     -       drm_syncobj_search_fence(syncobj, 0, 0, &wait->fence);
>     +       drm_syncobj_search_fence(syncobj, wait->point, 0,
>     &wait->fence);
>
>             wake_up_process(wait->task);
>      }
>
>      static signed long drm_syncobj_array_wait_timeout(struct
>     drm_syncobj **syncobjs,
>     +                                                 void __user
>     *user_points,
>                                                       uint32_t count,
>                                                       uint32_t flags,
>                                                       signed long timeout,
>     @@ -886,13 +891,27 @@ static signed long
>     drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>      {
>             struct syncobj_wait_entry *entries;
>             struct dma_fence *fence;
>     +       uint64_t *points;
>             signed long ret;
>             uint32_t signaled_count, i;
>
>     -       entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);
>     -       if (!entries)
>     +       points = kmalloc_array(count, sizeof(*points), GFP_KERNEL);
>     +       if (points == NULL)
>                     return -ENOMEM;
>
>     +       if (!user_points) {
>     +               memset(points, 0, count * sizeof(uint64_t));
>     +       } else if (copy_from_user(points, user_points,
>     sizeof(uint64_t) * count)) {
>     +               ret = -EFAULT;
>     +               goto err_free_points;
>     +       }
>     +
>     +
>     +       entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);
>     +       if (!entries) {
>     +               ret = -ENOMEM;
>     +               goto err_free_points;
>     +       }
>             /* Walk the list of sync objects and initialize entries. 
>     We do
>              * this up-front so that we can properly return -EINVAL if
>     there is
>              * a syncobj with a missing fence and then never have the
>     chance of
>     @@ -901,7 +920,8 @@ static signed long
>     drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>             signaled_count = 0;
>             for (i = 0; i < count; ++i) {
>                     entries[i].task = current;
>     -               ret = drm_syncobj_search_fence(syncobjs[i], 0, 0,
>     +               entries[i].point = points[i];
>     +               ret = drm_syncobj_search_fence(syncobjs[i],
>     points[i], 0,
>      &entries[i].fence);
>                     if (!entries[i].fence) {
>                             if (flags &
>     DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {
>     @@ -940,6 +960,7 @@ static signed long
>     drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>             if (flags & DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {
>                     for (i = 0; i < count; ++i) {
>     drm_syncobj_fence_get_or_add_callback(syncobjs[i],
>     +  entries[i].point,
>       &entries[i].fence,
>       &entries[i].syncobj_cb,
>       syncobj_wait_syncobj_func);
>     @@ -1003,6 +1024,9 @@ static signed long
>     drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>             }
>             kfree(entries);
>
>     +err_free_points:
>     +       kfree(points);
>     +
>             return ret;
>      }
>
>     @@ -1041,20 +1065,33 @@ static signed long
>     drm_timeout_abs_to_jiffies(int64_t timeout_nsec)
>      static int drm_syncobj_array_wait(struct drm_device *dev,
>                                       struct drm_file *file_private,
>                                       struct drm_syncobj_wait *wait,
>     -                                 struct drm_syncobj **syncobjs)
>     +                                 struct drm_syncobj_timeline_wait
>     *timeline_wait,
>     +                                 struct drm_syncobj **syncobjs,
>     bool timeline)
>      {
>     -       signed long timeout =
>     drm_timeout_abs_to_jiffies(wait->timeout_nsec);
>     +       signed long timeout = 0;
>             signed long ret = 0;
>             uint32_t first = ~0;
>
>     -       ret = drm_syncobj_array_wait_timeout(syncobjs,
>     - wait->count_handles,
>     -                                            wait->flags,
>     -                                            timeout, &first);
>     +       if (!timeline) {
>     +               timeout =
>     drm_timeout_abs_to_jiffies(wait->timeout_nsec);
>     +               ret = drm_syncobj_array_wait_timeout(syncobjs,
>     +                                                    NULL,
>     + wait->count_handles,
>     + wait->flags,
>     + timeout, &first);
>     +               wait->first_signaled = first;
>     +       } else {
>     +               timeout =
>     drm_timeout_abs_to_jiffies(timeline_wait->timeout_nsec);
>     +               ret = drm_syncobj_array_wait_timeout(syncobjs,
>     + u64_to_user_ptr(timeline_wait->points),
>     + timeline_wait->count_handles,
>     + timeline_wait->flags,
>     + timeout, &first);
>     +               timeline_wait->first_signaled = first;
>     +       }
>             if (ret < 0)
>                     return ret;
>
>     -       wait->first_signaled = first;
>             if (ret == 0)
>                     return -ETIME;
>             return 0;
>     @@ -1142,13 +1179,47 @@ drm_syncobj_wait_ioctl(struct drm_device
>     *dev, void *data,
>                     return ret;
>
>             ret = drm_syncobj_array_wait(dev, file_private,
>     -                                    args, syncobjs);
>     +                                    args, NULL, syncobjs, false);
>
>             drm_syncobj_array_free(syncobjs, args->count_handles);
>
>             return ret;
>      }
>
>     +int
>     +drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,
>     +                               struct drm_file *file_private)
>     +{
>     +       struct drm_syncobj_timeline_wait *args = data;
>     +       struct drm_syncobj **syncobjs;
>     +       int ret = 0;
>     +
>     +       if (!drm_core_check_feature(dev, DRIVER_SYNCOBJ))
>     +               return -ENODEV;
>     +
>     +       if (args->flags & ~(DRM_SYNCOBJ_WAIT_FLAGS_WAIT_ALL |
>     +  DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT))
>     +               return -EINVAL;
>     +
>     +       if (args->count_handles == 0)
>     +               return -EINVAL;
>     +
>     +       ret = drm_syncobj_array_find(file_private,
>     + u64_to_user_ptr(args->handles),
>     +                                    args->count_handles,
>     +                                    &syncobjs);
>     +       if (ret < 0)
>     +               return ret;
>     +
>     +       ret = drm_syncobj_array_wait(dev, file_private,
>     +                                    NULL, args, syncobjs, true);
>     +
>     +       drm_syncobj_array_free(syncobjs, args->count_handles);
>     +
>     +       return ret;
>     +}
>     +
>     +
>      int
>      drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,
>                             struct drm_file *file_private)
>     diff --git a/include/uapi/drm/drm.h b/include/uapi/drm/drm.h
>     index cebdb2541eb7..501e86d81f47 100644
>     --- a/include/uapi/drm/drm.h
>     +++ b/include/uapi/drm/drm.h
>     @@ -748,6 +748,19 @@ struct drm_syncobj_wait {
>             __u32 pad;
>      };
>
>     +struct drm_syncobj_timeline_wait {
>     +       __u64 handles;
>     +       /* wait on specific timeline point for every handles*/
>     +       __u64 points;
>     +       /* absolute timeout */
>     +       __s64 timeout_nsec;
>     +       __u32 count_handles;
>     +       __u32 flags;
>     +       __u32 first_signaled; /* only valid when not waiting all */
>     +       __u32 pad;
>     +};
>     +
>     +
>      struct drm_syncobj_array {
>             __u64 handles;
>             __u32 count_handles;
>     @@ -910,6 +923,7 @@ extern "C" {
>      #define DRM_IOCTL_MODE_GET_LEASE       DRM_IOWR(0xC8, struct
>     drm_mode_get_lease)
>      #define DRM_IOCTL_MODE_REVOKE_LEASE    DRM_IOWR(0xC9, struct
>     drm_mode_revoke_lease)
>
>     +#define DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT DRM_IOWR(0xCA, struct
>     drm_syncobj_timeline_wait)
>      /**
>       * Device specific ioctls should only be in their respective headers
>       * The device specific ioctl range is from 0x40 to 0x9f.
>     -- 
>     2.17.1
>
>     _______________________________________________
>     dri-devel mailing list
>     dri-devel@lists.freedesktop.org
>     <mailto:dri-devel@lists.freedesktop.org>
>     https://lists.freedesktop.org/mailman/listinfo/dri-devel
>
>
>
> _______________________________________________
> dri-devel mailing list
> dri-devel@lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/dri-devel
<html>
  <head>
    <meta http-equiv="Content-Type" content="text/html; charset=utf-8">
  </head>
  <body text="#000000" bgcolor="#FFFFFF">
    <div class="moz-cite-prefix">Am 25.09.2018 um 11:22 schrieb Jason
      Ekstrand:<br>
    </div>
    <blockquote type="cite"
cite="mid:CAOFGe96fXDQ8Q1piYCWhn2Z8ToOmf1JXyu+2YgUWYbMLCX7nzg@mail.gmail.com">
      <meta http-equiv="content-type" content="text/html; charset=utf-8">
      <div dir="ltr">
        <div class="gmail_quote">
          <div dir="ltr">On Thu, Sep 20, 2018 at 6:04 AM Chunming Zhou
            &lt;<a href="mailto:david1.zhou@amd.com"
              moz-do-not-send="true">david1.zhou@amd.com</a>&gt; wrote:<br>
          </div>
          <blockquote class="gmail_quote" style="margin:0 0 0
            .8ex;border-left:1px #ccc solid;padding-left:1ex">points
            array is one-to-one match with syncobjs array.<br>
            v2:<br>
            add separate ioctl for timeline point wait, otherwise break
            uapi.<br>
          </blockquote>
          <div><br>
          </div>
          <div>I think ioctl structs can be extended as long as fields
            aren't re-ordered.  I'm not sure on the details of this
            though as I'm not a particularly experienced kernel
            developer.</div>
        </div>
      </div>
    </blockquote>
    <br>
    Yeah, that is correct. The problem in this particular case is that
    we don't change the direct IOCTL parameter, but rather the array it
    points to.<br>
    <br>
    We could do something like keep the existing handles array and add a
    separate optional one for the timeline points. That would also drop
    the need for the padding of the structure.<br>
    <br>
    <blockquote type="cite"
cite="mid:CAOFGe96fXDQ8Q1piYCWhn2Z8ToOmf1JXyu+2YgUWYbMLCX7nzg@mail.gmail.com">
      <div dir="ltr">
        <div class="gmail_quote">
          <div>Another general comment (no good place to put it) is that
            I think we want two kinds of waits:  Wait for time point to
            be completed and wait for time point to become available. 
            The first is the usual CPU wait for completion while the
            second is for use by userspace drivers to wait until the
            first moment where they can submit work which depends on a
            given time point.<br>
          </div>
        </div>
      </div>
    </blockquote>
    <br>
    Oh, yeah that is a really good point as well.<br>
    <br>
    Christian.<br>
    <br>
    <blockquote type="cite"
cite="mid:CAOFGe96fXDQ8Q1piYCWhn2Z8ToOmf1JXyu+2YgUWYbMLCX7nzg@mail.gmail.com">
      <div dir="ltr">
        <div class="gmail_quote">
          <div> </div>
          <blockquote class="gmail_quote" style="margin:0 0 0
            .8ex;border-left:1px #ccc solid;padding-left:1ex">
            Signed-off-by: Chunming Zhou &lt;<a
              href="mailto:david1.zhou@amd.com" target="_blank"
              moz-do-not-send="true">david1.zhou@amd.com</a>&gt;<br>
            ---<br>
             drivers/gpu/drm/drm_internal.h |  2 +<br>
             drivers/gpu/drm/drm_ioctl.c    |  2 +<br>
             drivers/gpu/drm/drm_syncobj.c  | 99
            +++++++++++++++++++++++++++++-----<br>
             include/uapi/drm/drm.h         | 14 +++++<br>
             4 files changed, 103 insertions(+), 14 deletions(-)<br>
            <br>
            diff --git a/drivers/gpu/drm/drm_internal.h
            b/drivers/gpu/drm/drm_internal.h<br>
            index 0c4eb4a9ab31..566d44e3c782 100644<br>
            --- a/drivers/gpu/drm/drm_internal.h<br>
            +++ b/drivers/gpu/drm/drm_internal.h<br>
            @@ -183,6 +183,8 @@ int
            drm_syncobj_fd_to_handle_ioctl(struct drm_device *dev, void
            *data,<br>
                                               struct drm_file
            *file_private);<br>
             int drm_syncobj_wait_ioctl(struct drm_device *dev, void
            *data,<br>
                                       struct drm_file *file_private);<br>
            +int drm_syncobj_timeline_wait_ioctl(struct drm_device *dev,
            void *data,<br>
            +                                   struct drm_file
            *file_private);<br>
             int drm_syncobj_reset_ioctl(struct drm_device *dev, void
            *data,<br>
                                        struct drm_file *file_private);<br>
             int drm_syncobj_signal_ioctl(struct drm_device *dev, void
            *data,<br>
            diff --git a/drivers/gpu/drm/drm_ioctl.c
            b/drivers/gpu/drm/drm_ioctl.c<br>
            index 6b4a633b4240..c0891614f516 100644<br>
            --- a/drivers/gpu/drm/drm_ioctl.c<br>
            +++ b/drivers/gpu/drm/drm_ioctl.c<br>
            @@ -669,6 +669,8 @@ static const struct drm_ioctl_desc
            drm_ioctls[] = {<br>
                                  DRM_UNLOCKED|DRM_RENDER_ALLOW),<br>
                    DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_WAIT,
            drm_syncobj_wait_ioctl,<br>
                                  DRM_UNLOCKED|DRM_RENDER_ALLOW),<br>
            +       DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT,
            drm_syncobj_timeline_wait_ioctl,<br>
            +                     DRM_UNLOCKED|DRM_RENDER_ALLOW),<br>
                    DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_RESET,
            drm_syncobj_reset_ioctl,<br>
                                  DRM_UNLOCKED|DRM_RENDER_ALLOW),<br>
                    DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_SIGNAL,
            drm_syncobj_signal_ioctl,<br>
            diff --git a/drivers/gpu/drm/drm_syncobj.c
            b/drivers/gpu/drm/drm_syncobj.c<br>
            index 67472bd77c83..a43de0e4616c 100644<br>
            --- a/drivers/gpu/drm/drm_syncobj.c<br>
            +++ b/drivers/gpu/drm/drm_syncobj.c<br>
            @@ -126,13 +126,14 @@ static void
            drm_syncobj_add_callback_locked(struct drm_syncobj *syncobj,<br>
             }<br>
            <br>
             static int drm_syncobj_fence_get_or_add_callback(struct
            drm_syncobj *syncobj,<br>
            +                                                u64 point,<br>
                                                             struct
            dma_fence **fence,<br>
                                                             struct
            drm_syncobj_cb *cb,<br>
                                                           
             drm_syncobj_func_t func)<br>
             {<br>
                    int ret;<br>
            <br>
            -       ret = drm_syncobj_search_fence(syncobj, 0, 0,
            fence);<br>
            +       ret = drm_syncobj_search_fence(syncobj, point, 0,
            fence);<br>
                    if (!ret)<br>
                            return 1;<br>
            <br>
            @@ -143,7 +144,7 @@ static int
            drm_syncobj_fence_get_or_add_callback(struct drm_syncobj
            *syncobj,<br>
                     */<br>
                    if (!list_empty(&amp;syncobj-&gt;signal_pt_list)) {<br>
                            spin_unlock(&amp;syncobj-&gt;lock);<br>
            -               drm_syncobj_search_fence(syncobj, 0, 0,
            fence);<br>
            +               drm_syncobj_search_fence(syncobj, point, 0,
            fence);<br>
                            if (*fence)<br>
                                    return 1;<br>
                            spin_lock(&amp;syncobj-&gt;lock);<br>
            @@ -358,7 +359,9 @@ void drm_syncobj_replace_fence(struct
            drm_syncobj *syncobj,<br>
                            spin_lock(&amp;syncobj-&gt;lock);<br>
                            list_for_each_entry_safe(cur, tmp,
            &amp;syncobj-&gt;cb_list, node) {<br>
                                    list_del_init(&amp;cur-&gt;node);<br>
            +                       spin_unlock(&amp;syncobj-&gt;lock);<br>
                                    cur-&gt;func(syncobj, cur);<br>
            +                       spin_lock(&amp;syncobj-&gt;lock);<br>
                            }<br>
                            spin_unlock(&amp;syncobj-&gt;lock);<br>
                    }<br>
            @@ -856,6 +859,7 @@ struct syncobj_wait_entry {<br>
                    struct dma_fence *fence;<br>
                    struct dma_fence_cb fence_cb;<br>
                    struct drm_syncobj_cb syncobj_cb;<br>
            +       u64    point;<br>
             };<br>
            <br>
             static void syncobj_wait_fence_func(struct dma_fence
            *fence,<br>
            @@ -873,12 +877,13 @@ static void
            syncobj_wait_syncobj_func(struct drm_syncobj *syncobj,<br>
                    struct syncobj_wait_entry *wait =<br>
                            container_of(cb, struct syncobj_wait_entry,
            syncobj_cb);<br>
            <br>
            -       drm_syncobj_search_fence(syncobj, 0, 0,
            &amp;wait-&gt;fence);<br>
            +       drm_syncobj_search_fence(syncobj, wait-&gt;point, 0,
            &amp;wait-&gt;fence);<br>
            <br>
                    wake_up_process(wait-&gt;task);<br>
             }<br>
            <br>
             static signed long drm_syncobj_array_wait_timeout(struct
            drm_syncobj **syncobjs,<br>
            +                                                 void
            __user *user_points,<br>
                                                              uint32_t
            count,<br>
                                                              uint32_t
            flags,<br>
                                                              signed
            long timeout,<br>
            @@ -886,13 +891,27 @@ static signed long
            drm_syncobj_array_wait_timeout(struct drm_syncobj
            **syncobjs,<br>
             {<br>
                    struct syncobj_wait_entry *entries;<br>
                    struct dma_fence *fence;<br>
            +       uint64_t *points;<br>
                    signed long ret;<br>
                    uint32_t signaled_count, i;<br>
            <br>
            -       entries = kcalloc(count, sizeof(*entries),
            GFP_KERNEL);<br>
            -       if (!entries)<br>
            +       points = kmalloc_array(count, sizeof(*points),
            GFP_KERNEL);<br>
            +       if (points == NULL)<br>
                            return -ENOMEM;<br>
            <br>
            +       if (!user_points) {<br>
            +               memset(points, 0, count * sizeof(uint64_t));<br>
            +       } else if (copy_from_user(points, user_points,
            sizeof(uint64_t) * count)) {<br>
            +               ret = -EFAULT;<br>
            +               goto err_free_points;<br>
            +       }<br>
            +<br>
            +<br>
            +       entries = kcalloc(count, sizeof(*entries),
            GFP_KERNEL);<br>
            +       if (!entries) {<br>
            +               ret = -ENOMEM;<br>
            +               goto err_free_points;<br>
            +       }<br>
                    /* Walk the list of sync objects and initialize
            entries.  We do<br>
                     * this up-front so that we can properly return
            -EINVAL if there is<br>
                     * a syncobj with a missing fence and then never
            have the chance of<br>
            @@ -901,7 +920,8 @@ static signed long
            drm_syncobj_array_wait_timeout(struct drm_syncobj
            **syncobjs,<br>
                    signaled_count = 0;<br>
                    for (i = 0; i &lt; count; ++i) {<br>
                            entries[i].task = current;<br>
            -               ret = drm_syncobj_search_fence(syncobjs[i],
            0, 0,<br>
            +               entries[i].point = points[i];<br>
            +               ret = drm_syncobj_search_fence(syncobjs[i],
            points[i], 0,<br>
                                                         
             &amp;entries[i].fence);<br>
                            if (!entries[i].fence) {<br>
                                    if (flags &amp;
            DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {<br>
            @@ -940,6 +960,7 @@ static signed long
            drm_syncobj_array_wait_timeout(struct drm_syncobj
            **syncobjs,<br>
                    if (flags &amp;
            DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {<br>
                            for (i = 0; i &lt; count; ++i) {<br>
                                   
            drm_syncobj_fence_get_or_add_callback(syncobjs[i],<br>
            +                                                           
             entries[i].point,<br>
                                                                       
              &amp;entries[i].fence,<br>
                                                                       
              &amp;entries[i].syncobj_cb,<br>
                                                                       
              syncobj_wait_syncobj_func);<br>
            @@ -1003,6 +1024,9 @@ static signed long
            drm_syncobj_array_wait_timeout(struct drm_syncobj
            **syncobjs,<br>
                    }<br>
                    kfree(entries);<br>
            <br>
            +err_free_points:<br>
            +       kfree(points);<br>
            +<br>
                    return ret;<br>
             }<br>
            <br>
            @@ -1041,20 +1065,33 @@ static signed long
            drm_timeout_abs_to_jiffies(int64_t timeout_nsec)<br>
             static int drm_syncobj_array_wait(struct drm_device *dev,<br>
                                              struct drm_file
            *file_private,<br>
                                              struct drm_syncobj_wait
            *wait,<br>
            -                                 struct drm_syncobj
            **syncobjs)<br>
            +                                 struct
            drm_syncobj_timeline_wait *timeline_wait,<br>
            +                                 struct drm_syncobj
            **syncobjs, bool timeline)<br>
             {<br>
            -       signed long timeout =
            drm_timeout_abs_to_jiffies(wait-&gt;timeout_nsec);<br>
            +       signed long timeout = 0;<br>
                    signed long ret = 0;<br>
                    uint32_t first = ~0;<br>
            <br>
            -       ret = drm_syncobj_array_wait_timeout(syncobjs,<br>
            -                                           
            wait-&gt;count_handles,<br>
            -                                            wait-&gt;flags,<br>
            -                                            timeout,
            &amp;first);<br>
            +       if (!timeline) {<br>
            +               timeout =
            drm_timeout_abs_to_jiffies(wait-&gt;timeout_nsec);<br>
            +               ret =
            drm_syncobj_array_wait_timeout(syncobjs,<br>
            +                                                    NULL,<br>
            +                                                   
            wait-&gt;count_handles,<br>
            +                                                   
            wait-&gt;flags,<br>
            +                                                   
            timeout, &amp;first);<br>
            +               wait-&gt;first_signaled = first;<br>
            +       } else {<br>
            +               timeout =
            drm_timeout_abs_to_jiffies(timeline_wait-&gt;timeout_nsec);<br>
            +               ret =
            drm_syncobj_array_wait_timeout(syncobjs,<br>
            +                                                   
            u64_to_user_ptr(timeline_wait-&gt;points),<br>
            +                                                   
            timeline_wait-&gt;count_handles,<br>
            +                                                   
            timeline_wait-&gt;flags,<br>
            +                                                   
            timeout, &amp;first);<br>
            +               timeline_wait-&gt;first_signaled = first;<br>
            +       }<br>
                    if (ret &lt; 0)<br>
                            return ret;<br>
            <br>
            -       wait-&gt;first_signaled = first;<br>
                    if (ret == 0)<br>
                            return -ETIME;<br>
                    return 0;<br>
            @@ -1142,13 +1179,47 @@ drm_syncobj_wait_ioctl(struct
            drm_device *dev, void *data,<br>
                            return ret;<br>
            <br>
                    ret = drm_syncobj_array_wait(dev, file_private,<br>
            -                                    args, syncobjs);<br>
            +                                    args, NULL, syncobjs,
            false);<br>
            <br>
                    drm_syncobj_array_free(syncobjs,
            args-&gt;count_handles);<br>
            <br>
                    return ret;<br>
             }<br>
            <br>
            +int<br>
            +drm_syncobj_timeline_wait_ioctl(struct drm_device *dev,
            void *data,<br>
            +                               struct drm_file
            *file_private)<br>
            +{<br>
            +       struct drm_syncobj_timeline_wait *args = data;<br>
            +       struct drm_syncobj **syncobjs;<br>
            +       int ret = 0;<br>
            +<br>
            +       if (!drm_core_check_feature(dev, DRIVER_SYNCOBJ))<br>
            +               return -ENODEV;<br>
            +<br>
            +       if (args-&gt;flags &amp;
            ~(DRM_SYNCOBJ_WAIT_FLAGS_WAIT_ALL |<br>
            +                         
             DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT))<br>
            +               return -EINVAL;<br>
            +<br>
            +       if (args-&gt;count_handles == 0)<br>
            +               return -EINVAL;<br>
            +<br>
            +       ret = drm_syncobj_array_find(file_private,<br>
            +                                   
            u64_to_user_ptr(args-&gt;handles),<br>
            +                                    args-&gt;count_handles,<br>
            +                                    &amp;syncobjs);<br>
            +       if (ret &lt; 0)<br>
            +               return ret;<br>
            +<br>
            +       ret = drm_syncobj_array_wait(dev, file_private,<br>
            +                                    NULL, args, syncobjs,
            true);<br>
            +<br>
            +       drm_syncobj_array_free(syncobjs,
            args-&gt;count_handles);<br>
            +<br>
            +       return ret;<br>
            +}<br>
            +<br>
            +<br>
             int<br>
             drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,<br>
                                    struct drm_file *file_private)<br>
            diff --git a/include/uapi/drm/drm.h b/include/uapi/drm/drm.h<br>
            index cebdb2541eb7..501e86d81f47 100644<br>
            --- a/include/uapi/drm/drm.h<br>
            +++ b/include/uapi/drm/drm.h<br>
            @@ -748,6 +748,19 @@ struct drm_syncobj_wait {<br>
                    __u32 pad;<br>
             };<br>
            <br>
            +struct drm_syncobj_timeline_wait {<br>
            +       __u64 handles;<br>
            +       /* wait on specific timeline point for every
            handles*/<br>
            +       __u64 points;<br>
            +       /* absolute timeout */<br>
            +       __s64 timeout_nsec;<br>
            +       __u32 count_handles;<br>
            +       __u32 flags;<br>
            +       __u32 first_signaled; /* only valid when not waiting
            all */<br>
            +       __u32 pad;<br>
            +};<br>
            +<br>
            +<br>
             struct drm_syncobj_array {<br>
                    __u64 handles;<br>
                    __u32 count_handles;<br>
            @@ -910,6 +923,7 @@ extern "C" {<br>
             #define DRM_IOCTL_MODE_GET_LEASE       DRM_IOWR(0xC8,
            struct drm_mode_get_lease)<br>
             #define DRM_IOCTL_MODE_REVOKE_LEASE    DRM_IOWR(0xC9,
            struct drm_mode_revoke_lease)<br>
            <br>
            +#define DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT       
            DRM_IOWR(0xCA, struct drm_syncobj_timeline_wait)<br>
             /**<br>
              * Device specific ioctls should only be in their
            respective headers<br>
              * The device specific ioctl range is from 0x40 to 0x9f.<br>
            -- <br>
            2.17.1<br>
            <br>
            _______________________________________________<br>
            dri-devel mailing list<br>
            <a href="mailto:dri-devel@lists.freedesktop.org"
              target="_blank" moz-do-not-send="true">dri-devel@lists.freedesktop.org</a><br>
            <a
              href="https://lists.freedesktop.org/mailman/listinfo/dri-devel"
              rel="noreferrer" target="_blank" moz-do-not-send="true">https://lists.freedesktop.org/mailman/listinfo/dri-devel</a><br>
          </blockquote>
        </div>
      </div>
      <br>
      <fieldset class="mimeAttachmentHeader"></fieldset>
      <br>
      <pre wrap="">_______________________________________________
dri-devel mailing list
<a class="moz-txt-link-abbreviated" href="mailto:dri-devel@lists.freedesktop.org">dri-devel@lists.freedesktop.org</a>
<a class="moz-txt-link-freetext" href="https://lists.freedesktop.org/mailman/listinfo/dri-devel">https://lists.freedesktop.org/mailman/listinfo/dri-devel</a>
</pre>
    </blockquote>
    <br>
  </body>
</html>
Chunming Zhou Oct. 8, 2018, 5:53 a.m. UTC | #6
>> Another general comment (no good place to put it) is that I think we want two kinds of waits:  Wait for time point to be completed and wait for time point to become available.  The first is the usual CPU wait for completion while the second is for use by userspace drivers to wait until the first moment where they can submit work which depends on a given time point.

Hi Jason,

How about adding two new wait flags?
DRM_SYNCOBJ_WAIT_FLAGS_WAIT_COMPLETED
DRM_SYNCOBJ_WAIT_FLAGS_WAIT_AVAILABLE

Thanks,
David

From: Christian König <ckoenig.leichtzumerken@gmail.com>
Sent: Tuesday, September 25, 2018 5:50 PM
To: Jason Ekstrand <jason@jlekstrand.net>; Zhou, David(ChunMing) <David1.Zhou@amd.com>
Cc: amd-gfx mailing list <amd-gfx@lists.freedesktop.org>; Maling list - DRI developers <dri-devel@lists.freedesktop.org>
Subject: Re: [PATCH 3/6] drm: add support of syncobj timeline point wait v2

Am 25.09.2018 um 11:22 schrieb Jason Ekstrand:
On Thu, Sep 20, 2018 at 6:04 AM Chunming Zhou <david1.zhou@amd.com<mailto:david1.zhou@amd.com>> wrote:
points array is one-to-one match with syncobjs array.
v2:
add separate ioctl for timeline point wait, otherwise break uapi.

I think ioctl structs can be extended as long as fields aren't re-ordered.  I'm not sure on the details of this though as I'm not a particularly experienced kernel developer.

Yeah, that is correct. The problem in this particular case is that we don't change the direct IOCTL parameter, but rather the array it points to.

We could do something like keep the existing handles array and add a separate optional one for the timeline points. That would also drop the need for the padding of the structure.


Another general comment (no good place to put it) is that I think we want two kinds of waits:  Wait for time point to be completed and wait for time point to become available.  The first is the usual CPU wait for completion while the second is for use by userspace drivers to wait until the first moment where they can submit work which depends on a given time point.

Oh, yeah that is a really good point as well.

Christian.



Signed-off-by: Chunming Zhou <david1.zhou@amd.com<mailto:david1.zhou@amd.com>>
---
 drivers/gpu/drm/drm_internal.h |  2 +
 drivers/gpu/drm/drm_ioctl.c    |  2 +
 drivers/gpu/drm/drm_syncobj.c  | 99 +++++++++++++++++++++++++++++-----
 include/uapi/drm/drm.h         | 14 +++++
 4 files changed, 103 insertions(+), 14 deletions(-)

diff --git a/drivers/gpu/drm/drm_internal.h b/drivers/gpu/drm/drm_internal.h
index 0c4eb4a9ab31..566d44e3c782 100644
--- a/drivers/gpu/drm/drm_internal.h
+++ b/drivers/gpu/drm/drm_internal.h
@@ -183,6 +183,8 @@ int drm_syncobj_fd_to_handle_ioctl(struct drm_device *dev, void *data,
                                   struct drm_file *file_private);
 int drm_syncobj_wait_ioctl(struct drm_device *dev, void *data,
                           struct drm_file *file_private);
+int drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,
+                                   struct drm_file *file_private);
 int drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,
                            struct drm_file *file_private);
 int drm_syncobj_signal_ioctl(struct drm_device *dev, void *data,
diff --git a/drivers/gpu/drm/drm_ioctl.c b/drivers/gpu/drm/drm_ioctl.c
index 6b4a633b4240..c0891614f516 100644
--- a/drivers/gpu/drm/drm_ioctl.c
+++ b/drivers/gpu/drm/drm_ioctl.c
@@ -669,6 +669,8 @@ static const struct drm_ioctl_desc drm_ioctls[] = {
                      DRM_UNLOCKED|DRM_RENDER_ALLOW),
        DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_WAIT, drm_syncobj_wait_ioctl,
                      DRM_UNLOCKED|DRM_RENDER_ALLOW),
+       DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT, drm_syncobj_timeline_wait_ioctl,
+                     DRM_UNLOCKED|DRM_RENDER_ALLOW),
        DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_RESET, drm_syncobj_reset_ioctl,
                      DRM_UNLOCKED|DRM_RENDER_ALLOW),
        DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_SIGNAL, drm_syncobj_signal_ioctl,
diff --git a/drivers/gpu/drm/drm_syncobj.c b/drivers/gpu/drm/drm_syncobj.c
index 67472bd77c83..a43de0e4616c 100644
--- a/drivers/gpu/drm/drm_syncobj.c
+++ b/drivers/gpu/drm/drm_syncobj.c
@@ -126,13 +126,14 @@ static void drm_syncobj_add_callback_locked(struct drm_syncobj *syncobj,
 }

 static int drm_syncobj_fence_get_or_add_callback(struct drm_syncobj *syncobj,
+                                                u64 point,
                                                 struct dma_fence **fence,
                                                 struct drm_syncobj_cb *cb,
                                                 drm_syncobj_func_t func)
 {
        int ret;

-       ret = drm_syncobj_search_fence(syncobj, 0, 0, fence);
+       ret = drm_syncobj_search_fence(syncobj, point, 0, fence);
        if (!ret)
                return 1;

@@ -143,7 +144,7 @@ static int drm_syncobj_fence_get_or_add_callback(struct drm_syncobj *syncobj,
         */
        if (!list_empty(&syncobj->signal_pt_list)) {
                spin_unlock(&syncobj->lock);
-               drm_syncobj_search_fence(syncobj, 0, 0, fence);
+               drm_syncobj_search_fence(syncobj, point, 0, fence);
                if (*fence)
                        return 1;
                spin_lock(&syncobj->lock);
@@ -358,7 +359,9 @@ void drm_syncobj_replace_fence(struct drm_syncobj *syncobj,
                spin_lock(&syncobj->lock);
                list_for_each_entry_safe(cur, tmp, &syncobj->cb_list, node) {
                        list_del_init(&cur->node);
+                       spin_unlock(&syncobj->lock);
                        cur->func(syncobj, cur);
+                       spin_lock(&syncobj->lock);
                }
                spin_unlock(&syncobj->lock);
        }
@@ -856,6 +859,7 @@ struct syncobj_wait_entry {
        struct dma_fence *fence;
        struct dma_fence_cb fence_cb;
        struct drm_syncobj_cb syncobj_cb;
+       u64    point;
 };

 static void syncobj_wait_fence_func(struct dma_fence *fence,
@@ -873,12 +877,13 @@ static void syncobj_wait_syncobj_func(struct drm_syncobj *syncobj,
        struct syncobj_wait_entry *wait =
                container_of(cb, struct syncobj_wait_entry, syncobj_cb);

-       drm_syncobj_search_fence(syncobj, 0, 0, &wait->fence);
+       drm_syncobj_search_fence(syncobj, wait->point, 0, &wait->fence);

        wake_up_process(wait->task);
 }

 static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
+                                                 void __user *user_points,
                                                  uint32_t count,
                                                  uint32_t flags,
                                                  signed long timeout,
@@ -886,13 +891,27 @@ static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
 {
        struct syncobj_wait_entry *entries;
        struct dma_fence *fence;
+       uint64_t *points;
        signed long ret;
        uint32_t signaled_count, i;

-       entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);
-       if (!entries)
+       points = kmalloc_array(count, sizeof(*points), GFP_KERNEL);
+       if (points == NULL)
                return -ENOMEM;

+       if (!user_points) {
+               memset(points, 0, count * sizeof(uint64_t));
+       } else if (copy_from_user(points, user_points, sizeof(uint64_t) * count)) {
+               ret = -EFAULT;
+               goto err_free_points;
+       }
+
+
+       entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);
+       if (!entries) {
+               ret = -ENOMEM;
+               goto err_free_points;
+       }
        /* Walk the list of sync objects and initialize entries.  We do
         * this up-front so that we can properly return -EINVAL if there is
         * a syncobj with a missing fence and then never have the chance of
@@ -901,7 +920,8 @@ static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
        signaled_count = 0;
        for (i = 0; i < count; ++i) {
                entries[i].task = current;
-               ret = drm_syncobj_search_fence(syncobjs[i], 0, 0,
+               entries[i].point = points[i];
+               ret = drm_syncobj_search_fence(syncobjs[i], points[i], 0,
                                               &entries[i].fence);
                if (!entries[i].fence) {
                        if (flags & DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {
@@ -940,6 +960,7 @@ static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
        if (flags & DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {
                for (i = 0; i < count; ++i) {
                        drm_syncobj_fence_get_or_add_callback(syncobjs[i],
+                                                             entries[i].point,
                                                              &entries[i].fence,
                                                              &entries[i].syncobj_cb,
                                                              syncobj_wait_syncobj_func);
@@ -1003,6 +1024,9 @@ static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
        }
        kfree(entries);

+err_free_points:
+       kfree(points);
+
        return ret;
 }

@@ -1041,20 +1065,33 @@ static signed long drm_timeout_abs_to_jiffies(int64_t timeout_nsec)
 static int drm_syncobj_array_wait(struct drm_device *dev,
                                  struct drm_file *file_private,
                                  struct drm_syncobj_wait *wait,
-                                 struct drm_syncobj **syncobjs)
+                                 struct drm_syncobj_timeline_wait *timeline_wait,
+                                 struct drm_syncobj **syncobjs, bool timeline)
 {
-       signed long timeout = drm_timeout_abs_to_jiffies(wait->timeout_nsec);
+       signed long timeout = 0;
        signed long ret = 0;
        uint32_t first = ~0;

-       ret = drm_syncobj_array_wait_timeout(syncobjs,
-                                            wait->count_handles,
-                                            wait->flags,
-                                            timeout, &first);
+       if (!timeline) {
+               timeout = drm_timeout_abs_to_jiffies(wait->timeout_nsec);
+               ret = drm_syncobj_array_wait_timeout(syncobjs,
+                                                    NULL,
+                                                    wait->count_handles,
+                                                    wait->flags,
+                                                    timeout, &first);
+               wait->first_signaled = first;
+       } else {
+               timeout = drm_timeout_abs_to_jiffies(timeline_wait->timeout_nsec);
+               ret = drm_syncobj_array_wait_timeout(syncobjs,
+                                                    u64_to_user_ptr(timeline_wait->points),
+                                                    timeline_wait->count_handles,
+                                                    timeline_wait->flags,
+                                                    timeout, &first);
+               timeline_wait->first_signaled = first;
+       }
        if (ret < 0)
                return ret;

-       wait->first_signaled = first;
        if (ret == 0)
                return -ETIME;
        return 0;
@@ -1142,13 +1179,47 @@ drm_syncobj_wait_ioctl(struct drm_device *dev, void *data,
                return ret;

        ret = drm_syncobj_array_wait(dev, file_private,
-                                    args, syncobjs);
+                                    args, NULL, syncobjs, false);

        drm_syncobj_array_free(syncobjs, args->count_handles);

        return ret;
 }

+int
+drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,
+                               struct drm_file *file_private)
+{
+       struct drm_syncobj_timeline_wait *args = data;
+       struct drm_syncobj **syncobjs;
+       int ret = 0;
+
+       if (!drm_core_check_feature(dev, DRIVER_SYNCOBJ))
+               return -ENODEV;
+
+       if (args->flags & ~(DRM_SYNCOBJ_WAIT_FLAGS_WAIT_ALL |
+                           DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT))
+               return -EINVAL;
+
+       if (args->count_handles == 0)
+               return -EINVAL;
+
+       ret = drm_syncobj_array_find(file_private,
+                                    u64_to_user_ptr(args->handles),
+                                    args->count_handles,
+                                    &syncobjs);
+       if (ret < 0)
+               return ret;
+
+       ret = drm_syncobj_array_wait(dev, file_private,
+                                    NULL, args, syncobjs, true);
+
+       drm_syncobj_array_free(syncobjs, args->count_handles);
+
+       return ret;
+}
+
+
 int
 drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,
                        struct drm_file *file_private)
diff --git a/include/uapi/drm/drm.h b/include/uapi/drm/drm.h
index cebdb2541eb7..501e86d81f47 100644
--- a/include/uapi/drm/drm.h
+++ b/include/uapi/drm/drm.h
@@ -748,6 +748,19 @@ struct drm_syncobj_wait {
        __u32 pad;
 };

+struct drm_syncobj_timeline_wait {
+       __u64 handles;
+       /* wait on specific timeline point for every handles*/
+       __u64 points;
+       /* absolute timeout */
+       __s64 timeout_nsec;
+       __u32 count_handles;
+       __u32 flags;
+       __u32 first_signaled; /* only valid when not waiting all */
+       __u32 pad;
+};
+
+
 struct drm_syncobj_array {
        __u64 handles;
        __u32 count_handles;
@@ -910,6 +923,7 @@ extern "C" {
 #define DRM_IOCTL_MODE_GET_LEASE       DRM_IOWR(0xC8, struct drm_mode_get_lease)
 #define DRM_IOCTL_MODE_REVOKE_LEASE    DRM_IOWR(0xC9, struct drm_mode_revoke_lease)

+#define DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT        DRM_IOWR(0xCA, struct drm_syncobj_timeline_wait)
 /**
  * Device specific ioctls should only be in their respective headers
  * The device specific ioctl range is from 0x40 to 0x9f.
--
2.17.1
Jason Ekstrand Oct. 8, 2018, 5:53 p.m. UTC | #7
On Mon, Oct 8, 2018 at 12:53 AM Zhou, David(ChunMing) <David1.Zhou@amd.com>
wrote:

> >> Another general comment (no good place to put it) is that I think we
> want two kinds of waits:  Wait for time point to be completed and wait for
> time point to become available.  The first is the usual CPU wait for
> completion while the second is for use by userspace drivers to wait until
> the first moment where they can submit work which depends on a given time
> point.
>
>
>
> Hi Jason,
>
>
>
> How about adding two new wait flags?
>
> DRM_SYNCOBJ_WAIT_FLAGS_WAIT_COMPLETED
>
> DRM_SYNCOBJ_WAIT_FLAGS_WAIT_AVAILABLE
>

Those seem like fine names to me.  We should require that one of the two
flags be present when the sync object is a timeline.

--Jason


> Thanks,
>
> David
>
>
>
> *From:* Christian König <ckoenig.leichtzumerken@gmail.com>
> *Sent:* Tuesday, September 25, 2018 5:50 PM
> *To:* Jason Ekstrand <jason@jlekstrand.net>; Zhou, David(ChunMing) <
> David1.Zhou@amd.com>
> *Cc:* amd-gfx mailing list <amd-gfx@lists.freedesktop.org>; Maling list -
> DRI developers <dri-devel@lists.freedesktop.org>
> *Subject:* Re: [PATCH 3/6] drm: add support of syncobj timeline point
> wait v2
>
>
>
> Am 25.09.2018 um 11:22 schrieb Jason Ekstrand:
>
> On Thu, Sep 20, 2018 at 6:04 AM Chunming Zhou <david1.zhou@amd.com> wrote:
>
> points array is one-to-one match with syncobjs array.
> v2:
> add separate ioctl for timeline point wait, otherwise break uapi.
>
>
>
> I think ioctl structs can be extended as long as fields aren't
> re-ordered.  I'm not sure on the details of this though as I'm not a
> particularly experienced kernel developer.
>
>
> Yeah, that is correct. The problem in this particular case is that we
> don't change the direct IOCTL parameter, but rather the array it points to.
>
> We could do something like keep the existing handles array and add a
> separate optional one for the timeline points. That would also drop the
> need for the padding of the structure.
>
>
> Another general comment (no good place to put it) is that I think we want
> two kinds of waits:  Wait for time point to be completed and wait for time
> point to become available.  The first is the usual CPU wait for completion
> while the second is for use by userspace drivers to wait until the first
> moment where they can submit work which depends on a given time point.
>
>
> Oh, yeah that is a really good point as well.
>
> Christian.
>
>
>
>
> Signed-off-by: Chunming Zhou <david1.zhou@amd.com>
> ---
>  drivers/gpu/drm/drm_internal.h |  2 +
>  drivers/gpu/drm/drm_ioctl.c    |  2 +
>  drivers/gpu/drm/drm_syncobj.c  | 99 +++++++++++++++++++++++++++++-----
>  include/uapi/drm/drm.h         | 14 +++++
>  4 files changed, 103 insertions(+), 14 deletions(-)
>
> diff --git a/drivers/gpu/drm/drm_internal.h
> b/drivers/gpu/drm/drm_internal.h
> index 0c4eb4a9ab31..566d44e3c782 100644
> --- a/drivers/gpu/drm/drm_internal.h
> +++ b/drivers/gpu/drm/drm_internal.h
> @@ -183,6 +183,8 @@ int drm_syncobj_fd_to_handle_ioctl(struct drm_device
> *dev, void *data,
>                                    struct drm_file *file_private);
>  int drm_syncobj_wait_ioctl(struct drm_device *dev, void *data,
>                            struct drm_file *file_private);
> +int drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,
> +                                   struct drm_file *file_private);
>  int drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,
>                             struct drm_file *file_private);
>  int drm_syncobj_signal_ioctl(struct drm_device *dev, void *data,
> diff --git a/drivers/gpu/drm/drm_ioctl.c b/drivers/gpu/drm/drm_ioctl.c
> index 6b4a633b4240..c0891614f516 100644
> --- a/drivers/gpu/drm/drm_ioctl.c
> +++ b/drivers/gpu/drm/drm_ioctl.c
> @@ -669,6 +669,8 @@ static const struct drm_ioctl_desc drm_ioctls[] = {
>                       DRM_UNLOCKED|DRM_RENDER_ALLOW),
>         DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_WAIT, drm_syncobj_wait_ioctl,
>                       DRM_UNLOCKED|DRM_RENDER_ALLOW),
> +       DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT,
> drm_syncobj_timeline_wait_ioctl,
> +                     DRM_UNLOCKED|DRM_RENDER_ALLOW),
>         DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_RESET, drm_syncobj_reset_ioctl,
>                       DRM_UNLOCKED|DRM_RENDER_ALLOW),
>         DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_SIGNAL, drm_syncobj_signal_ioctl,
> diff --git a/drivers/gpu/drm/drm_syncobj.c b/drivers/gpu/drm/drm_syncobj.c
> index 67472bd77c83..a43de0e4616c 100644
> --- a/drivers/gpu/drm/drm_syncobj.c
> +++ b/drivers/gpu/drm/drm_syncobj.c
> @@ -126,13 +126,14 @@ static void drm_syncobj_add_callback_locked(struct
> drm_syncobj *syncobj,
>  }
>
>  static int drm_syncobj_fence_get_or_add_callback(struct drm_syncobj
> *syncobj,
> +                                                u64 point,
>                                                  struct dma_fence **fence,
>                                                  struct drm_syncobj_cb *cb,
>                                                  drm_syncobj_func_t func)
>  {
>         int ret;
>
> -       ret = drm_syncobj_search_fence(syncobj, 0, 0, fence);
> +       ret = drm_syncobj_search_fence(syncobj, point, 0, fence);
>         if (!ret)
>                 return 1;
>
> @@ -143,7 +144,7 @@ static int
> drm_syncobj_fence_get_or_add_callback(struct drm_syncobj *syncobj,
>          */
>         if (!list_empty(&syncobj->signal_pt_list)) {
>                 spin_unlock(&syncobj->lock);
> -               drm_syncobj_search_fence(syncobj, 0, 0, fence);
> +               drm_syncobj_search_fence(syncobj, point, 0, fence);
>                 if (*fence)
>                         return 1;
>                 spin_lock(&syncobj->lock);
> @@ -358,7 +359,9 @@ void drm_syncobj_replace_fence(struct drm_syncobj
> *syncobj,
>                 spin_lock(&syncobj->lock);
>                 list_for_each_entry_safe(cur, tmp, &syncobj->cb_list,
> node) {
>                         list_del_init(&cur->node);
> +                       spin_unlock(&syncobj->lock);
>                         cur->func(syncobj, cur);
> +                       spin_lock(&syncobj->lock);
>                 }
>                 spin_unlock(&syncobj->lock);
>         }
> @@ -856,6 +859,7 @@ struct syncobj_wait_entry {
>         struct dma_fence *fence;
>         struct dma_fence_cb fence_cb;
>         struct drm_syncobj_cb syncobj_cb;
> +       u64    point;
>  };
>
>  static void syncobj_wait_fence_func(struct dma_fence *fence,
> @@ -873,12 +877,13 @@ static void syncobj_wait_syncobj_func(struct
> drm_syncobj *syncobj,
>         struct syncobj_wait_entry *wait =
>                 container_of(cb, struct syncobj_wait_entry, syncobj_cb);
>
> -       drm_syncobj_search_fence(syncobj, 0, 0, &wait->fence);
> +       drm_syncobj_search_fence(syncobj, wait->point, 0, &wait->fence);
>
>         wake_up_process(wait->task);
>  }
>
>  static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj
> **syncobjs,
> +                                                 void __user *user_points,
>                                                   uint32_t count,
>                                                   uint32_t flags,
>                                                   signed long timeout,
> @@ -886,13 +891,27 @@ static signed long
> drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>  {
>         struct syncobj_wait_entry *entries;
>         struct dma_fence *fence;
> +       uint64_t *points;
>         signed long ret;
>         uint32_t signaled_count, i;
>
> -       entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);
> -       if (!entries)
> +       points = kmalloc_array(count, sizeof(*points), GFP_KERNEL);
> +       if (points == NULL)
>                 return -ENOMEM;
>
> +       if (!user_points) {
> +               memset(points, 0, count * sizeof(uint64_t));
> +       } else if (copy_from_user(points, user_points, sizeof(uint64_t) *
> count)) {
> +               ret = -EFAULT;
> +               goto err_free_points;
> +       }
> +
> +
> +       entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);
> +       if (!entries) {
> +               ret = -ENOMEM;
> +               goto err_free_points;
> +       }
>         /* Walk the list of sync objects and initialize entries.  We do
>          * this up-front so that we can properly return -EINVAL if there is
>          * a syncobj with a missing fence and then never have the chance of
> @@ -901,7 +920,8 @@ static signed long
> drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>         signaled_count = 0;
>         for (i = 0; i < count; ++i) {
>                 entries[i].task = current;
> -               ret = drm_syncobj_search_fence(syncobjs[i], 0, 0,
> +               entries[i].point = points[i];
> +               ret = drm_syncobj_search_fence(syncobjs[i], points[i], 0,
>                                                &entries[i].fence);
>                 if (!entries[i].fence) {
>                         if (flags &
> DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {
> @@ -940,6 +960,7 @@ static signed long
> drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>         if (flags & DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {
>                 for (i = 0; i < count; ++i) {
>                         drm_syncobj_fence_get_or_add_callback(syncobjs[i],
> +
>  entries[i].point,
>
> &entries[i].fence,
>
> &entries[i].syncobj_cb,
>
> syncobj_wait_syncobj_func);
> @@ -1003,6 +1024,9 @@ static signed long
> drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
>         }
>         kfree(entries);
>
> +err_free_points:
> +       kfree(points);
> +
>         return ret;
>  }
>
> @@ -1041,20 +1065,33 @@ static signed long
> drm_timeout_abs_to_jiffies(int64_t timeout_nsec)
>  static int drm_syncobj_array_wait(struct drm_device *dev,
>                                   struct drm_file *file_private,
>                                   struct drm_syncobj_wait *wait,
> -                                 struct drm_syncobj **syncobjs)
> +                                 struct drm_syncobj_timeline_wait
> *timeline_wait,
> +                                 struct drm_syncobj **syncobjs, bool
> timeline)
>  {
> -       signed long timeout =
> drm_timeout_abs_to_jiffies(wait->timeout_nsec);
> +       signed long timeout = 0;
>         signed long ret = 0;
>         uint32_t first = ~0;
>
> -       ret = drm_syncobj_array_wait_timeout(syncobjs,
> -                                            wait->count_handles,
> -                                            wait->flags,
> -                                            timeout, &first);
> +       if (!timeline) {
> +               timeout = drm_timeout_abs_to_jiffies(wait->timeout_nsec);
> +               ret = drm_syncobj_array_wait_timeout(syncobjs,
> +                                                    NULL,
> +                                                    wait->count_handles,
> +                                                    wait->flags,
> +                                                    timeout, &first);
> +               wait->first_signaled = first;
> +       } else {
> +               timeout =
> drm_timeout_abs_to_jiffies(timeline_wait->timeout_nsec);
> +               ret = drm_syncobj_array_wait_timeout(syncobjs,
> +
> u64_to_user_ptr(timeline_wait->points),
> +
> timeline_wait->count_handles,
> +                                                    timeline_wait->flags,
> +                                                    timeout, &first);
> +               timeline_wait->first_signaled = first;
> +       }
>         if (ret < 0)
>                 return ret;
>
> -       wait->first_signaled = first;
>         if (ret == 0)
>                 return -ETIME;
>         return 0;
> @@ -1142,13 +1179,47 @@ drm_syncobj_wait_ioctl(struct drm_device *dev,
> void *data,
>                 return ret;
>
>         ret = drm_syncobj_array_wait(dev, file_private,
> -                                    args, syncobjs);
> +                                    args, NULL, syncobjs, false);
>
>         drm_syncobj_array_free(syncobjs, args->count_handles);
>
>         return ret;
>  }
>
> +int
> +drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,
> +                               struct drm_file *file_private)
> +{
> +       struct drm_syncobj_timeline_wait *args = data;
> +       struct drm_syncobj **syncobjs;
> +       int ret = 0;
> +
> +       if (!drm_core_check_feature(dev, DRIVER_SYNCOBJ))
> +               return -ENODEV;
> +
> +       if (args->flags & ~(DRM_SYNCOBJ_WAIT_FLAGS_WAIT_ALL |
> +                           DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT))
> +               return -EINVAL;
> +
> +       if (args->count_handles == 0)
> +               return -EINVAL;
> +
> +       ret = drm_syncobj_array_find(file_private,
> +                                    u64_to_user_ptr(args->handles),
> +                                    args->count_handles,
> +                                    &syncobjs);
> +       if (ret < 0)
> +               return ret;
> +
> +       ret = drm_syncobj_array_wait(dev, file_private,
> +                                    NULL, args, syncobjs, true);
> +
> +       drm_syncobj_array_free(syncobjs, args->count_handles);
> +
> +       return ret;
> +}
> +
> +
>  int
>  drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,
>                         struct drm_file *file_private)
> diff --git a/include/uapi/drm/drm.h b/include/uapi/drm/drm.h
> index cebdb2541eb7..501e86d81f47 100644
> --- a/include/uapi/drm/drm.h
> +++ b/include/uapi/drm/drm.h
> @@ -748,6 +748,19 @@ struct drm_syncobj_wait {
>         __u32 pad;
>  };
>
> +struct drm_syncobj_timeline_wait {
> +       __u64 handles;
> +       /* wait on specific timeline point for every handles*/
> +       __u64 points;
> +       /* absolute timeout */
> +       __s64 timeout_nsec;
> +       __u32 count_handles;
> +       __u32 flags;
> +       __u32 first_signaled; /* only valid when not waiting all */
> +       __u32 pad;
> +};
> +
> +
>  struct drm_syncobj_array {
>         __u64 handles;
>         __u32 count_handles;
> @@ -910,6 +923,7 @@ extern "C" {
>  #define DRM_IOCTL_MODE_GET_LEASE       DRM_IOWR(0xC8, struct drm_mode_get_lease)
>  #define DRM_IOCTL_MODE_REVOKE_LEASE    DRM_IOWR(0xC9, struct drm_mode_revoke_lease)
>
> +#define DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT        DRM_IOWR(0xCA, struct drm_syncobj_timeline_wait)
>  /**
>   * Device specific ioctls should only be in their respective headers
>   * The device specific ioctl range is from 0x40 to 0x9f.
> --
> 2.17.1
>
> _______________________________________________
> dri-devel mailing list
> dri-devel@lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/dri-devel
>
>
>
>
> _______________________________________________
>
> dri-devel mailing list
>
> dri-devel@lists.freedesktop.org
>
> https://lists.freedesktop.org/mailman/listinfo/dri-devel
>
>
>
<div dir="ltr"><div class="gmail_quote"><div dir="ltr">On Mon, Oct 8, 2018 at 12:53 AM Zhou, David(ChunMing) &lt;<a href="mailto:David1.Zhou@amd.com">David1.Zhou@amd.com</a>&gt; wrote:<br></div><blockquote class="gmail_quote" style="margin:0 0 0 .8ex;border-left:1px #ccc solid;padding-left:1ex">





<div bgcolor="white" link="blue" vlink="purple" lang="EN-US">
<div class="m_-1584312309811383151WordSection1">
<p class="MsoNormal"><span style="color:windowtext">&gt;&gt;</span> Another general comment (no good place to put it) is that I think we want two kinds of waits:  Wait for time point to be completed and wait for time point to become available.  The first is the usual
 CPU wait for completion while the second is for use by userspace drivers to wait until the first moment where they can submit work which depends on a given time point.<u></u><u></u></p>
<p class="MsoNormal"><span style="color:windowtext"><u></u> <u></u></span></p>
<p class="MsoNormal"><span style="color:windowtext">Hi Jason,<u></u><u></u></span></p>
<p class="MsoNormal"><span style="color:windowtext"><u></u> <u></u></span></p>
<p class="MsoNormal"><span style="color:windowtext">How about adding two new wait flags?<u></u><u></u></span></p>
<p class="MsoNormal"><span style="color:windowtext">DRM_SYNCOBJ_WAIT_FLAGS_WAIT_COMPLETED<u></u><u></u></span></p>
<p class="MsoNormal"><span style="color:windowtext">DRM_SYNCOBJ_WAIT_FLAGS_WAIT_AVAILABLE<u></u><u></u></span></p>
</div></div></blockquote><div><br></div><div>Those seem like fine names to me.  We should require that one of the two flags be present when the sync object is a timeline.</div><div><br></div><div>--Jason<br></div><div> </div><blockquote class="gmail_quote" style="margin:0 0 0 .8ex;border-left:1px #ccc solid;padding-left:1ex"><div bgcolor="white" link="blue" vlink="purple" lang="EN-US"><div class="m_-1584312309811383151WordSection1">
<p class="MsoNormal"><span style="color:windowtext">Thanks,<u></u><u></u></span></p>
<p class="MsoNormal"><span style="color:windowtext">David<u></u><u></u></span></p>
<p class="MsoNormal"><span style="color:windowtext"><u></u> <u></u></span></p>
<div style="border:none;border-left:solid blue 1.5pt;padding:0in 0in 0in 4.0pt">
<div>
<div style="border:none;border-top:solid #e1e1e1 1.0pt;padding:3.0pt 0in 0in 0in">
<p class="MsoNormal"><b><span style="color:windowtext">From:</span></b><span style="color:windowtext"> Christian König &lt;<a href="mailto:ckoenig.leichtzumerken@gmail.com" target="_blank">ckoenig.leichtzumerken@gmail.com</a>&gt;
<br>
<b>Sent:</b> Tuesday, September 25, 2018 5:50 PM<br>
<b>To:</b> Jason Ekstrand &lt;<a href="mailto:jason@jlekstrand.net" target="_blank">jason@jlekstrand.net</a>&gt;; Zhou, David(ChunMing) &lt;<a href="mailto:David1.Zhou@amd.com" target="_blank">David1.Zhou@amd.com</a>&gt;<br>
<b>Cc:</b> amd-gfx mailing list &lt;<a href="mailto:amd-gfx@lists.freedesktop.org" target="_blank">amd-gfx@lists.freedesktop.org</a>&gt;; Maling list - DRI developers &lt;<a href="mailto:dri-devel@lists.freedesktop.org" target="_blank">dri-devel@lists.freedesktop.org</a>&gt;<br>
<b>Subject:</b> Re: [PATCH 3/6] drm: add support of syncobj timeline point wait v2<u></u><u></u></span></p>
</div>
</div>
<p class="MsoNormal"><u></u> <u></u></p>
<div>
<p class="MsoNormal">Am 25.09.2018 um 11:22 schrieb Jason Ekstrand:<u></u><u></u></p>
</div>
<blockquote style="margin-top:5.0pt;margin-bottom:5.0pt">
<div>
<div>
<div>
<p class="MsoNormal">On Thu, Sep 20, 2018 at 6:04 AM Chunming Zhou &lt;<a href="mailto:david1.zhou@amd.com" target="_blank">david1.zhou@amd.com</a>&gt; wrote:<u></u><u></u></p>
</div>
<blockquote style="border:none;border-left:solid #cccccc 1.0pt;padding:0in 0in 0in 6.0pt;margin-left:4.8pt;margin-right:0in">
<p class="MsoNormal">points array is one-to-one match with syncobjs array.<br>
v2:<br>
add seperate ioctl for timeline point wait, otherwise break uapi.<u></u><u></u></p>
</blockquote>
<div>
<p class="MsoNormal"><u></u> <u></u></p>
</div>
<div>
<p class="MsoNormal">I think ioctl structs can be extended as long as fields aren&#39;t re-ordered.  I&#39;m not sure on the details of this though as I&#39;m not a particularly experienced kernel developer.<u></u><u></u></p>
</div>
</div>
</div>
</blockquote>
<p class="MsoNormal"><br>
Yeah, that is correct. The problem in this particular case is that we don&#39;t change the direct IOCTL parameter, but rather the array it points to.<br>
<br>
We could do something like keep the existing handles array and add a separate optional one for the timeline points. That would also drop the need for the padding of the structure.<br>
<br>
<br>
<u></u><u></u></p>
<blockquote style="margin-top:5.0pt;margin-bottom:5.0pt">
<div>
<div>
<div>
<p class="MsoNormal">Another general comment (no good place to put it) is that I think we want two kinds of waits:  Wait for time point to be completed and wait for time point to become available.  The first is the usual CPU wait for completion while the second
 is for use by userspace drivers to wait until the first moment where they can submit work which depends on a given time point.<u></u><u></u></p>
</div>
</div>
</div>
</blockquote>
<p class="MsoNormal"><br>
Oh, yeah that is a really good point as well.<br>
<br>
Christian.<br>
<br>
<br>
<u></u><u></u></p>
<blockquote style="margin-top:5.0pt;margin-bottom:5.0pt">
<div>
<div>
<div>
<p class="MsoNormal"> <u></u><u></u></p>
</div>
<blockquote style="border:none;border-left:solid #cccccc 1.0pt;padding:0in 0in 0in 6.0pt;margin-left:4.8pt;margin-right:0in">
<p class="MsoNormal">Signed-off-by: Chunming Zhou &lt;<a href="mailto:david1.zhou@amd.com" target="_blank">david1.zhou@amd.com</a>&gt;<br>
---<br>
 drivers/gpu/drm/drm_internal.h |  2 +<br>
 drivers/gpu/drm/drm_ioctl.c    |  2 +<br>
 drivers/gpu/drm/drm_syncobj.c  | 99 +++++++++++++++++++++++++++++-----<br>
 include/uapi/drm/drm.h         | 14 +++++<br>
 4 files changed, 103 insertions(+), 14 deletions(-)<br>
<br>
diff --git a/drivers/gpu/drm/drm_internal.h b/drivers/gpu/drm/drm_internal.h<br>
index 0c4eb4a9ab31..566d44e3c782 100644<br>
--- a/drivers/gpu/drm/drm_internal.h<br>
+++ b/drivers/gpu/drm/drm_internal.h<br>
@@ -183,6 +183,8 @@ int drm_syncobj_fd_to_handle_ioctl(struct drm_device *dev, void *data,<br>
                                   struct drm_file *file_private);<br>
 int drm_syncobj_wait_ioctl(struct drm_device *dev, void *data,<br>
                           struct drm_file *file_private);<br>
+int drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,<br>
+                                   struct drm_file *file_private);<br>
 int drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,<br>
                            struct drm_file *file_private);<br>
 int drm_syncobj_signal_ioctl(struct drm_device *dev, void *data,<br>
diff --git a/drivers/gpu/drm/drm_ioctl.c b/drivers/gpu/drm/drm_ioctl.c<br>
index 6b4a633b4240..c0891614f516 100644<br>
--- a/drivers/gpu/drm/drm_ioctl.c<br>
+++ b/drivers/gpu/drm/drm_ioctl.c<br>
@@ -669,6 +669,8 @@ static const struct drm_ioctl_desc drm_ioctls[] = {<br>
                      DRM_UNLOCKED|DRM_RENDER_ALLOW),<br>
        DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_WAIT, drm_syncobj_wait_ioctl,<br>
                      DRM_UNLOCKED|DRM_RENDER_ALLOW),<br>
+       DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT, drm_syncobj_timeline_wait_ioctl,<br>
+                     DRM_UNLOCKED|DRM_RENDER_ALLOW),<br>
        DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_RESET, drm_syncobj_reset_ioctl,<br>
                      DRM_UNLOCKED|DRM_RENDER_ALLOW),<br>
        DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_SIGNAL, drm_syncobj_signal_ioctl,<br>
diff --git a/drivers/gpu/drm/drm_syncobj.c b/drivers/gpu/drm/drm_syncobj.c<br>
index 67472bd77c83..a43de0e4616c 100644<br>
--- a/drivers/gpu/drm/drm_syncobj.c<br>
+++ b/drivers/gpu/drm/drm_syncobj.c<br>
@@ -126,13 +126,14 @@ static void drm_syncobj_add_callback_locked(struct drm_syncobj *syncobj,<br>
 }<br>
<br>
 static int drm_syncobj_fence_get_or_add_callback(struct drm_syncobj *syncobj,<br>
+                                                u64 point,<br>
                                                 struct dma_fence **fence,<br>
                                                 struct drm_syncobj_cb *cb,<br>
                                                 drm_syncobj_func_t func)<br>
 {<br>
        int ret;<br>
<br>
-       ret = drm_syncobj_search_fence(syncobj, 0, 0, fence);<br>
+       ret = drm_syncobj_search_fence(syncobj, point, 0, fence);<br>
        if (!ret)<br>
                return 1;<br>
<br>
@@ -143,7 +144,7 @@ static int drm_syncobj_fence_get_or_add_callback(struct drm_syncobj *syncobj,<br>
         */<br>
        if (!list_empty(&amp;syncobj-&gt;signal_pt_list)) {<br>
                spin_unlock(&amp;syncobj-&gt;lock);<br>
-               drm_syncobj_search_fence(syncobj, 0, 0, fence);<br>
+               drm_syncobj_search_fence(syncobj, point, 0, fence);<br>
                if (*fence)<br>
                        return 1;<br>
                spin_lock(&amp;syncobj-&gt;lock);<br>
@@ -358,7 +359,9 @@ void drm_syncobj_replace_fence(struct drm_syncobj *syncobj,<br>
                spin_lock(&amp;syncobj-&gt;lock);<br>
                list_for_each_entry_safe(cur, tmp, &amp;syncobj-&gt;cb_list, node) {<br>
                        list_del_init(&amp;cur-&gt;node);<br>
+                       spin_unlock(&amp;syncobj-&gt;lock);<br>
                        cur-&gt;func(syncobj, cur);<br>
+                       spin_lock(&amp;syncobj-&gt;lock);<br>
                }<br>
                spin_unlock(&amp;syncobj-&gt;lock);<br>
        }<br>
@@ -856,6 +859,7 @@ struct syncobj_wait_entry {<br>
        struct dma_fence *fence;<br>
        struct dma_fence_cb fence_cb;<br>
        struct drm_syncobj_cb syncobj_cb;<br>
+       u64    point;<br>
 };<br>
<br>
 static void syncobj_wait_fence_func(struct dma_fence *fence,<br>
@@ -873,12 +877,13 @@ static void syncobj_wait_syncobj_func(struct drm_syncobj *syncobj,<br>
        struct syncobj_wait_entry *wait =<br>
                container_of(cb, struct syncobj_wait_entry, syncobj_cb);<br>
<br>
-       drm_syncobj_search_fence(syncobj, 0, 0, &amp;wait-&gt;fence);<br>
+       drm_syncobj_search_fence(syncobj, wait-&gt;point, 0, &amp;wait-&gt;fence);<br>
<br>
        wake_up_process(wait-&gt;task);<br>
 }<br>
<br>
 static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,<br>
+                                                 void __user *user_points,<br>
                                                  uint32_t count,<br>
                                                  uint32_t flags,<br>
                                                  signed long timeout,<br>
@@ -886,13 +891,27 @@ static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,<br>
 {<br>
        struct syncobj_wait_entry *entries;<br>
        struct dma_fence *fence;<br>
+       uint64_t *points;<br>
        signed long ret;<br>
        uint32_t signaled_count, i;<br>
<br>
-       entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);<br>
-       if (!entries)<br>
+       points = kmalloc_array(count, sizeof(*points), GFP_KERNEL);<br>
+       if (points == NULL)<br>
                return -ENOMEM;<br>
<br>
+       if (!user_points) {<br>
+               memset(points, 0, count * sizeof(uint64_t));<br>
+       } else if (copy_from_user(points, user_points, sizeof(uint64_t) * count)) {<br>
+               ret = -EFAULT;<br>
+               goto err_free_points;<br>
+       }<br>
+<br>
+<br>
+       entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);<br>
+       if (!entries) {<br>
+               ret = -ENOMEM;<br>
+               goto err_free_points;<br>
+       }<br>
        /* Walk the list of sync objects and initialize entries.  We do<br>
         * this up-front so that we can properly return -EINVAL if there is<br>
         * a syncobj with a missing fence and then never have the chance of<br>
@@ -901,7 +920,8 @@ static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,<br>
        signaled_count = 0;<br>
        for (i = 0; i &lt; count; ++i) {<br>
                entries[i].task = current;<br>
-               ret = drm_syncobj_search_fence(syncobjs[i], 0, 0,<br>
+               entries[i].point = points[i];<br>
+               ret = drm_syncobj_search_fence(syncobjs[i], points[i], 0,<br>
                                               &amp;entries[i].fence);<br>
                if (!entries[i].fence) {<br>
                        if (flags &amp; DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {<br>
@@ -940,6 +960,7 @@ static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,<br>
        if (flags &amp; DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {<br>
                for (i = 0; i &lt; count; ++i) {<br>
                        drm_syncobj_fence_get_or_add_callback(syncobjs[i],<br>
+                                                             entries[i].point,<br>
                                                              &amp;entries[i].fence,<br>
                                                              &amp;entries[i].syncobj_cb,<br>
                                                              syncobj_wait_syncobj_func);<br>
@@ -1003,6 +1024,9 @@ static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,<br>
        }<br>
        kfree(entries);<br>
<br>
+err_free_points:<br>
+       kfree(points);<br>
+<br>
        return ret;<br>
 }<br>
<br>
@@ -1041,20 +1065,33 @@ static signed long drm_timeout_abs_to_jiffies(int64_t timeout_nsec)<br>
 static int drm_syncobj_array_wait(struct drm_device *dev,<br>
                                  struct drm_file *file_private,<br>
                                  struct drm_syncobj_wait *wait,<br>
-                                 struct drm_syncobj **syncobjs)<br>
+                                 struct drm_syncobj_timeline_wait *timeline_wait,<br>
+                                 struct drm_syncobj **syncobjs, bool timeline)<br>
 {<br>
-       signed long timeout = drm_timeout_abs_to_jiffies(wait-&gt;timeout_nsec);<br>
+       signed long timeout = 0;<br>
        signed long ret = 0;<br>
        uint32_t first = ~0;<br>
<br>
-       ret = drm_syncobj_array_wait_timeout(syncobjs,<br>
-                                            wait-&gt;count_handles,<br>
-                                            wait-&gt;flags,<br>
-                                            timeout, &amp;first);<br>
+       if (!timeline) {<br>
+               timeout = drm_timeout_abs_to_jiffies(wait-&gt;timeout_nsec);<br>
+               ret = drm_syncobj_array_wait_timeout(syncobjs,<br>
+                                                    NULL,<br>
+                                                    wait-&gt;count_handles,<br>
+                                                    wait-&gt;flags,<br>
+                                                    timeout, &amp;first);<br>
+               wait-&gt;first_signaled = first;<br>
+       } else {<br>
+               timeout = drm_timeout_abs_to_jiffies(timeline_wait-&gt;timeout_nsec);<br>
+               ret = drm_syncobj_array_wait_timeout(syncobjs,<br>
+                                                    u64_to_user_ptr(timeline_wait-&gt;points),<br>
+                                                    timeline_wait-&gt;count_handles,<br>
+                                                    timeline_wait-&gt;flags,<br>
+                                                    timeout, &amp;first);<br>
+               timeline_wait-&gt;first_signaled = first;<br>
+       }<br>
        if (ret &lt; 0)<br>
                return ret;<br>
<br>
-       wait-&gt;first_signaled = first;<br>
        if (ret == 0)<br>
                return -ETIME;<br>
        return 0;<br>
@@ -1142,13 +1179,47 @@ drm_syncobj_wait_ioctl(struct drm_device *dev, void *data,<br>
                return ret;<br>
<br>
        ret = drm_syncobj_array_wait(dev, file_private,<br>
-                                    args, syncobjs);<br>
+                                    args, NULL, syncobjs, false);<br>
<br>
        drm_syncobj_array_free(syncobjs, args-&gt;count_handles);<br>
<br>
        return ret;<br>
 }<br>
<br>
+int<br>
+drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,<br>
+                               struct drm_file *file_private)<br>
+{<br>
+       struct drm_syncobj_timeline_wait *args = data;<br>
+       struct drm_syncobj **syncobjs;<br>
+       int ret = 0;<br>
+<br>
+       if (!drm_core_check_feature(dev, DRIVER_SYNCOBJ))<br>
+               return -ENODEV;<br>
+<br>
+       if (args-&gt;flags &amp; ~(DRM_SYNCOBJ_WAIT_FLAGS_WAIT_ALL |<br>
+                           DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT))<br>
+               return -EINVAL;<br>
+<br>
+       if (args-&gt;count_handles == 0)<br>
+               return -EINVAL;<br>
+<br>
+       ret = drm_syncobj_array_find(file_private,<br>
+                                    u64_to_user_ptr(args-&gt;handles),<br>
+                                    args-&gt;count_handles,<br>
+                                    &amp;syncobjs);<br>
+       if (ret &lt; 0)<br>
+               return ret;<br>
+<br>
+       ret = drm_syncobj_array_wait(dev, file_private,<br>
+                                    NULL, args, syncobjs, true);<br>
+<br>
+       drm_syncobj_array_free(syncobjs, args-&gt;count_handles);<br>
+<br>
+       return ret;<br>
+}<br>
+<br>
+<br>
 int<br>
 drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,<br>
                        struct drm_file *file_private)<br>
diff --git a/include/uapi/drm/drm.h b/include/uapi/drm/drm.h<br>
index cebdb2541eb7..501e86d81f47 100644<br>
--- a/include/uapi/drm/drm.h<br>
+++ b/include/uapi/drm/drm.h<br>
@@ -748,6 +748,19 @@ struct drm_syncobj_wait {<br>
        __u32 pad;<br>
 };<br>
<br>
+struct drm_syncobj_timeline_wait {<br>
+       __u64 handles;<br>
+       /* wait on specific timeline point for every handles*/<br>
+       __u64 points;<br>
+       /* absolute timeout */<br>
+       __s64 timeout_nsec;<br>
+       __u32 count_handles;<br>
+       __u32 flags;<br>
+       __u32 first_signaled; /* only valid when not waiting all */<br>
+       __u32 pad;<br>
+};<br>
+<br>
+<br>
 struct drm_syncobj_array {<br>
        __u64 handles;<br>
        __u32 count_handles;<br>
@@ -910,6 +923,7 @@ extern &quot;C&quot; {<br>
 #define DRM_IOCTL_MODE_GET_LEASE       DRM_IOWR(0xC8, struct drm_mode_get_lease)<br>
 #define DRM_IOCTL_MODE_REVOKE_LEASE    DRM_IOWR(0xC9, struct drm_mode_revoke_lease)<br>
<br>
+#define DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT        DRM_IOWR(0xCA, struct drm_syncobj_timeline_wait)<br>
 /**<br>
  * Device specific ioctls should only be in their respective headers<br>
  * The device specific ioctl range is from 0x40 to 0x9f.<br>
-- <br>
2.17.1<br>
<br>
_______________________________________________<br>
dri-devel mailing list<br>
<a href="mailto:dri-devel@lists.freedesktop.org" target="_blank">dri-devel@lists.freedesktop.org</a><br>
<a href="https://lists.freedesktop.org/mailman/listinfo/dri-devel" target="_blank">https://lists.freedesktop.org/mailman/listinfo/dri-devel</a><u></u><u></u></p>
</blockquote>
</div>
</div>
<p class="MsoNormal"><br>
<br>
<br>
<u></u><u></u></p>
<pre>_______________________________________________<u></u><u></u></pre>
<pre>dri-devel mailing list<u></u><u></u></pre>
<pre><a href="mailto:dri-devel@lists.freedesktop.org" target="_blank">dri-devel@lists.freedesktop.org</a><u></u><u></u></pre>
<pre><a href="https://lists.freedesktop.org/mailman/listinfo/dri-devel" target="_blank">https://lists.freedesktop.org/mailman/listinfo/dri-devel</a><u></u><u></u></pre>
</blockquote>
<p class="MsoNormal"><u></u> <u></u></p>
</div>
</div>
</div>

</blockquote></div></div>
diff mbox series

Patch

diff --git a/drivers/gpu/drm/drm_internal.h b/drivers/gpu/drm/drm_internal.h
index 0c4eb4a9ab31..566d44e3c782 100644
--- a/drivers/gpu/drm/drm_internal.h
+++ b/drivers/gpu/drm/drm_internal.h
@@ -183,6 +183,8 @@  int drm_syncobj_fd_to_handle_ioctl(struct drm_device *dev, void *data,
 				   struct drm_file *file_private);
 int drm_syncobj_wait_ioctl(struct drm_device *dev, void *data,
 			   struct drm_file *file_private);
+int drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,
+				    struct drm_file *file_private);
 int drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,
 			    struct drm_file *file_private);
 int drm_syncobj_signal_ioctl(struct drm_device *dev, void *data,
diff --git a/drivers/gpu/drm/drm_ioctl.c b/drivers/gpu/drm/drm_ioctl.c
index 6b4a633b4240..c0891614f516 100644
--- a/drivers/gpu/drm/drm_ioctl.c
+++ b/drivers/gpu/drm/drm_ioctl.c
@@ -669,6 +669,8 @@  static const struct drm_ioctl_desc drm_ioctls[] = {
 		      DRM_UNLOCKED|DRM_RENDER_ALLOW),
 	DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_WAIT, drm_syncobj_wait_ioctl,
 		      DRM_UNLOCKED|DRM_RENDER_ALLOW),
+	DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT, drm_syncobj_timeline_wait_ioctl,
+		      DRM_UNLOCKED|DRM_RENDER_ALLOW),
 	DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_RESET, drm_syncobj_reset_ioctl,
 		      DRM_UNLOCKED|DRM_RENDER_ALLOW),
 	DRM_IOCTL_DEF(DRM_IOCTL_SYNCOBJ_SIGNAL, drm_syncobj_signal_ioctl,
diff --git a/drivers/gpu/drm/drm_syncobj.c b/drivers/gpu/drm/drm_syncobj.c
index 67472bd77c83..a43de0e4616c 100644
--- a/drivers/gpu/drm/drm_syncobj.c
+++ b/drivers/gpu/drm/drm_syncobj.c
@@ -126,13 +126,14 @@  static void drm_syncobj_add_callback_locked(struct drm_syncobj *syncobj,
 }
 
 static int drm_syncobj_fence_get_or_add_callback(struct drm_syncobj *syncobj,
+						 u64 point,
 						 struct dma_fence **fence,
 						 struct drm_syncobj_cb *cb,
 						 drm_syncobj_func_t func)
 {
 	int ret;
 
-	ret = drm_syncobj_search_fence(syncobj, 0, 0, fence);
+	ret = drm_syncobj_search_fence(syncobj, point, 0, fence);
 	if (!ret)
 		return 1;
 
@@ -143,7 +144,7 @@  static int drm_syncobj_fence_get_or_add_callback(struct drm_syncobj *syncobj,
 	 */
 	if (!list_empty(&syncobj->signal_pt_list)) {
 		spin_unlock(&syncobj->lock);
-		drm_syncobj_search_fence(syncobj, 0, 0, fence);
+		drm_syncobj_search_fence(syncobj, point, 0, fence);
 		if (*fence)
 			return 1;
 		spin_lock(&syncobj->lock);
@@ -358,7 +359,9 @@  void drm_syncobj_replace_fence(struct drm_syncobj *syncobj,
 		spin_lock(&syncobj->lock);
 		list_for_each_entry_safe(cur, tmp, &syncobj->cb_list, node) {
 			list_del_init(&cur->node);
+			spin_unlock(&syncobj->lock);
 			cur->func(syncobj, cur);
+			spin_lock(&syncobj->lock);
 		}
 		spin_unlock(&syncobj->lock);
 	}
@@ -856,6 +859,7 @@  struct syncobj_wait_entry {
 	struct dma_fence *fence;
 	struct dma_fence_cb fence_cb;
 	struct drm_syncobj_cb syncobj_cb;
+	u64    point;
 };
 
 static void syncobj_wait_fence_func(struct dma_fence *fence,
@@ -873,12 +877,13 @@  static void syncobj_wait_syncobj_func(struct drm_syncobj *syncobj,
 	struct syncobj_wait_entry *wait =
 		container_of(cb, struct syncobj_wait_entry, syncobj_cb);
 
-	drm_syncobj_search_fence(syncobj, 0, 0, &wait->fence);
+	drm_syncobj_search_fence(syncobj, wait->point, 0, &wait->fence);
 
 	wake_up_process(wait->task);
 }
 
 static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
+						  void __user *user_points,
 						  uint32_t count,
 						  uint32_t flags,
 						  signed long timeout,
@@ -886,13 +891,27 @@  static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
 {
 	struct syncobj_wait_entry *entries;
 	struct dma_fence *fence;
+	uint64_t *points;
 	signed long ret;
 	uint32_t signaled_count, i;
 
-	entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);
-	if (!entries)
+	points = kmalloc_array(count, sizeof(*points), GFP_KERNEL);
+	if (points == NULL)
 		return -ENOMEM;
 
+	if (!user_points) {
+		memset(points, 0, count * sizeof(uint64_t));
+	} else if (copy_from_user(points, user_points, sizeof(uint64_t) * count)) {
+		ret = -EFAULT;
+		goto err_free_points;
+	}
+
+
+	entries = kcalloc(count, sizeof(*entries), GFP_KERNEL);
+	if (!entries) {
+		ret = -ENOMEM;
+		goto err_free_points;
+	}
 	/* Walk the list of sync objects and initialize entries.  We do
 	 * this up-front so that we can properly return -EINVAL if there is
 	 * a syncobj with a missing fence and then never have the chance of
@@ -901,7 +920,8 @@  static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
 	signaled_count = 0;
 	for (i = 0; i < count; ++i) {
 		entries[i].task = current;
-		ret = drm_syncobj_search_fence(syncobjs[i], 0, 0,
+		entries[i].point = points[i];
+		ret = drm_syncobj_search_fence(syncobjs[i], points[i], 0,
 					       &entries[i].fence);
 		if (!entries[i].fence) {
 			if (flags & DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {
@@ -940,6 +960,7 @@  static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
 	if (flags & DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT) {
 		for (i = 0; i < count; ++i) {
 			drm_syncobj_fence_get_or_add_callback(syncobjs[i],
+							      entries[i].point,
 							      &entries[i].fence,
 							      &entries[i].syncobj_cb,
 							      syncobj_wait_syncobj_func);
@@ -1003,6 +1024,9 @@  static signed long drm_syncobj_array_wait_timeout(struct drm_syncobj **syncobjs,
 	}
 	kfree(entries);
 
+err_free_points:
+	kfree(points);
+
 	return ret;
 }
 
@@ -1041,20 +1065,33 @@  static signed long drm_timeout_abs_to_jiffies(int64_t timeout_nsec)
 static int drm_syncobj_array_wait(struct drm_device *dev,
 				  struct drm_file *file_private,
 				  struct drm_syncobj_wait *wait,
-				  struct drm_syncobj **syncobjs)
+				  struct drm_syncobj_timeline_wait *timeline_wait,
+				  struct drm_syncobj **syncobjs, bool timeline)
 {
-	signed long timeout = drm_timeout_abs_to_jiffies(wait->timeout_nsec);
+	signed long timeout = 0;
 	signed long ret = 0;
 	uint32_t first = ~0;
 
-	ret = drm_syncobj_array_wait_timeout(syncobjs,
-					     wait->count_handles,
-					     wait->flags,
-					     timeout, &first);
+	if (!timeline) {
+		timeout = drm_timeout_abs_to_jiffies(wait->timeout_nsec);
+		ret = drm_syncobj_array_wait_timeout(syncobjs,
+						     NULL,
+						     wait->count_handles,
+						     wait->flags,
+						     timeout, &first);
+		wait->first_signaled = first;
+	} else {
+		timeout = drm_timeout_abs_to_jiffies(timeline_wait->timeout_nsec);
+		ret = drm_syncobj_array_wait_timeout(syncobjs,
+						     u64_to_user_ptr(timeline_wait->points),
+						     timeline_wait->count_handles,
+						     timeline_wait->flags,
+						     timeout, &first);
+		timeline_wait->first_signaled = first;
+	}
 	if (ret < 0)
 		return ret;
 
-	wait->first_signaled = first;
 	if (ret == 0)
 		return -ETIME;
 	return 0;
@@ -1142,13 +1179,47 @@  drm_syncobj_wait_ioctl(struct drm_device *dev, void *data,
 		return ret;
 
 	ret = drm_syncobj_array_wait(dev, file_private,
-				     args, syncobjs);
+				     args, NULL, syncobjs, false);
 
 	drm_syncobj_array_free(syncobjs, args->count_handles);
 
 	return ret;
 }
 
+int
+drm_syncobj_timeline_wait_ioctl(struct drm_device *dev, void *data,
+				struct drm_file *file_private)
+{
+	struct drm_syncobj_timeline_wait *args = data;
+	struct drm_syncobj **syncobjs;
+	int ret = 0;
+
+	if (!drm_core_check_feature(dev, DRIVER_SYNCOBJ))
+		return -ENODEV;
+
+	if (args->flags & ~(DRM_SYNCOBJ_WAIT_FLAGS_WAIT_ALL |
+			    DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT))
+		return -EINVAL;
+
+	if (args->count_handles == 0)
+		return -EINVAL;
+
+	ret = drm_syncobj_array_find(file_private,
+				     u64_to_user_ptr(args->handles),
+				     args->count_handles,
+				     &syncobjs);
+	if (ret < 0)
+		return ret;
+
+	ret = drm_syncobj_array_wait(dev, file_private,
+				     NULL, args, syncobjs, true);
+
+	drm_syncobj_array_free(syncobjs, args->count_handles);
+
+	return ret;
+}
+
+
 int
 drm_syncobj_reset_ioctl(struct drm_device *dev, void *data,
 			struct drm_file *file_private)
diff --git a/include/uapi/drm/drm.h b/include/uapi/drm/drm.h
index cebdb2541eb7..501e86d81f47 100644
--- a/include/uapi/drm/drm.h
+++ b/include/uapi/drm/drm.h
@@ -748,6 +748,19 @@  struct drm_syncobj_wait {
 	__u32 pad;
 };
 
+struct drm_syncobj_timeline_wait {
+	__u64 handles;
+	/* wait on specific timeline point for every handles*/
+	__u64 points;
+	/* absolute timeout */
+	__s64 timeout_nsec;
+	__u32 count_handles;
+	__u32 flags;
+	__u32 first_signaled; /* only valid when not waiting all */
+	__u32 pad;
+};
+
+
 struct drm_syncobj_array {
 	__u64 handles;
 	__u32 count_handles;
@@ -910,6 +923,7 @@  extern "C" {
 #define DRM_IOCTL_MODE_GET_LEASE	DRM_IOWR(0xC8, struct drm_mode_get_lease)
 #define DRM_IOCTL_MODE_REVOKE_LEASE	DRM_IOWR(0xC9, struct drm_mode_revoke_lease)
 
+#define DRM_IOCTL_SYNCOBJ_TIMELINE_WAIT	DRM_IOWR(0xCA, struct drm_syncobj_timeline_wait)
 /**
  * Device specific ioctls should only be in their respective headers
  * The device specific ioctl range is from 0x40 to 0x9f.