diff mbox series

[v5,9/9] drm: vkms: Add support to the RGB565 format

Message ID 20220404204515.42144-10-igormtorrente@gmail.com (mailing list archive)
State New, archived
Headers show
Series Add new formats support to vkms | expand

Commit Message

Igor Matheus Andrade Torrente April 4, 2022, 8:45 p.m. UTC
Adds this common format to vkms.

This commit also adds new helper macros to deal with fixed-point
arithmetic.

It was done to improve the precision of the conversion to ARGB16161616
since the "conversion ratio" is not an integer.

V3: Adapt the handlers to the new format introduced in patch 7 V3.
V5: Minor improvements

Signed-off-by: Igor Torrente <igormtorrente@gmail.com>
---
 drivers/gpu/drm/vkms/vkms_formats.c   | 70 +++++++++++++++++++++++++++
 drivers/gpu/drm/vkms/vkms_plane.c     |  6 ++-
 drivers/gpu/drm/vkms/vkms_writeback.c |  3 +-
 3 files changed, 76 insertions(+), 3 deletions(-)

Comments

Pekka Paalanen April 21, 2022, 10:58 a.m. UTC | #1
On Mon,  4 Apr 2022 17:45:15 -0300
Igor Torrente <igormtorrente@gmail.com> wrote:

> Adds this common format to vkms.
> 
> This commit also adds new helper macros to deal with fixed-point
> arithmetic.
> 
> It was done to improve the precision of the conversion to ARGB16161616
> since the "conversion ratio" is not an integer.
> 
> V3: Adapt the handlers to the new format introduced in patch 7 V3.
> V5: Minor improvements
> 
> Signed-off-by: Igor Torrente <igormtorrente@gmail.com>
> ---
>  drivers/gpu/drm/vkms/vkms_formats.c   | 70 +++++++++++++++++++++++++++
>  drivers/gpu/drm/vkms/vkms_plane.c     |  6 ++-
>  drivers/gpu/drm/vkms/vkms_writeback.c |  3 +-
>  3 files changed, 76 insertions(+), 3 deletions(-)
> 
> diff --git a/drivers/gpu/drm/vkms/vkms_formats.c b/drivers/gpu/drm/vkms/vkms_formats.c
> index 8d913fa7dbde..4af8b295f31e 100644
> --- a/drivers/gpu/drm/vkms/vkms_formats.c
> +++ b/drivers/gpu/drm/vkms/vkms_formats.c
> @@ -5,6 +5,23 @@
>  
>  #include "vkms_formats.h"
>  
> +/* The following macros help doing fixed point arithmetic. */
> +/*
> + * With Fixed-Point scale 15 we have 17 and 15 bits of integer and fractional
> + * parts respectively.
> + *  | 0000 0000 0000 0000 0.000 0000 0000 0000 |
> + * 31                                          0
> + */
> +#define FIXED_SCALE 15

I think this would usually be called a "shift" since it's used in
bit-shifts.

> +
> +#define INT_TO_FIXED(a) ((a) << FIXED_SCALE)
> +#define FIXED_MUL(a, b) ((s32)(((s64)(a) * (b)) >> FIXED_SCALE))
> +#define FIXED_DIV(a, b) ((s32)(((s64)(a) << FIXED_SCALE) / (b)))

A truncating div, ok.

> +/* This macro converts a fixed point number to int, and round half up it */
> +#define FIXED_TO_INT_ROUND(a) (((a) + (1 << (FIXED_SCALE - 1))) >> FIXED_SCALE)

Yes.

> +/* Convert divisor and dividend to Fixed-Point and performs the division */
> +#define INT_TO_FIXED_DIV(a, b) (FIXED_DIV(INT_TO_FIXED(a), INT_TO_FIXED(b)))

Ok, this is obvious to read, even though it's the same as FIXED_DIV()
alone. Not sure the compiler would optimize that extra bit-shift away...

If one wanted to, it would be possible to write type-safe functions for
these so that fixed and integer could not be mixed up.

> +
>  static int pixel_offset(const struct vkms_frame_info *frame_info, int x, int y)
>  {
>  	return frame_info->offset + (y * frame_info->pitch)
> @@ -112,6 +129,30 @@ static void XRGB16161616_to_argb_u16(struct line_buffer *stage_buffer,
>  	}
>  }
>  
> +static void RGB565_to_argb_u16(struct line_buffer *stage_buffer,
> +			       const struct vkms_frame_info *frame_info, int y)
> +{
> +	struct pixel_argb_u16 *out_pixels = stage_buffer->pixels;
> +	u16 *src_pixels = get_packed_src_addr(frame_info, y);
> +	int x, x_limit = min_t(size_t, drm_rect_width(&frame_info->dst),
> +			       stage_buffer->n_pixels);
> +
> +	for (x = 0; x < x_limit; x++, src_pixels++) {
> +		u16 rgb_565 = le16_to_cpu(*src_pixels);
> +		int fp_r = INT_TO_FIXED((rgb_565 >> 11) & 0x1f);
> +		int fp_g = INT_TO_FIXED((rgb_565 >> 5) & 0x3f);
> +		int fp_b = INT_TO_FIXED(rgb_565 & 0x1f);
> +
> +		int fp_rb_ratio = INT_TO_FIXED_DIV(65535, 31);
> +		int fp_g_ratio = INT_TO_FIXED_DIV(65535, 63);

These two should be outside of the loop since they are constants.
Likely no difference for performance because the compiler is probably
doing that already, but I think it would read better.

> +
> +		out_pixels[x].a = (u16)0xffff;
> +		out_pixels[x].r = FIXED_TO_INT_ROUND(FIXED_MUL(fp_r, fp_rb_ratio));
> +		out_pixels[x].g = FIXED_TO_INT_ROUND(FIXED_MUL(fp_g, fp_g_ratio));
> +		out_pixels[x].b = FIXED_TO_INT_ROUND(FIXED_MUL(fp_b, fp_rb_ratio));

Looks good.

> +	}
> +}
> +
>  
>  /*
>   * The following  functions take an line of argb_u16 pixels from the
> @@ -199,6 +240,31 @@ static void argb_u16_to_XRGB16161616(struct vkms_frame_info *frame_info,
>  	}
>  }
>  
> +static void argb_u16_to_RGB565(struct vkms_frame_info *frame_info,
> +			       const struct line_buffer *src_buffer, int y)
> +{
> +	int x, x_dst = frame_info->dst.x1;
> +	u16 *dst_pixels = packed_pixels_addr(frame_info, x_dst, y);
> +	struct pixel_argb_u16 *in_pixels = src_buffer->pixels;
> +	int x_limit = min_t(size_t, drm_rect_width(&frame_info->dst),
> +			    src_buffer->n_pixels);
> +
> +	for (x = 0; x < x_limit; x++, dst_pixels++) {
> +		int fp_r = INT_TO_FIXED(in_pixels[x].r);
> +		int fp_g = INT_TO_FIXED(in_pixels[x].g);
> +		int fp_b = INT_TO_FIXED(in_pixels[x].b);
> +
> +		int fp_rb_ratio = INT_TO_FIXED_DIV(65535, 31);
> +		int fp_g_ratio = INT_TO_FIXED_DIV(65535, 63);

Move these out of the loop.

> +
> +		u16 r = FIXED_TO_INT_ROUND(FIXED_DIV(fp_r, fp_rb_ratio));
> +		u16 g = FIXED_TO_INT_ROUND(FIXED_DIV(fp_g, fp_g_ratio));
> +		u16 b = FIXED_TO_INT_ROUND(FIXED_DIV(fp_b, fp_rb_ratio));
> +
> +		*dst_pixels = cpu_to_le16(r << 11 | g << 5 | b);

Looks good.

You are using signed variables (int, s64, s32) when negative values
should never occur. It doesn't seem wrong, just unexpected.

The use of int in code vs. s32 in the macros is a bit inconsistent as
well.

> +	}
> +}
> +
>  plane_format_transform_func get_plane_fmt_transform_function(u32 format)
>  {
>  	if (format == DRM_FORMAT_ARGB8888)
> @@ -209,6 +275,8 @@ plane_format_transform_func get_plane_fmt_transform_function(u32 format)
>  		return &ARGB16161616_to_argb_u16;
>  	else if (format == DRM_FORMAT_XRGB16161616)
>  		return &XRGB16161616_to_argb_u16;
> +	else if (format == DRM_FORMAT_RGB565)
> +		return &RGB565_to_argb_u16;
>  	else
>  		return NULL;
>  }
> @@ -223,6 +291,8 @@ wb_format_transform_func get_wb_fmt_transform_function(u32 format)
>  		return &argb_u16_to_ARGB16161616;
>  	else if (format == DRM_FORMAT_XRGB16161616)
>  		return &argb_u16_to_XRGB16161616;
> +	else if (format == DRM_FORMAT_RGB565)
> +		return &argb_u16_to_RGB565;

Now it's starting to become clear that a switch statement would be nice.

>  	else
>  		return NULL;
>  }
> diff --git a/drivers/gpu/drm/vkms/vkms_plane.c b/drivers/gpu/drm/vkms/vkms_plane.c
> index 60054a85204a..94a8e412886f 100644
> --- a/drivers/gpu/drm/vkms/vkms_plane.c
> +++ b/drivers/gpu/drm/vkms/vkms_plane.c
> @@ -14,14 +14,16 @@
>  
>  static const u32 vkms_formats[] = {
>  	DRM_FORMAT_XRGB8888,
> -	DRM_FORMAT_XRGB16161616
> +	DRM_FORMAT_XRGB16161616,
> +	DRM_FORMAT_RGB565
>  };
>  
>  static const u32 vkms_plane_formats[] = {
>  	DRM_FORMAT_ARGB8888,
>  	DRM_FORMAT_XRGB8888,
>  	DRM_FORMAT_XRGB16161616,
> -	DRM_FORMAT_ARGB16161616
> +	DRM_FORMAT_ARGB16161616,
> +	DRM_FORMAT_RGB565
>  };
>  
>  static struct drm_plane_state *
> diff --git a/drivers/gpu/drm/vkms/vkms_writeback.c b/drivers/gpu/drm/vkms/vkms_writeback.c
> index cb63a5da9af1..98da7bee0f4b 100644
> --- a/drivers/gpu/drm/vkms/vkms_writeback.c
> +++ b/drivers/gpu/drm/vkms/vkms_writeback.c
> @@ -16,7 +16,8 @@
>  static const u32 vkms_wb_formats[] = {
>  	DRM_FORMAT_XRGB8888,
>  	DRM_FORMAT_XRGB16161616,
> -	DRM_FORMAT_ARGB16161616
> +	DRM_FORMAT_ARGB16161616,
> +	DRM_FORMAT_RGB565
>  };
>  
>  static const struct drm_connector_funcs vkms_wb_connector_funcs = {

I wonder, would it be possible to add a unit test to make sure that
get_plane_fmt_transform_function() or get_wb_fmt_transform_function()
does not return NULL for any of the listed formats, respectively?
Or is that too paranoid?


Thanks,
pq
Igor Matheus Andrade Torrente April 27, 2022, 12:53 a.m. UTC | #2
Hi Pekka,

On 4/21/22 07:58, Pekka Paalanen wrote:
> On Mon,  4 Apr 2022 17:45:15 -0300
> Igor Torrente <igormtorrente@gmail.com> wrote:
> 
>> Adds this common format to vkms.
>>
>> This commit also adds new helper macros to deal with fixed-point
>> arithmetic.
>>
>> It was done to improve the precision of the conversion to ARGB16161616
>> since the "conversion ratio" is not an integer.
>>
>> V3: Adapt the handlers to the new format introduced in patch 7 V3.
>> V5: Minor improvements
>>
>> Signed-off-by: Igor Torrente <igormtorrente@gmail.com>
>> ---
>>   drivers/gpu/drm/vkms/vkms_formats.c   | 70 +++++++++++++++++++++++++++
>>   drivers/gpu/drm/vkms/vkms_plane.c     |  6 ++-
>>   drivers/gpu/drm/vkms/vkms_writeback.c |  3 +-
>>   3 files changed, 76 insertions(+), 3 deletions(-)
>>
>> diff --git a/drivers/gpu/drm/vkms/vkms_formats.c b/drivers/gpu/drm/vkms/vkms_formats.c
>> index 8d913fa7dbde..4af8b295f31e 100644
>> --- a/drivers/gpu/drm/vkms/vkms_formats.c
>> +++ b/drivers/gpu/drm/vkms/vkms_formats.c
>> @@ -5,6 +5,23 @@
>>   
>>   #include "vkms_formats.h"
>>   
>> +/* The following macros help doing fixed point arithmetic. */
>> +/*
>> + * With Fixed-Point scale 15 we have 17 and 15 bits of integer and fractional
>> + * parts respectively.
>> + *  | 0000 0000 0000 0000 0.000 0000 0000 0000 |
>> + * 31                                          0
>> + */
>> +#define FIXED_SCALE 15
> 
> I think this would usually be called a "shift" since it's used in
> bit-shifts.

Ok, I will rename this.

> 
>> +
>> +#define INT_TO_FIXED(a) ((a) << FIXED_SCALE)
>> +#define FIXED_MUL(a, b) ((s32)(((s64)(a) * (b)) >> FIXED_SCALE))
>> +#define FIXED_DIV(a, b) ((s32)(((s64)(a) << FIXED_SCALE) / (b)))
> 
> A truncating div, ok.
> 
>> +/* This macro converts a fixed point number to int, and round half up it */
>> +#define FIXED_TO_INT_ROUND(a) (((a) + (1 << (FIXED_SCALE - 1))) >> FIXED_SCALE)
> 
> Yes.
> 
>> +/* Convert divisor and dividend to Fixed-Point and performs the division */
>> +#define INT_TO_FIXED_DIV(a, b) (FIXED_DIV(INT_TO_FIXED(a), INT_TO_FIXED(b)))
> 
> Ok, this is obvious to read, even though it's the same as FIXED_DIV()
> alone. Not sure the compiler would optimize that extra bit-shift away...
> 
> If one wanted to, it would be possible to write type-safe functions for
> these so that fixed and integer could not be mixed up.

Ok, I will move to a function.

> 
>> +
>>   static int pixel_offset(const struct vkms_frame_info *frame_info, int x, int y)
>>   {
>>   	return frame_info->offset + (y * frame_info->pitch)
>> @@ -112,6 +129,30 @@ static void XRGB16161616_to_argb_u16(struct line_buffer *stage_buffer,
>>   	}
>>   }
>>   
>> +static void RGB565_to_argb_u16(struct line_buffer *stage_buffer,
>> +			       const struct vkms_frame_info *frame_info, int y)
>> +{
>> +	struct pixel_argb_u16 *out_pixels = stage_buffer->pixels;
>> +	u16 *src_pixels = get_packed_src_addr(frame_info, y);
>> +	int x, x_limit = min_t(size_t, drm_rect_width(&frame_info->dst),
>> +			       stage_buffer->n_pixels);
>> +
>> +	for (x = 0; x < x_limit; x++, src_pixels++) {
>> +		u16 rgb_565 = le16_to_cpu(*src_pixels);
>> +		int fp_r = INT_TO_FIXED((rgb_565 >> 11) & 0x1f);
>> +		int fp_g = INT_TO_FIXED((rgb_565 >> 5) & 0x3f);
>> +		int fp_b = INT_TO_FIXED(rgb_565 & 0x1f);
>> +
>> +		int fp_rb_ratio = INT_TO_FIXED_DIV(65535, 31);
>> +		int fp_g_ratio = INT_TO_FIXED_DIV(65535, 63);
> 
> These two should be outside of the loop since they are constants.
> Likely no difference for performance because the compiler is probably
> doing that already, but I think it would read better.

I will move it.

> 
>> +
>> +		out_pixels[x].a = (u16)0xffff;
>> +		out_pixels[x].r = FIXED_TO_INT_ROUND(FIXED_MUL(fp_r, fp_rb_ratio));
>> +		out_pixels[x].g = FIXED_TO_INT_ROUND(FIXED_MUL(fp_g, fp_g_ratio));
>> +		out_pixels[x].b = FIXED_TO_INT_ROUND(FIXED_MUL(fp_b, fp_rb_ratio));
> 
> Looks good.
> 
>> +	}
>> +}
>> +
>>   
>>   /*
>>    * The following  functions take an line of argb_u16 pixels from the
>> @@ -199,6 +240,31 @@ static void argb_u16_to_XRGB16161616(struct vkms_frame_info *frame_info,
>>   	}
>>   }
>>   
>> +static void argb_u16_to_RGB565(struct vkms_frame_info *frame_info,
>> +			       const struct line_buffer *src_buffer, int y)
>> +{
>> +	int x, x_dst = frame_info->dst.x1;
>> +	u16 *dst_pixels = packed_pixels_addr(frame_info, x_dst, y);
>> +	struct pixel_argb_u16 *in_pixels = src_buffer->pixels;
>> +	int x_limit = min_t(size_t, drm_rect_width(&frame_info->dst),
>> +			    src_buffer->n_pixels);
>> +
>> +	for (x = 0; x < x_limit; x++, dst_pixels++) {
>> +		int fp_r = INT_TO_FIXED(in_pixels[x].r);
>> +		int fp_g = INT_TO_FIXED(in_pixels[x].g);
>> +		int fp_b = INT_TO_FIXED(in_pixels[x].b);
>> +
>> +		int fp_rb_ratio = INT_TO_FIXED_DIV(65535, 31);
>> +		int fp_g_ratio = INT_TO_FIXED_DIV(65535, 63);
> 
> Move these out of the loop.
> 
>> +
>> +		u16 r = FIXED_TO_INT_ROUND(FIXED_DIV(fp_r, fp_rb_ratio));
>> +		u16 g = FIXED_TO_INT_ROUND(FIXED_DIV(fp_g, fp_g_ratio));
>> +		u16 b = FIXED_TO_INT_ROUND(FIXED_DIV(fp_b, fp_rb_ratio));
>> +
>> +		*dst_pixels = cpu_to_le16(r << 11 | g << 5 | b);
> 
> Looks good.
> 
> You are using signed variables (int, s64, s32) when negative values
> should never occur. It doesn't seem wrong, just unexpected.

I left the signal so I can reuse them in the YUV formats.

> 
> The use of int in code vs. s32 in the macros is a bit inconsistent as
> well.

Right. I think I will stick with s32 and s64 then.

> 
>> +	}
>> +}
>> +
>>   plane_format_transform_func get_plane_fmt_transform_function(u32 format)
>>   {
>>   	if (format == DRM_FORMAT_ARGB8888)
>> @@ -209,6 +275,8 @@ plane_format_transform_func get_plane_fmt_transform_function(u32 format)
>>   		return &ARGB16161616_to_argb_u16;
>>   	else if (format == DRM_FORMAT_XRGB16161616)
>>   		return &XRGB16161616_to_argb_u16;
>> +	else if (format == DRM_FORMAT_RGB565)
>> +		return &RGB565_to_argb_u16;
>>   	else
>>   		return NULL;
>>   }
>> @@ -223,6 +291,8 @@ wb_format_transform_func get_wb_fmt_transform_function(u32 format)
>>   		return &argb_u16_to_ARGB16161616;
>>   	else if (format == DRM_FORMAT_XRGB16161616)
>>   		return &argb_u16_to_XRGB16161616;
>> +	else if (format == DRM_FORMAT_RGB565)
>> +		return &argb_u16_to_RGB565;
> 
> Now it's starting to become clear that a switch statement would be nice.
> 
>>   	else
>>   		return NULL;
>>   }
>> diff --git a/drivers/gpu/drm/vkms/vkms_plane.c b/drivers/gpu/drm/vkms/vkms_plane.c
>> index 60054a85204a..94a8e412886f 100644
>> --- a/drivers/gpu/drm/vkms/vkms_plane.c
>> +++ b/drivers/gpu/drm/vkms/vkms_plane.c
>> @@ -14,14 +14,16 @@
>>   
>>   static const u32 vkms_formats[] = {
>>   	DRM_FORMAT_XRGB8888,
>> -	DRM_FORMAT_XRGB16161616
>> +	DRM_FORMAT_XRGB16161616,
>> +	DRM_FORMAT_RGB565
>>   };
>>   
>>   static const u32 vkms_plane_formats[] = {
>>   	DRM_FORMAT_ARGB8888,
>>   	DRM_FORMAT_XRGB8888,
>>   	DRM_FORMAT_XRGB16161616,
>> -	DRM_FORMAT_ARGB16161616
>> +	DRM_FORMAT_ARGB16161616,
>> +	DRM_FORMAT_RGB565
>>   };
>>   
>>   static struct drm_plane_state *
>> diff --git a/drivers/gpu/drm/vkms/vkms_writeback.c b/drivers/gpu/drm/vkms/vkms_writeback.c
>> index cb63a5da9af1..98da7bee0f4b 100644
>> --- a/drivers/gpu/drm/vkms/vkms_writeback.c
>> +++ b/drivers/gpu/drm/vkms/vkms_writeback.c
>> @@ -16,7 +16,8 @@
>>   static const u32 vkms_wb_formats[] = {
>>   	DRM_FORMAT_XRGB8888,
>>   	DRM_FORMAT_XRGB16161616,
>> -	DRM_FORMAT_ARGB16161616
>> +	DRM_FORMAT_ARGB16161616,
>> +	DRM_FORMAT_RGB565
>>   };
>>   
>>   static const struct drm_connector_funcs vkms_wb_connector_funcs = {
> 
> I wonder, would it be possible to add a unit test to make sure that
> get_plane_fmt_transform_function() or get_wb_fmt_transform_function()
> does not return NULL for any of the listed formats, respectively?
> Or is that too paranoid?

I'm not opposed to it. But I also don't think it needs to be in this 
series of patches either.

A new todo maybe?

> 
> 
> Thanks,
> pq
Pekka Paalanen April 27, 2022, 7:55 a.m. UTC | #3
On Tue, 26 Apr 2022 21:53:19 -0300
Igor Torrente <igormtorrente@gmail.com> wrote:

> Hi Pekka,
> 
> On 4/21/22 07:58, Pekka Paalanen wrote:
> > On Mon,  4 Apr 2022 17:45:15 -0300
> > Igor Torrente <igormtorrente@gmail.com> wrote:
> >   
> >> Adds this common format to vkms.
> >>
> >> This commit also adds new helper macros to deal with fixed-point
> >> arithmetic.
> >>
> >> It was done to improve the precision of the conversion to ARGB16161616
> >> since the "conversion ratio" is not an integer.
> >>
> >> V3: Adapt the handlers to the new format introduced in patch 7 V3.
> >> V5: Minor improvements
> >>
> >> Signed-off-by: Igor Torrente <igormtorrente@gmail.com>
> >> ---
> >>   drivers/gpu/drm/vkms/vkms_formats.c   | 70 +++++++++++++++++++++++++++
> >>   drivers/gpu/drm/vkms/vkms_plane.c     |  6 ++-
> >>   drivers/gpu/drm/vkms/vkms_writeback.c |  3 +-
> >>   3 files changed, 76 insertions(+), 3 deletions(-)
> >>
> >> diff --git a/drivers/gpu/drm/vkms/vkms_formats.c b/drivers/gpu/drm/vkms/vkms_formats.c
> >> index 8d913fa7dbde..4af8b295f31e 100644
> >> --- a/drivers/gpu/drm/vkms/vkms_formats.c
> >> +++ b/drivers/gpu/drm/vkms/vkms_formats.c
> >> @@ -5,6 +5,23 @@
> >>   
> >>   #include "vkms_formats.h"
> >>   
> >> +/* The following macros help doing fixed point arithmetic. */
> >> +/*
> >> + * With Fixed-Point scale 15 we have 17 and 15 bits of integer and fractional
> >> + * parts respectively.
> >> + *  | 0000 0000 0000 0000 0.000 0000 0000 0000 |
> >> + * 31                                          0
> >> + */
> >> +#define FIXED_SCALE 15  
> > 
> > I think this would usually be called a "shift" since it's used in
> > bit-shifts.  
> 
> Ok, I will rename this.
> 
> >   
> >> +
> >> +#define INT_TO_FIXED(a) ((a) << FIXED_SCALE)
> >> +#define FIXED_MUL(a, b) ((s32)(((s64)(a) * (b)) >> FIXED_SCALE))
> >> +#define FIXED_DIV(a, b) ((s32)(((s64)(a) << FIXED_SCALE) / (b)))  
> > 
> > A truncating div, ok.
> >   
> >> +/* This macro converts a fixed point number to int, and round half up it */
> >> +#define FIXED_TO_INT_ROUND(a) (((a) + (1 << (FIXED_SCALE - 1))) >> FIXED_SCALE)  
> > 
> > Yes.
> >   
> >> +/* Convert divisor and dividend to Fixed-Point and performs the division */
> >> +#define INT_TO_FIXED_DIV(a, b) (FIXED_DIV(INT_TO_FIXED(a), INT_TO_FIXED(b)))  
> > 
> > Ok, this is obvious to read, even though it's the same as FIXED_DIV()
> > alone. Not sure the compiler would optimize that extra bit-shift away...
> > 
> > If one wanted to, it would be possible to write type-safe functions for
> > these so that fixed and integer could not be mixed up.  
> 
> Ok, I will move to a function.

That's not all.

If you want it type-safe, then you need something like

struct vkms_fixed_point {
	s32 value;
};

And use `struct vkms_fixed_point` (by value) everywhere where you pass
a fixed point value, and never as a plain s32 type. Then it will be
impossible to do incorrect arithmetic or conversions by accident on
fixed point values.

Is it worth it? I don't know, since it's limited into this one file.

A simple 'typedef s32 vkms_fixed_point' does not work, because it does
not prevent computing with vkms_fixed_point as if it was just a normal
s32. Using a struct prevents that.

I wonder if the kernel doesn't already have something like this
available in general...

> >> +		u16 r = FIXED_TO_INT_ROUND(FIXED_DIV(fp_r, fp_rb_ratio));
> >> +		u16 g = FIXED_TO_INT_ROUND(FIXED_DIV(fp_g, fp_g_ratio));
> >> +		u16 b = FIXED_TO_INT_ROUND(FIXED_DIV(fp_b, fp_rb_ratio));
> >> +
> >> +		*dst_pixels = cpu_to_le16(r << 11 | g << 5 | b);  
> > 
> > Looks good.
> > 
> > You are using signed variables (int, s64, s32) when negative values
> > should never occur. It doesn't seem wrong, just unexpected.  
> 
> I left the signal so I can reuse them in the YUV formats.

Good point.

> 
> > 
> > The use of int in code vs. s32 in the macros is a bit inconsistent as
> > well.  
> 
> Right. I think I will stick with s32 and s64 then.

...

> >> diff --git a/drivers/gpu/drm/vkms/vkms_writeback.c b/drivers/gpu/drm/vkms/vkms_writeback.c
> >> index cb63a5da9af1..98da7bee0f4b 100644
> >> --- a/drivers/gpu/drm/vkms/vkms_writeback.c
> >> +++ b/drivers/gpu/drm/vkms/vkms_writeback.c
> >> @@ -16,7 +16,8 @@
> >>   static const u32 vkms_wb_formats[] = {
> >>   	DRM_FORMAT_XRGB8888,
> >>   	DRM_FORMAT_XRGB16161616,
> >> -	DRM_FORMAT_ARGB16161616
> >> +	DRM_FORMAT_ARGB16161616,
> >> +	DRM_FORMAT_RGB565
> >>   };
> >>   
> >>   static const struct drm_connector_funcs vkms_wb_connector_funcs = {  
> > 
> > I wonder, would it be possible to add a unit test to make sure that
> > get_plane_fmt_transform_function() or get_wb_fmt_transform_function()
> > does not return NULL for any of the listed formats, respectively?
> > Or is that too paranoid?  
> 
> I'm not opposed to it. But I also don't think it needs to be in this 
> series of patches either.
> 
> A new todo maybe?

If it's a good thing, then it belongs in this series, because those
function getters are introduced in this series, opening the door for
the mistakes that the tests would prevent. I don't mean IGT tests but
kernel internal tests. I think there is a unit test framework?

You really should get a kernel maintainer's opinion on these questions,
as I am not a kernel developer.


Thanks,
pq
Igor Matheus Andrade Torrente May 6, 2022, 11:05 p.m. UTC | #4
Hi Pekka,

On 4/27/22 04:55, Pekka Paalanen wrote:
> On Tue, 26 Apr 2022 21:53:19 -0300
> Igor Torrente <igormtorrente@gmail.com> wrote:
> 
>> Hi Pekka,
>>
>> On 4/21/22 07:58, Pekka Paalanen wrote:
>>> On Mon,  4 Apr 2022 17:45:15 -0300
>>> Igor Torrente <igormtorrente@gmail.com> wrote:
>>>    
>>>> Adds this common format to vkms.
>>>>
>>>> This commit also adds new helper macros to deal with fixed-point
>>>> arithmetic.
>>>>
>>>> It was done to improve the precision of the conversion to ARGB16161616
>>>> since the "conversion ratio" is not an integer.
>>>>
>>>> V3: Adapt the handlers to the new format introduced in patch 7 V3.
>>>> V5: Minor improvements
>>>>
>>>> Signed-off-by: Igor Torrente <igormtorrente@gmail.com>
>>>> ---
>>>>    drivers/gpu/drm/vkms/vkms_formats.c   | 70 +++++++++++++++++++++++++++
>>>>    drivers/gpu/drm/vkms/vkms_plane.c     |  6 ++-
>>>>    drivers/gpu/drm/vkms/vkms_writeback.c |  3 +-
>>>>    3 files changed, 76 insertions(+), 3 deletions(-)
>>>>
>>>> diff --git a/drivers/gpu/drm/vkms/vkms_formats.c b/drivers/gpu/drm/vkms/vkms_formats.c
>>>> index 8d913fa7dbde..4af8b295f31e 100644
>>>> --- a/drivers/gpu/drm/vkms/vkms_formats.c
>>>> +++ b/drivers/gpu/drm/vkms/vkms_formats.c
>>>> @@ -5,6 +5,23 @@
>>>>    
>>>>    #include "vkms_formats.h"
>>>>    
>>>> +/* The following macros help doing fixed point arithmetic. */
>>>> +/*
>>>> + * With Fixed-Point scale 15 we have 17 and 15 bits of integer and fractional
>>>> + * parts respectively.
>>>> + *  | 0000 0000 0000 0000 0.000 0000 0000 0000 |
>>>> + * 31                                          0
>>>> + */
>>>> +#define FIXED_SCALE 15
>>>
>>> I think this would usually be called a "shift" since it's used in
>>> bit-shifts.
>>
>> Ok, I will rename this.
>>
>>>    
>>>> +
>>>> +#define INT_TO_FIXED(a) ((a) << FIXED_SCALE)
>>>> +#define FIXED_MUL(a, b) ((s32)(((s64)(a) * (b)) >> FIXED_SCALE))
>>>> +#define FIXED_DIV(a, b) ((s32)(((s64)(a) << FIXED_SCALE) / (b)))
>>>
>>> A truncating div, ok.
>>>    
>>>> +/* This macro converts a fixed point number to int, and round half up it */
>>>> +#define FIXED_TO_INT_ROUND(a) (((a) + (1 << (FIXED_SCALE - 1))) >> FIXED_SCALE)
>>>
>>> Yes.
>>>    
>>>> +/* Convert divisor and dividend to Fixed-Point and performs the division */
>>>> +#define INT_TO_FIXED_DIV(a, b) (FIXED_DIV(INT_TO_FIXED(a), INT_TO_FIXED(b)))
>>>
>>> Ok, this is obvious to read, even though it's the same as FIXED_DIV()
>>> alone. Not sure the compiler would optimize that extra bit-shift away...
>>>
>>> If one wanted to, it would be possible to write type-safe functions for
>>> these so that fixed and integer could not be mixed up.
>>
>> Ok, I will move to a function.
> 
> That's not all.
> 
> If you want it type-safe, then you need something like
> 
> struct vkms_fixed_point {
> 	s32 value;
> };
> 
> And use `struct vkms_fixed_point` (by value) everywhere where you pass
> a fixed point value, and never as a plain s32 type. Then it will be
> impossible to do incorrect arithmetic or conversions by accident on
> fixed point values.
> 
> Is it worth it? I don't know, since it's limited into this one file.
> 
> A simple 'typedef s32 vkms_fixed_point' does not work, because it does
> not prevent computing with vkms_fixed_point as if it was just a normal
> s32. Using a struct prevents that.

ohhh. Got it!

> 
> I wonder if the kernel doesn't already have something like this
> available in general...

After some time searching I found `include/drm/drm_fixed.h`[1].

It seems fine. There are minor things to consider:

1. It doesn't have a `FIXED_TO_INT_ROUND` equivalent.
2. We can use `fixed20_12` for rgb565 but We have to use s64 for YUV
formats or add a `sfixed20_12` with s32.

In terms of consistency, do you think worth using this "library" given
that we may need to use two distinct ways to represent the fixed point
soonish? Or it's better to implement `sfixed20_12`? Or just continue 
with the
current macros?

[1] - https://elixir.bootlin.com/linux/latest/source/include/drm/drm_fixed.h

> 
>>>> +		u16 r = FIXED_TO_INT_ROUND(FIXED_DIV(fp_r, fp_rb_ratio));
>>>> +		u16 g = FIXED_TO_INT_ROUND(FIXED_DIV(fp_g, fp_g_ratio));
>>>> +		u16 b = FIXED_TO_INT_ROUND(FIXED_DIV(fp_b, fp_rb_ratio));
>>>> +
>>>> +		*dst_pixels = cpu_to_le16(r << 11 | g << 5 | b);
>>>
>>> Looks good.
>>>
>>> You are using signed variables (int, s64, s32) when negative values
>>> should never occur. It doesn't seem wrong, just unexpected.
>>
>> I left the signal so I can reuse them in the YUV formats.
> 
> Good point.
> 
>>
>>>
>>> The use of int in code vs. s32 in the macros is a bit inconsistent as
>>> well.
>>
>> Right. I think I will stick with s32 and s64 then.
> 
> ...
> 
>>>> diff --git a/drivers/gpu/drm/vkms/vkms_writeback.c b/drivers/gpu/drm/vkms/vkms_writeback.c
>>>> index cb63a5da9af1..98da7bee0f4b 100644
>>>> --- a/drivers/gpu/drm/vkms/vkms_writeback.c
>>>> +++ b/drivers/gpu/drm/vkms/vkms_writeback.c
>>>> @@ -16,7 +16,8 @@
>>>>    static const u32 vkms_wb_formats[] = {
>>>>    	DRM_FORMAT_XRGB8888,
>>>>    	DRM_FORMAT_XRGB16161616,
>>>> -	DRM_FORMAT_ARGB16161616
>>>> +	DRM_FORMAT_ARGB16161616,
>>>> +	DRM_FORMAT_RGB565
>>>>    };
>>>>    
>>>>    static const struct drm_connector_funcs vkms_wb_connector_funcs = {
>>>
>>> I wonder, would it be possible to add a unit test to make sure that
>>> get_plane_fmt_transform_function() or get_wb_fmt_transform_function()
>>> does not return NULL for any of the listed formats, respectively?
>>> Or is that too paranoid?
>>
>> I'm not opposed to it. But I also don't think it needs to be in this
>> series of patches either.
>>
>> A new todo maybe?
> 
> If it's a good thing, then it belongs in this series, because those
> function getters are introduced in this series, opening the door for
> the mistakes that the tests would prevent. I don't mean IGT tests but
> kernel internal tests. I think there is a unit test framework?

Yeah, kernel have kunit and kselftest. Idk what are the differences
between them or how to use them, but I know they exist.

> 
> You really should get a kernel maintainer's opinion on these questions,
> as I am not a kernel developer.

Ok.

> 
> 
> Thanks,
> pq
Pekka Paalanen May 9, 2022, 7:53 a.m. UTC | #5
On Fri, 6 May 2022 20:05:39 -0300
Igor Torrente <igormtorrente@gmail.com> wrote:

> Hi Pekka,
> 
> On 4/27/22 04:55, Pekka Paalanen wrote:
> > On Tue, 26 Apr 2022 21:53:19 -0300
> > Igor Torrente <igormtorrente@gmail.com> wrote:
> >   
> >> Hi Pekka,
> >>
> >> On 4/21/22 07:58, Pekka Paalanen wrote:  
> >>> On Mon,  4 Apr 2022 17:45:15 -0300
> >>> Igor Torrente <igormtorrente@gmail.com> wrote:
> >>>      
> >>>> Adds this common format to vkms.
> >>>>
> >>>> This commit also adds new helper macros to deal with fixed-point
> >>>> arithmetic.
> >>>>
> >>>> It was done to improve the precision of the conversion to ARGB16161616
> >>>> since the "conversion ratio" is not an integer.
> >>>>
> >>>> V3: Adapt the handlers to the new format introduced in patch 7 V3.
> >>>> V5: Minor improvements
> >>>>
> >>>> Signed-off-by: Igor Torrente <igormtorrente@gmail.com>
> >>>> ---
> >>>>    drivers/gpu/drm/vkms/vkms_formats.c   | 70 +++++++++++++++++++++++++++
> >>>>    drivers/gpu/drm/vkms/vkms_plane.c     |  6 ++-
> >>>>    drivers/gpu/drm/vkms/vkms_writeback.c |  3 +-
> >>>>    3 files changed, 76 insertions(+), 3 deletions(-)
> >>>>
> >>>> diff --git a/drivers/gpu/drm/vkms/vkms_formats.c b/drivers/gpu/drm/vkms/vkms_formats.c
> >>>> index 8d913fa7dbde..4af8b295f31e 100644
> >>>> --- a/drivers/gpu/drm/vkms/vkms_formats.c
> >>>> +++ b/drivers/gpu/drm/vkms/vkms_formats.c
> >>>> @@ -5,6 +5,23 @@
> >>>>    
> >>>>    #include "vkms_formats.h"
> >>>>    
> >>>> +/* The following macros help doing fixed point arithmetic. */
> >>>> +/*
> >>>> + * With Fixed-Point scale 15 we have 17 and 15 bits of integer and fractional
> >>>> + * parts respectively.
> >>>> + *  | 0000 0000 0000 0000 0.000 0000 0000 0000 |
> >>>> + * 31                                          0
> >>>> + */
> >>>> +#define FIXED_SCALE 15  
> >>>
> >>> I think this would usually be called a "shift" since it's used in
> >>> bit-shifts.  
> >>
> >> Ok, I will rename this.
> >>  
> >>>      
> >>>> +
> >>>> +#define INT_TO_FIXED(a) ((a) << FIXED_SCALE)
> >>>> +#define FIXED_MUL(a, b) ((s32)(((s64)(a) * (b)) >> FIXED_SCALE))
> >>>> +#define FIXED_DIV(a, b) ((s32)(((s64)(a) << FIXED_SCALE) / (b)))  
> >>>
> >>> A truncating div, ok.
> >>>      
> >>>> +/* This macro converts a fixed point number to int, and round half up it */
> >>>> +#define FIXED_TO_INT_ROUND(a) (((a) + (1 << (FIXED_SCALE - 1))) >> FIXED_SCALE)  
> >>>
> >>> Yes.
> >>>      
> >>>> +/* Convert divisor and dividend to Fixed-Point and performs the division */
> >>>> +#define INT_TO_FIXED_DIV(a, b) (FIXED_DIV(INT_TO_FIXED(a), INT_TO_FIXED(b)))  
> >>>
> >>> Ok, this is obvious to read, even though it's the same as FIXED_DIV()
> >>> alone. Not sure the compiler would optimize that extra bit-shift away...
> >>>
> >>> If one wanted to, it would be possible to write type-safe functions for
> >>> these so that fixed and integer could not be mixed up.  
> >>
> >> Ok, I will move to a function.  
> > 
> > That's not all.
> > 
> > If you want it type-safe, then you need something like
> > 
> > struct vkms_fixed_point {
> > 	s32 value;
> > };
> > 
> > And use `struct vkms_fixed_point` (by value) everywhere where you pass
> > a fixed point value, and never as a plain s32 type. Then it will be
> > impossible to do incorrect arithmetic or conversions by accident on
> > fixed point values.
> > 
> > Is it worth it? I don't know, since it's limited into this one file.
> > 
> > A simple 'typedef s32 vkms_fixed_point' does not work, because it does
> > not prevent computing with vkms_fixed_point as if it was just a normal
> > s32. Using a struct prevents that.  
> 
> ohhh. Got it!
> 
> > 
> > I wonder if the kernel doesn't already have something like this
> > available in general...  
> 
> After some time searching I found `include/drm/drm_fixed.h`[1].
> 
> It seems fine. There are minor things to consider:
> 
> 1. It doesn't have a `FIXED_TO_INT_ROUND` equivalent.
> 2. We can use `fixed20_12` for rgb565 but We have to use s64 for YUV
> formats or add a `sfixed20_12` with s32.
> 
> In terms of consistency, do you think worth using this "library" given
> that we may need to use two distinct ways to represent the fixed point
> soonish? Or it's better to implement `sfixed20_12`? Or just continue 
> with the
> current macros?
> 
> [1] - https://elixir.bootlin.com/linux/latest/source/include/drm/drm_fixed.h

I think that is something the kernel people should weigh in on.

The one thing I would definitely avoid is ending up using multiple
fixed point formats in VKMS.

In the mean time, your current macros seem good enough, if there is no
community interest in better type safety nor sharing the fixed point
code.


Thanks,
pq
Igor Matheus Andrade Torrente May 10, 2022, 7:24 p.m. UTC | #6
On 5/9/22 04:53, Pekka Paalanen wrote:
> On Fri, 6 May 2022 20:05:39 -0300
> Igor Torrente <igormtorrente@gmail.com> wrote:
> 
>> Hi Pekka,
>>
>> On 4/27/22 04:55, Pekka Paalanen wrote:
>>> On Tue, 26 Apr 2022 21:53:19 -0300
>>> Igor Torrente <igormtorrente@gmail.com> wrote:
>>>    
>>>> Hi Pekka,
>>>>
>>>> On 4/21/22 07:58, Pekka Paalanen wrote:
>>>>> On Mon,  4 Apr 2022 17:45:15 -0300
>>>>> Igor Torrente <igormtorrente@gmail.com> wrote:
>>>>>       
>>>>>> Adds this common format to vkms.
>>>>>>
>>>>>> This commit also adds new helper macros to deal with fixed-point
>>>>>> arithmetic.
>>>>>>
>>>>>> It was done to improve the precision of the conversion to ARGB16161616
>>>>>> since the "conversion ratio" is not an integer.
>>>>>>
>>>>>> V3: Adapt the handlers to the new format introduced in patch 7 V3.
>>>>>> V5: Minor improvements
>>>>>>
>>>>>> Signed-off-by: Igor Torrente <igormtorrente@gmail.com>
>>>>>> ---
>>>>>>     drivers/gpu/drm/vkms/vkms_formats.c   | 70 +++++++++++++++++++++++++++
>>>>>>     drivers/gpu/drm/vkms/vkms_plane.c     |  6 ++-
>>>>>>     drivers/gpu/drm/vkms/vkms_writeback.c |  3 +-
>>>>>>     3 files changed, 76 insertions(+), 3 deletions(-)
>>>>>>
>>>>>> diff --git a/drivers/gpu/drm/vkms/vkms_formats.c b/drivers/gpu/drm/vkms/vkms_formats.c
>>>>>> index 8d913fa7dbde..4af8b295f31e 100644
>>>>>> --- a/drivers/gpu/drm/vkms/vkms_formats.c
>>>>>> +++ b/drivers/gpu/drm/vkms/vkms_formats.c
>>>>>> @@ -5,6 +5,23 @@
>>>>>>     
>>>>>>     #include "vkms_formats.h"
>>>>>>     
>>>>>> +/* The following macros help doing fixed point arithmetic. */
>>>>>> +/*
>>>>>> + * With Fixed-Point scale 15 we have 17 and 15 bits of integer and fractional
>>>>>> + * parts respectively.
>>>>>> + *  | 0000 0000 0000 0000 0.000 0000 0000 0000 |
>>>>>> + * 31                                          0
>>>>>> + */
>>>>>> +#define FIXED_SCALE 15
>>>>>
>>>>> I think this would usually be called a "shift" since it's used in
>>>>> bit-shifts.
>>>>
>>>> Ok, I will rename this.
>>>>   
>>>>>       
>>>>>> +
>>>>>> +#define INT_TO_FIXED(a) ((a) << FIXED_SCALE)
>>>>>> +#define FIXED_MUL(a, b) ((s32)(((s64)(a) * (b)) >> FIXED_SCALE))
>>>>>> +#define FIXED_DIV(a, b) ((s32)(((s64)(a) << FIXED_SCALE) / (b)))
>>>>>
>>>>> A truncating div, ok.
>>>>>       
>>>>>> +/* This macro converts a fixed point number to int, and round half up it */
>>>>>> +#define FIXED_TO_INT_ROUND(a) (((a) + (1 << (FIXED_SCALE - 1))) >> FIXED_SCALE)
>>>>>
>>>>> Yes.
>>>>>       
>>>>>> +/* Convert divisor and dividend to Fixed-Point and performs the division */
>>>>>> +#define INT_TO_FIXED_DIV(a, b) (FIXED_DIV(INT_TO_FIXED(a), INT_TO_FIXED(b)))
>>>>>
>>>>> Ok, this is obvious to read, even though it's the same as FIXED_DIV()
>>>>> alone. Not sure the compiler would optimize that extra bit-shift away...
>>>>>
>>>>> If one wanted to, it would be possible to write type-safe functions for
>>>>> these so that fixed and integer could not be mixed up.
>>>>
>>>> Ok, I will move to a function.
>>>
>>> That's not all.
>>>
>>> If you want it type-safe, then you need something like
>>>
>>> struct vkms_fixed_point {
>>> 	s32 value;
>>> };
>>>
>>> And use `struct vkms_fixed_point` (by value) everywhere where you pass
>>> a fixed point value, and never as a plain s32 type. Then it will be
>>> impossible to do incorrect arithmetic or conversions by accident on
>>> fixed point values.
>>>
>>> Is it worth it? I don't know, since it's limited into this one file.
>>>
>>> A simple 'typedef s32 vkms_fixed_point' does not work, because it does
>>> not prevent computing with vkms_fixed_point as if it was just a normal
>>> s32. Using a struct prevents that.
>>
>> ohhh. Got it!
>>
>>>
>>> I wonder if the kernel doesn't already have something like this
>>> available in general...
>>
>> After some time searching I found `include/drm/drm_fixed.h`[1].
>>
>> It seems fine. There are minor things to consider:
>>
>> 1. It doesn't have a `FIXED_TO_INT_ROUND` equivalent.
>> 2. We can use `fixed20_12` for rgb565 but We have to use s64 for YUV
>> formats or add a `sfixed20_12` with s32.
>>
>> In terms of consistency, do you think worth using this "library" given
>> that we may need to use two distinct ways to represent the fixed point
>> soonish? Or it's better to implement `sfixed20_12`? Or just continue
>> with the
>> current macros?
>>
>> [1] - https://elixir.bootlin.com/linux/latest/source/include/drm/drm_fixed.h
> 
> I think that is something the kernel people should weigh in on.
> 
> The one thing I would definitely avoid is ending up using multiple
> fixed point formats in VKMS.
> 
> In the mean time, your current macros seem good enough, if there is no
> community interest in better type safety nor sharing the fixed point
> code.

OK. Thanks!

> 
> 
> Thanks,
> pq
diff mbox series

Patch

diff --git a/drivers/gpu/drm/vkms/vkms_formats.c b/drivers/gpu/drm/vkms/vkms_formats.c
index 8d913fa7dbde..4af8b295f31e 100644
--- a/drivers/gpu/drm/vkms/vkms_formats.c
+++ b/drivers/gpu/drm/vkms/vkms_formats.c
@@ -5,6 +5,23 @@ 
 
 #include "vkms_formats.h"
 
+/* The following macros help doing fixed point arithmetic. */
+/*
+ * With Fixed-Point scale 15 we have 17 and 15 bits of integer and fractional
+ * parts respectively.
+ *  | 0000 0000 0000 0000 0.000 0000 0000 0000 |
+ * 31                                          0
+ */
+#define FIXED_SCALE 15
+
+#define INT_TO_FIXED(a) ((a) << FIXED_SCALE)
+#define FIXED_MUL(a, b) ((s32)(((s64)(a) * (b)) >> FIXED_SCALE))
+#define FIXED_DIV(a, b) ((s32)(((s64)(a) << FIXED_SCALE) / (b)))
+/* This macro converts a fixed point number to int, and round half up it */
+#define FIXED_TO_INT_ROUND(a) (((a) + (1 << (FIXED_SCALE - 1))) >> FIXED_SCALE)
+/* Convert divisor and dividend to Fixed-Point and performs the division */
+#define INT_TO_FIXED_DIV(a, b) (FIXED_DIV(INT_TO_FIXED(a), INT_TO_FIXED(b)))
+
 static int pixel_offset(const struct vkms_frame_info *frame_info, int x, int y)
 {
 	return frame_info->offset + (y * frame_info->pitch)
@@ -112,6 +129,30 @@  static void XRGB16161616_to_argb_u16(struct line_buffer *stage_buffer,
 	}
 }
 
+static void RGB565_to_argb_u16(struct line_buffer *stage_buffer,
+			       const struct vkms_frame_info *frame_info, int y)
+{
+	struct pixel_argb_u16 *out_pixels = stage_buffer->pixels;
+	u16 *src_pixels = get_packed_src_addr(frame_info, y);
+	int x, x_limit = min_t(size_t, drm_rect_width(&frame_info->dst),
+			       stage_buffer->n_pixels);
+
+	for (x = 0; x < x_limit; x++, src_pixels++) {
+		u16 rgb_565 = le16_to_cpu(*src_pixels);
+		int fp_r = INT_TO_FIXED((rgb_565 >> 11) & 0x1f);
+		int fp_g = INT_TO_FIXED((rgb_565 >> 5) & 0x3f);
+		int fp_b = INT_TO_FIXED(rgb_565 & 0x1f);
+
+		int fp_rb_ratio = INT_TO_FIXED_DIV(65535, 31);
+		int fp_g_ratio = INT_TO_FIXED_DIV(65535, 63);
+
+		out_pixels[x].a = (u16)0xffff;
+		out_pixels[x].r = FIXED_TO_INT_ROUND(FIXED_MUL(fp_r, fp_rb_ratio));
+		out_pixels[x].g = FIXED_TO_INT_ROUND(FIXED_MUL(fp_g, fp_g_ratio));
+		out_pixels[x].b = FIXED_TO_INT_ROUND(FIXED_MUL(fp_b, fp_rb_ratio));
+	}
+}
+
 
 /*
  * The following  functions take an line of argb_u16 pixels from the
@@ -199,6 +240,31 @@  static void argb_u16_to_XRGB16161616(struct vkms_frame_info *frame_info,
 	}
 }
 
+static void argb_u16_to_RGB565(struct vkms_frame_info *frame_info,
+			       const struct line_buffer *src_buffer, int y)
+{
+	int x, x_dst = frame_info->dst.x1;
+	u16 *dst_pixels = packed_pixels_addr(frame_info, x_dst, y);
+	struct pixel_argb_u16 *in_pixels = src_buffer->pixels;
+	int x_limit = min_t(size_t, drm_rect_width(&frame_info->dst),
+			    src_buffer->n_pixels);
+
+	for (x = 0; x < x_limit; x++, dst_pixels++) {
+		int fp_r = INT_TO_FIXED(in_pixels[x].r);
+		int fp_g = INT_TO_FIXED(in_pixels[x].g);
+		int fp_b = INT_TO_FIXED(in_pixels[x].b);
+
+		int fp_rb_ratio = INT_TO_FIXED_DIV(65535, 31);
+		int fp_g_ratio = INT_TO_FIXED_DIV(65535, 63);
+
+		u16 r = FIXED_TO_INT_ROUND(FIXED_DIV(fp_r, fp_rb_ratio));
+		u16 g = FIXED_TO_INT_ROUND(FIXED_DIV(fp_g, fp_g_ratio));
+		u16 b = FIXED_TO_INT_ROUND(FIXED_DIV(fp_b, fp_rb_ratio));
+
+		*dst_pixels = cpu_to_le16(r << 11 | g << 5 | b);
+	}
+}
+
 plane_format_transform_func get_plane_fmt_transform_function(u32 format)
 {
 	if (format == DRM_FORMAT_ARGB8888)
@@ -209,6 +275,8 @@  plane_format_transform_func get_plane_fmt_transform_function(u32 format)
 		return &ARGB16161616_to_argb_u16;
 	else if (format == DRM_FORMAT_XRGB16161616)
 		return &XRGB16161616_to_argb_u16;
+	else if (format == DRM_FORMAT_RGB565)
+		return &RGB565_to_argb_u16;
 	else
 		return NULL;
 }
@@ -223,6 +291,8 @@  wb_format_transform_func get_wb_fmt_transform_function(u32 format)
 		return &argb_u16_to_ARGB16161616;
 	else if (format == DRM_FORMAT_XRGB16161616)
 		return &argb_u16_to_XRGB16161616;
+	else if (format == DRM_FORMAT_RGB565)
+		return &argb_u16_to_RGB565;
 	else
 		return NULL;
 }
diff --git a/drivers/gpu/drm/vkms/vkms_plane.c b/drivers/gpu/drm/vkms/vkms_plane.c
index 60054a85204a..94a8e412886f 100644
--- a/drivers/gpu/drm/vkms/vkms_plane.c
+++ b/drivers/gpu/drm/vkms/vkms_plane.c
@@ -14,14 +14,16 @@ 
 
 static const u32 vkms_formats[] = {
 	DRM_FORMAT_XRGB8888,
-	DRM_FORMAT_XRGB16161616
+	DRM_FORMAT_XRGB16161616,
+	DRM_FORMAT_RGB565
 };
 
 static const u32 vkms_plane_formats[] = {
 	DRM_FORMAT_ARGB8888,
 	DRM_FORMAT_XRGB8888,
 	DRM_FORMAT_XRGB16161616,
-	DRM_FORMAT_ARGB16161616
+	DRM_FORMAT_ARGB16161616,
+	DRM_FORMAT_RGB565
 };
 
 static struct drm_plane_state *
diff --git a/drivers/gpu/drm/vkms/vkms_writeback.c b/drivers/gpu/drm/vkms/vkms_writeback.c
index cb63a5da9af1..98da7bee0f4b 100644
--- a/drivers/gpu/drm/vkms/vkms_writeback.c
+++ b/drivers/gpu/drm/vkms/vkms_writeback.c
@@ -16,7 +16,8 @@ 
 static const u32 vkms_wb_formats[] = {
 	DRM_FORMAT_XRGB8888,
 	DRM_FORMAT_XRGB16161616,
-	DRM_FORMAT_ARGB16161616
+	DRM_FORMAT_ARGB16161616,
+	DRM_FORMAT_RGB565
 };
 
 static const struct drm_connector_funcs vkms_wb_connector_funcs = {