mirror of
https://github.com/Fishwaldo/Star64_linux.git
synced 2025-06-30 10:49:28 +00:00
gpu: ipu-v3: image-convert: relax alignment restrictions
For the planar but U/V-packed formats NV12 and NV16, 8 pixel width alignment is good enough to fulfill the 8 byte stride requirement. If we allow the input 8-pixel DMA bursts to overshoot the end of the line, the only input alignment restrictions are dictated by the pixel format and 8-byte aligned line start address. Since different tile sizes are allowed, the output tile with / height alignment doesn't need to be multiplied by number of columns / rows. Signed-off-by: Philipp Zabel <p.zabel@pengutronix.de> [slongerbeam@gmail.com: Bring in the fixes to format width and height alignment restrictions from imx-media-mem2mem.c.] Signed-off-by: Steve Longerbeam <slongerbeam@gmail.com> Signed-off-by: Philipp Zabel <p.zabel@pengutronix.de>
This commit is contained in:
parent
a3f42419e2
commit
ff652fcf84
1 changed files with 41 additions and 40 deletions
|
@ -551,31 +551,46 @@ static inline u32 tile_top_align(const struct ipu_image_pixfmt *fmt)
|
||||||
return fmt->uv_height_dec > 1 ? 2 : 1;
|
return fmt->uv_height_dec > 1 ? 2 : 1;
|
||||||
}
|
}
|
||||||
|
|
||||||
/*
|
static inline u32 tile_width_align(enum ipu_image_convert_type type,
|
||||||
* We have to adjust the tile width such that the tile physaddrs and
|
const struct ipu_image_pixfmt *fmt,
|
||||||
* U and V plane offsets are multiples of 8 bytes as required by
|
enum ipu_rotate_mode rot_mode)
|
||||||
* the IPU DMA Controller. For the planar formats, this corresponds
|
|
||||||
* to a pixel alignment of 16 (but use a more formal equation since
|
|
||||||
* the variables are available). For all the packed formats, 8 is
|
|
||||||
* good enough.
|
|
||||||
*/
|
|
||||||
static inline u32 tile_width_align(const struct ipu_image_pixfmt *fmt)
|
|
||||||
{
|
{
|
||||||
return fmt->planar ? 8 * fmt->uv_width_dec : 8;
|
if (type == IMAGE_CONVERT_IN) {
|
||||||
|
/*
|
||||||
|
* The IC burst reads 8 pixels at a time. Reading beyond the
|
||||||
|
* end of the line is usually acceptable. Those pixels are
|
||||||
|
* ignored, unless the IC has to write the scaled line in
|
||||||
|
* reverse.
|
||||||
|
*/
|
||||||
|
return (!ipu_rot_mode_is_irt(rot_mode) &&
|
||||||
|
(rot_mode & IPU_ROT_BIT_HFLIP)) ? 8 : 2;
|
||||||
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Align to 16x16 pixel blocks for planar 4:2:0 chroma subsampled
|
||||||
|
* formats to guarantee 8-byte aligned line start addresses in the
|
||||||
|
* chroma planes when IRT is used. Align to 8x8 pixel IRT block size
|
||||||
|
* for all other formats.
|
||||||
|
*/
|
||||||
|
return (ipu_rot_mode_is_irt(rot_mode) &&
|
||||||
|
fmt->planar && !fmt->uv_packed) ?
|
||||||
|
8 * fmt->uv_width_dec : 8;
|
||||||
}
|
}
|
||||||
|
|
||||||
/*
|
|
||||||
* For tile height alignment, we have to ensure that the output tile
|
|
||||||
* heights are multiples of 8 lines if the IRT is required by the
|
|
||||||
* given rotation mode (the IRT performs rotations on 8x8 blocks
|
|
||||||
* at a time). If the IRT is not used, or for input image tiles,
|
|
||||||
* 2 lines are good enough.
|
|
||||||
*/
|
|
||||||
static inline u32 tile_height_align(enum ipu_image_convert_type type,
|
static inline u32 tile_height_align(enum ipu_image_convert_type type,
|
||||||
|
const struct ipu_image_pixfmt *fmt,
|
||||||
enum ipu_rotate_mode rot_mode)
|
enum ipu_rotate_mode rot_mode)
|
||||||
{
|
{
|
||||||
return (type == IMAGE_CONVERT_OUT &&
|
if (type == IMAGE_CONVERT_IN || !ipu_rot_mode_is_irt(rot_mode))
|
||||||
ipu_rot_mode_is_irt(rot_mode)) ? 8 : 2;
|
return 2;
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Align to 16x16 pixel blocks for planar 4:2:0 chroma subsampled
|
||||||
|
* formats to guarantee 8-byte aligned line start addresses in the
|
||||||
|
* chroma planes when IRT is used. Align to 8x8 pixel IRT block size
|
||||||
|
* for all other formats.
|
||||||
|
*/
|
||||||
|
return (fmt->planar && !fmt->uv_packed) ? 8 * fmt->uv_width_dec : 8;
|
||||||
}
|
}
|
||||||
|
|
||||||
/*
|
/*
|
||||||
|
@ -661,8 +676,9 @@ static void find_seams(struct ipu_image_convert_ctx *ctx,
|
||||||
unsigned int in_top_align = tile_top_align(in->fmt);
|
unsigned int in_top_align = tile_top_align(in->fmt);
|
||||||
unsigned int out_left_align = tile_left_align(out->fmt);
|
unsigned int out_left_align = tile_left_align(out->fmt);
|
||||||
unsigned int out_top_align = tile_top_align(out->fmt);
|
unsigned int out_top_align = tile_top_align(out->fmt);
|
||||||
unsigned int out_width_align = tile_width_align(out->fmt);
|
unsigned int out_width_align = tile_width_align(out->type, out->fmt,
|
||||||
unsigned int out_height_align = tile_height_align(out->type,
|
ctx->rot_mode);
|
||||||
|
unsigned int out_height_align = tile_height_align(out->type, out->fmt,
|
||||||
ctx->rot_mode);
|
ctx->rot_mode);
|
||||||
unsigned int in_right = in->base.rect.width;
|
unsigned int in_right = in->base.rect.width;
|
||||||
unsigned int in_bottom = in->base.rect.height;
|
unsigned int in_bottom = in->base.rect.height;
|
||||||
|
@ -1855,8 +1871,6 @@ void ipu_image_convert_adjust(struct ipu_image *in, struct ipu_image *out,
|
||||||
enum ipu_rotate_mode rot_mode)
|
enum ipu_rotate_mode rot_mode)
|
||||||
{
|
{
|
||||||
const struct ipu_image_pixfmt *infmt, *outfmt;
|
const struct ipu_image_pixfmt *infmt, *outfmt;
|
||||||
unsigned int num_in_rows, num_in_cols;
|
|
||||||
unsigned int num_out_rows, num_out_cols;
|
|
||||||
u32 w_align, h_align;
|
u32 w_align, h_align;
|
||||||
|
|
||||||
infmt = get_format(in->pix.pixelformat);
|
infmt = get_format(in->pix.pixelformat);
|
||||||
|
@ -1888,28 +1902,15 @@ void ipu_image_convert_adjust(struct ipu_image *in, struct ipu_image *out,
|
||||||
in->pix.height / 4);
|
in->pix.height / 4);
|
||||||
}
|
}
|
||||||
|
|
||||||
/* get tiling rows/cols from output format */
|
|
||||||
num_out_rows = num_stripes(out->pix.height);
|
|
||||||
num_out_cols = num_stripes(out->pix.width);
|
|
||||||
if (ipu_rot_mode_is_irt(rot_mode)) {
|
|
||||||
num_in_rows = num_out_cols;
|
|
||||||
num_in_cols = num_out_rows;
|
|
||||||
} else {
|
|
||||||
num_in_rows = num_out_rows;
|
|
||||||
num_in_cols = num_out_cols;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* align input width/height */
|
/* align input width/height */
|
||||||
w_align = ilog2(tile_width_align(infmt) * num_in_cols);
|
w_align = ilog2(tile_width_align(IMAGE_CONVERT_IN, infmt, rot_mode));
|
||||||
h_align = ilog2(tile_height_align(IMAGE_CONVERT_IN, rot_mode) *
|
h_align = ilog2(tile_height_align(IMAGE_CONVERT_IN, infmt, rot_mode));
|
||||||
num_in_rows);
|
|
||||||
in->pix.width = clamp_align(in->pix.width, MIN_W, MAX_W, w_align);
|
in->pix.width = clamp_align(in->pix.width, MIN_W, MAX_W, w_align);
|
||||||
in->pix.height = clamp_align(in->pix.height, MIN_H, MAX_H, h_align);
|
in->pix.height = clamp_align(in->pix.height, MIN_H, MAX_H, h_align);
|
||||||
|
|
||||||
/* align output width/height */
|
/* align output width/height */
|
||||||
w_align = ilog2(tile_width_align(outfmt) * num_out_cols);
|
w_align = ilog2(tile_width_align(IMAGE_CONVERT_OUT, outfmt, rot_mode));
|
||||||
h_align = ilog2(tile_height_align(IMAGE_CONVERT_OUT, rot_mode) *
|
h_align = ilog2(tile_height_align(IMAGE_CONVERT_OUT, outfmt, rot_mode));
|
||||||
num_out_rows);
|
|
||||||
out->pix.width = clamp_align(out->pix.width, MIN_W, MAX_W, w_align);
|
out->pix.width = clamp_align(out->pix.width, MIN_W, MAX_W, w_align);
|
||||||
out->pix.height = clamp_align(out->pix.height, MIN_H, MAX_H, h_align);
|
out->pix.height = clamp_align(out->pix.height, MIN_H, MAX_H, h_align);
|
||||||
|
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue